X86FrameLowering.cpp revision 17001ce25cc205ac1cd2604492c2bce310964220
13c2f0a11cce5a1e828e20675fa8467b624795e0aNick Lewycky//=======- X86FrameLowering.cpp - X86 Frame Information --------*- C++ -*-====// 233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov// 333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov// The LLVM Compiler Infrastructure 433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov// 533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov// This file is distributed under the University of Illinois Open Source 633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov// License. See LICENSE.TXT for details. 733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov// 833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov//===----------------------------------------------------------------------===// 933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov// 1016c29b5f285f375be53dabaa73e3e91107485fe4Anton Korobeynikov// This file contains the X86 implementation of TargetFrameLowering class. 1133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov// 1233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov//===----------------------------------------------------------------------===// 1333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 1416c29b5f285f375be53dabaa73e3e91107485fe4Anton Korobeynikov#include "X86FrameLowering.h" 1533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov#include "X86InstrBuilder.h" 1633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov#include "X86InstrInfo.h" 1733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov#include "X86MachineFunctionInfo.h" 1876927d758657b3a511c73467ec5a7288795c1513Rafael Espindola#include "X86Subtarget.h" 19d9e3385ced2dc887e2fe8e1c071bd2611e4d3edeAnton Korobeynikov#include "X86TargetMachine.h" 2033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov#include "llvm/Function.h" 2133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov#include "llvm/CodeGen/MachineFrameInfo.h" 
2233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov#include "llvm/CodeGen/MachineFunction.h" 2333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov#include "llvm/CodeGen/MachineInstrBuilder.h" 2433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov#include "llvm/CodeGen/MachineModuleInfo.h" 2533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov#include "llvm/CodeGen/MachineRegisterInfo.h" 26f0adba9a7ec8a3031876575a6ffb7db5f1b6f855Rafael Espindola#include "llvm/MC/MCAsmInfo.h" 276a6b8c3e96b9e1ca7092eafd0cfb219cbbfbdfc4Bill Wendling#include "llvm/MC/MCSymbol.h" 2833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov#include "llvm/Target/TargetData.h" 2933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov#include "llvm/Target/TargetOptions.h" 3033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov#include "llvm/Support/CommandLine.h" 317158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng#include "llvm/ADT/SmallSet.h" 3233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 3333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikovusing namespace llvm; 3433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 3533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov// FIXME: completely move here. 
3633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikovextern cl::opt<bool> ForceStackAlign; 3733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 3816c29b5f285f375be53dabaa73e3e91107485fe4Anton Korobeynikovbool X86FrameLowering::hasReservedCallFrame(const MachineFunction &MF) const { 39d0c38176690e9602a93a20a43f1bd084564a8116Anton Korobeynikov return !MF.getFrameInfo()->hasVarSizedObjects(); 40d0c38176690e9602a93a20a43f1bd084564a8116Anton Korobeynikov} 41d0c38176690e9602a93a20a43f1bd084564a8116Anton Korobeynikov 42d0c38176690e9602a93a20a43f1bd084564a8116Anton Korobeynikov/// hasFP - Return true if the specified function should have a dedicated frame 43d0c38176690e9602a93a20a43f1bd084564a8116Anton Korobeynikov/// pointer register. This is true if the function has variable sized allocas 44d0c38176690e9602a93a20a43f1bd084564a8116Anton Korobeynikov/// or if frame pointer elimination is disabled. 4516c29b5f285f375be53dabaa73e3e91107485fe4Anton Korobeynikovbool X86FrameLowering::hasFP(const MachineFunction &MF) const { 46d0c38176690e9602a93a20a43f1bd084564a8116Anton Korobeynikov const MachineFrameInfo *MFI = MF.getFrameInfo(); 47d0c38176690e9602a93a20a43f1bd084564a8116Anton Korobeynikov const MachineModuleInfo &MMI = MF.getMMI(); 48d9e3385ced2dc887e2fe8e1c071bd2611e4d3edeAnton Korobeynikov const TargetRegisterInfo *RI = TM.getRegisterInfo(); 49d0c38176690e9602a93a20a43f1bd084564a8116Anton Korobeynikov 50d0c38176690e9602a93a20a43f1bd084564a8116Anton Korobeynikov return (DisableFramePointerElim(MF) || 51d0c38176690e9602a93a20a43f1bd084564a8116Anton Korobeynikov RI->needsStackRealignment(MF) || 52d0c38176690e9602a93a20a43f1bd084564a8116Anton Korobeynikov MFI->hasVarSizedObjects() || 53d0c38176690e9602a93a20a43f1bd084564a8116Anton Korobeynikov MFI->isFrameAddressTaken() || 54d0c38176690e9602a93a20a43f1bd084564a8116Anton Korobeynikov MF.getInfo<X86MachineFunctionInfo>()->getForceFramePointer() || 55d0c38176690e9602a93a20a43f1bd084564a8116Anton Korobeynikov 
MMI.callsUnwindInit()); 56d0c38176690e9602a93a20a43f1bd084564a8116Anton Korobeynikov} 57d0c38176690e9602a93a20a43f1bd084564a8116Anton Korobeynikov 5833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikovstatic unsigned getSUBriOpcode(unsigned is64Bit, int64_t Imm) { 5933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (is64Bit) { 6033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (isInt<8>(Imm)) 6133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov return X86::SUB64ri8; 6233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov return X86::SUB64ri32; 6333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } else { 6433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (isInt<8>(Imm)) 6533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov return X86::SUB32ri8; 6633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov return X86::SUB32ri; 6733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 6833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov} 6933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 7033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikovstatic unsigned getADDriOpcode(unsigned is64Bit, int64_t Imm) { 7133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (is64Bit) { 7233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (isInt<8>(Imm)) 7333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov return X86::ADD64ri8; 7433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov return X86::ADD64ri32; 7533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } else { 7633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (isInt<8>(Imm)) 7733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov return X86::ADD32ri8; 7833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov return X86::ADD32ri; 7933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 8033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov} 
8133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 827158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng/// findDeadCallerSavedReg - Return a caller-saved register that isn't live 837158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng/// when it reaches the "return" instruction. We can then pop a stack object 847158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng/// to this register without worry about clobbering it. 857158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Chengstatic unsigned findDeadCallerSavedReg(MachineBasicBlock &MBB, 867158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng MachineBasicBlock::iterator &MBBI, 877158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng const TargetRegisterInfo &TRI, 887158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng bool Is64Bit) { 897158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng const MachineFunction *MF = MBB.getParent(); 907158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng const Function *F = MF->getFunction(); 917158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng if (!F || MF->getMMI().callsEHReturn()) 927158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng return 0; 937158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng 947158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng static const unsigned CallerSavedRegs32Bit[] = { 9532a183c84ad0cbe492119c37f1a7941ace61dd79Andrew Trick X86::EAX, X86::EDX, X86::ECX, 0 967158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng }; 977158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng 987158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng static const unsigned CallerSavedRegs64Bit[] = { 997158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng X86::RAX, X86::RDX, X86::RCX, X86::RSI, X86::RDI, 10032a183c84ad0cbe492119c37f1a7941ace61dd79Andrew Trick X86::R8, X86::R9, X86::R10, X86::R11, 0 1017158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng }; 1027158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng 1037158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng unsigned Opc = MBBI->getOpcode(); 
1047158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng switch (Opc) { 1057158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng default: return 0; 1067158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng case X86::RET: 1077158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng case X86::RETI: 1087158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng case X86::TCRETURNdi: 1097158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng case X86::TCRETURNri: 1107158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng case X86::TCRETURNmi: 1117158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng case X86::TCRETURNdi64: 1127158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng case X86::TCRETURNri64: 1137158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng case X86::TCRETURNmi64: 1147158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng case X86::EH_RETURN: 1157158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng case X86::EH_RETURN64: { 1167158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng SmallSet<unsigned, 8> Uses; 1177158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng for (unsigned i = 0, e = MBBI->getNumOperands(); i != e; ++i) { 1187158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng MachineOperand &MO = MBBI->getOperand(i); 1197158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng if (!MO.isReg() || MO.isDef()) 1207158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng continue; 1217158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng unsigned Reg = MO.getReg(); 1227158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng if (!Reg) 1237158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng continue; 1247158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng for (const unsigned *AsI = TRI.getOverlaps(Reg); *AsI; ++AsI) 1257158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng Uses.insert(*AsI); 1267158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng } 1277158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng 1287158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng const unsigned *CS = Is64Bit ? 
CallerSavedRegs64Bit : CallerSavedRegs32Bit; 1297158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng for (; *CS; ++CS) 1307158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng if (!Uses.count(*CS)) 1317158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng return *CS; 1327158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng } 1337158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng } 1347158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng 1357158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng return 0; 1367158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng} 1377158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng 1387158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng 13933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov/// emitSPUpdate - Emit a series of instructions to increment / decrement the 14033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov/// stack pointer by a constant value. 14133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikovstatic 14233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikovvoid emitSPUpdate(MachineBasicBlock &MBB, MachineBasicBlock::iterator &MBBI, 1437158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng unsigned StackPtr, int64_t NumBytes, 1447158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng bool Is64Bit, const TargetInstrInfo &TII, 1457158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng const TargetRegisterInfo &TRI) { 14633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov bool isSub = NumBytes < 0; 14733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov uint64_t Offset = isSub ? -NumBytes : NumBytes; 14833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov unsigned Opc = isSub ? 
14933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov getSUBriOpcode(Is64Bit, Offset) : 15033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov getADDriOpcode(Is64Bit, Offset); 15133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov uint64_t Chunk = (1LL << 31) - 1; 15233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov DebugLoc DL = MBB.findDebugLoc(MBBI); 15333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 15433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov while (Offset) { 15533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov uint64_t ThisVal = (Offset > Chunk) ? Chunk : Offset; 1567158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng if (ThisVal == (Is64Bit ? 8 : 4)) { 1577158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng // Use push / pop instead. 1587158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng unsigned Reg = isSub 1591e08cd1eaef8acbcfaf7db48d859a29583c29897Dale Johannesen ? (unsigned)(Is64Bit ? X86::RAX : X86::EAX) 1607158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng : findDeadCallerSavedReg(MBB, MBBI, TRI, Is64Bit); 1617158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng if (Reg) { 1627158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng Opc = isSub 1637158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng ? (Is64Bit ? X86::PUSH64r : X86::PUSH32r) 1647158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng : (Is64Bit ? 
X86::POP64r : X86::POP32r); 165aff232a5941c9ffb7ad52e08f81ad53794fed56bCharles Davis MachineInstr *MI = BuildMI(MBB, MBBI, DL, TII.get(Opc)) 1667158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng .addReg(Reg, getDefRegState(!isSub) | getUndefRegState(isSub)); 167aff232a5941c9ffb7ad52e08f81ad53794fed56bCharles Davis if (isSub) 168aff232a5941c9ffb7ad52e08f81ad53794fed56bCharles Davis MI->setFlag(MachineInstr::FrameSetup); 1697158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng Offset -= ThisVal; 1707158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng continue; 1717158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng } 1727158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng } 1737158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng 17433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineInstr *MI = 17533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov BuildMI(MBB, MBBI, DL, TII.get(Opc), StackPtr) 1767158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng .addReg(StackPtr) 1777158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng .addImm(ThisVal); 178aff232a5941c9ffb7ad52e08f81ad53794fed56bCharles Davis if (isSub) 179aff232a5941c9ffb7ad52e08f81ad53794fed56bCharles Davis MI->setFlag(MachineInstr::FrameSetup); 18033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MI->getOperand(3).setIsDead(); // The EFLAGS implicit def is dead. 18133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov Offset -= ThisVal; 18233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 18333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov} 18433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 18533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov/// mergeSPUpdatesUp - Merge two stack-manipulating instructions upper iterator. 
18633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikovstatic 18733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikovvoid mergeSPUpdatesUp(MachineBasicBlock &MBB, MachineBasicBlock::iterator &MBBI, 18833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov unsigned StackPtr, uint64_t *NumBytes = NULL) { 18933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (MBBI == MBB.begin()) return; 19033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 19133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineBasicBlock::iterator PI = prior(MBBI); 19233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov unsigned Opc = PI->getOpcode(); 19333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if ((Opc == X86::ADD64ri32 || Opc == X86::ADD64ri8 || 19433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov Opc == X86::ADD32ri || Opc == X86::ADD32ri8) && 19533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov PI->getOperand(0).getReg() == StackPtr) { 19633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (NumBytes) 19733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov *NumBytes += PI->getOperand(2).getImm(); 19833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MBB.erase(PI); 19933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } else if ((Opc == X86::SUB64ri32 || Opc == X86::SUB64ri8 || 20033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov Opc == X86::SUB32ri || Opc == X86::SUB32ri8) && 20133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov PI->getOperand(0).getReg() == StackPtr) { 20233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (NumBytes) 20333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov *NumBytes -= PI->getOperand(2).getImm(); 20433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MBB.erase(PI); 20533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 20633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov} 
20733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 20833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov/// mergeSPUpdatesDown - Merge two stack-manipulating instructions lower iterator. 20933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikovstatic 21033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikovvoid mergeSPUpdatesDown(MachineBasicBlock &MBB, 21133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineBasicBlock::iterator &MBBI, 21233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov unsigned StackPtr, uint64_t *NumBytes = NULL) { 21333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // FIXME: THIS ISN'T RUN!!! 21433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov return; 21533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 21633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (MBBI == MBB.end()) return; 21733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 21833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineBasicBlock::iterator NI = llvm::next(MBBI); 21933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (NI == MBB.end()) return; 22033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 22133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov unsigned Opc = NI->getOpcode(); 22233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if ((Opc == X86::ADD64ri32 || Opc == X86::ADD64ri8 || 22333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov Opc == X86::ADD32ri || Opc == X86::ADD32ri8) && 22433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov NI->getOperand(0).getReg() == StackPtr) { 22533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (NumBytes) 22633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov *NumBytes -= NI->getOperand(2).getImm(); 22733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MBB.erase(NI); 22833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MBBI = NI; 
22933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } else if ((Opc == X86::SUB64ri32 || Opc == X86::SUB64ri8 || 23033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov Opc == X86::SUB32ri || Opc == X86::SUB32ri8) && 23133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov NI->getOperand(0).getReg() == StackPtr) { 23233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (NumBytes) 23333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov *NumBytes += NI->getOperand(2).getImm(); 23433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MBB.erase(NI); 23533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MBBI = NI; 23633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 23733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov} 23833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 23933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov/// mergeSPUpdates - Checks the instruction before/after the passed 24033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov/// instruction. If it is an ADD/SUB instruction it is deleted argument and the 24133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov/// stack adjustment is returned as a positive value for ADD and a negative for 24233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov/// SUB. 
24333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikovstatic int mergeSPUpdates(MachineBasicBlock &MBB, 24433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineBasicBlock::iterator &MBBI, 24533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov unsigned StackPtr, 24633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov bool doMergeWithPrevious) { 24733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if ((doMergeWithPrevious && MBBI == MBB.begin()) || 24833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov (!doMergeWithPrevious && MBBI == MBB.end())) 24933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov return 0; 25033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 25133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineBasicBlock::iterator PI = doMergeWithPrevious ? prior(MBBI) : MBBI; 25233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineBasicBlock::iterator NI = doMergeWithPrevious ? 0 : llvm::next(MBBI); 25333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov unsigned Opc = PI->getOpcode(); 25433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov int Offset = 0; 25533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 25633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if ((Opc == X86::ADD64ri32 || Opc == X86::ADD64ri8 || 25733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov Opc == X86::ADD32ri || Opc == X86::ADD32ri8) && 25833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov PI->getOperand(0).getReg() == StackPtr){ 25933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov Offset += PI->getOperand(2).getImm(); 26033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MBB.erase(PI); 26133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (!doMergeWithPrevious) MBBI = NI; 26233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } else if ((Opc == X86::SUB64ri32 || Opc == X86::SUB64ri8 || 
26333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov Opc == X86::SUB32ri || Opc == X86::SUB32ri8) && 26433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov PI->getOperand(0).getReg() == StackPtr) { 26533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov Offset -= PI->getOperand(2).getImm(); 26633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MBB.erase(PI); 26733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (!doMergeWithPrevious) MBBI = NI; 26833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 26933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 27033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov return Offset; 27133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov} 27233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 27333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikovstatic bool isEAXLiveIn(MachineFunction &MF) { 27433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov for (MachineRegisterInfo::livein_iterator II = MF.getRegInfo().livein_begin(), 27533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov EE = MF.getRegInfo().livein_end(); II != EE; ++II) { 27633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov unsigned Reg = II->first; 27733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 27833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (Reg == X86::EAX || Reg == X86::AX || 27933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov Reg == X86::AH || Reg == X86::AL) 28033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov return true; 28133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 28233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 28333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov return false; 28433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov} 28533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 28616c29b5f285f375be53dabaa73e3e91107485fe4Anton Korobeynikovvoid 
X86FrameLowering::emitCalleeSavedFrameMoves(MachineFunction &MF, 28709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling MCSymbol *Label, 28809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling unsigned FramePtr) const { 28933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineFrameInfo *MFI = MF.getFrameInfo(); 29033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineModuleInfo &MMI = MF.getMMI(); 29133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 29233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Add callee saved registers to move list. 29333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov const std::vector<CalleeSavedInfo> &CSI = MFI->getCalleeSavedInfo(); 29433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (CSI.empty()) return; 29533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 29633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov std::vector<MachineMove> &Moves = MMI.getFrameMoves(); 297d9e3385ced2dc887e2fe8e1c071bd2611e4d3edeAnton Korobeynikov const TargetData *TD = TM.getTargetData(); 298d0c38176690e9602a93a20a43f1bd084564a8116Anton Korobeynikov bool HasFP = hasFP(MF); 29933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 30033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Calculate amount of bytes used for return address storing. 301e749911372c75e4e68f83a32b4092f4ffb0d2793Anton Korobeynikov int stackGrowth = -TD->getPointerSize(); 30233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 30333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // FIXME: This is dirty hack. The code itself is pretty mess right now. 30433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // It should be rewritten from scratch and generalized sometimes. 30533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 3067a2bdde0a0eebcd2125055e0eacaca040f0b766cChris Lattner // Determine maximum offset (minimum due to stack growth). 
30733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov int64_t MaxOffset = 0; 30833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov for (std::vector<CalleeSavedInfo>::const_iterator 30933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov I = CSI.begin(), E = CSI.end(); I != E; ++I) 31033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MaxOffset = std::min(MaxOffset, 31133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MFI->getObjectOffset(I->getFrameIdx())); 31233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 31333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Calculate offsets. 31433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov int64_t saveAreaOffset = (HasFP ? 3 : 2) * stackGrowth; 31533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov for (std::vector<CalleeSavedInfo>::const_iterator 31633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov I = CSI.begin(), E = CSI.end(); I != E; ++I) { 31733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov int64_t Offset = MFI->getObjectOffset(I->getFrameIdx()); 31833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov unsigned Reg = I->getReg(); 31933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov Offset = MaxOffset - Offset + saveAreaOffset; 32033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 32133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Don't output a new machine move if we're re-saving the frame 32233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // pointer. This happens when the PrologEpilogInserter has inserted an extra 32333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // "PUSH" of the frame pointer -- the "emitPrologue" method automatically 32433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // generates one when frame pointers are used. 
If we generate a "machine 32533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // move" for this extra "PUSH", the linker will lose track of the fact that 32633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // the frame pointer should have the value of the first "PUSH" when it's 32733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // trying to unwind. 3282763538609fd455d63c192b320c73fb5d48c3e47NAKAMURA Takumi // 32933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // FIXME: This looks inelegant. It's possibly correct, but it's covering up 33033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // another bug. I.e., one where we generate a prolog like this: 33133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // 33233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // pushl %ebp 33333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // movl %esp, %ebp 33433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // pushl %ebp 33533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // pushl %esi 33633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // ... 33733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // 33833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // The immediate re-push of EBP is unnecessary. At the least, it's an 33933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // optimization bug. EBP can be used as a scratch register in certain 34033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // cases, but probably not when we have a frame pointer. 
34133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (HasFP && FramePtr == Reg) 34233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov continue; 34333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 34433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineLocation CSDst(MachineLocation::VirtualFP, Offset); 34533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineLocation CSSrc(Reg); 34633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov Moves.push_back(MachineMove(Label, CSDst, CSSrc)); 34733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 34833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov} 34933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 35009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling/// getCompactUnwindRegNum - Get the compact unwind number for a given 35109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling/// register. The number corresponds to the enum lists in 35209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling/// compact_unwind_encoding.h. 35309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendlingstatic int getCompactUnwindRegNum(const unsigned *CURegs, unsigned Reg) { 35409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling int Idx = 1; 35509b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling for (; *CURegs; ++CURegs, ++Idx) 35609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling if (*CURegs == Reg) 35709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling return Idx; 35809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 35909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling return -1; 36009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling} 36109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 36209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling/// encodeCompactUnwindRegistersWithoutFrame - Create the permutation encoding 36309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling/// used with frameless stacks. 
It is passed the number of registers to be saved 36409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling/// and an array of the registers saved. 36509b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendlingstatic uint32_t encodeCompactUnwindRegistersWithoutFrame(unsigned SavedRegs[6], 36609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling unsigned RegCount, 36709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling bool Is64Bit) { 36809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // The saved registers are numbered from 1 to 6. In order to encode the order 36909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // in which they were saved, we re-number them according to their place in the 37009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // register order. The re-numbering is relative to the last re-numbered 37109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // register. E.g., if we have registers {6, 2, 4, 5} saved in that order: 37209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // 37309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // Orig Re-Num 37409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // ---- ------ 37509b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // 6 6 37609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // 2 2 37709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // 4 3 37809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // 5 3 37909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // 38009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling static const unsigned CU32BitRegs[] = { 38109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling X86::EBX, X86::ECX, X86::EDX, X86::EDI, X86::ESI, X86::EBP, 0 38209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling }; 38309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling static const unsigned CU64BitRegs[] = { 38409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling X86::RBX, X86::R12, X86::R13, X86::R14, X86::R15, X86::RBP, 0 
38509b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling }; 38609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling const unsigned *CURegs = (Is64Bit ? CU64BitRegs : CU32BitRegs); 38709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 38809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling uint32_t RenumRegs[6]; 38909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling for (unsigned i = 6 - RegCount; i < 6; ++i) { 39009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling int CUReg = getCompactUnwindRegNum(CURegs, SavedRegs[i]); 39109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling if (CUReg == -1) return ~0U; 39209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling SavedRegs[i] = CUReg; 39309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 39409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling unsigned Countless = 0; 39509b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling for (unsigned j = 6 - RegCount; j < i; ++j) 39609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling if (SavedRegs[j] < SavedRegs[i]) 39709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling ++Countless; 39809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 39909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling RenumRegs[i] = SavedRegs[i] - Countless - 1; 40009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling } 40109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 40209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // Take the renumbered values and encode them into a 10-bit number. 
40309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling uint32_t permutationEncoding = 0; 40409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling switch (RegCount) { 40509b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling case 6: 40609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling permutationEncoding |= 120 * RenumRegs[0] + 24 * RenumRegs[1] 40709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling + 6 * RenumRegs[2] + 2 * RenumRegs[3] 40809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling + RenumRegs[4]; 40909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling break; 41009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling case 5: 41109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling permutationEncoding |= 120 * RenumRegs[1] + 24 * RenumRegs[2] 41209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling + 6 * RenumRegs[3] + 2 * RenumRegs[4] 41309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling + RenumRegs[5]; 41409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling break; 41509b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling case 4: 41609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling permutationEncoding |= 60 * RenumRegs[2] + 12 * RenumRegs[3] 41709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling + 3 * RenumRegs[4] + RenumRegs[5]; 41809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling break; 41909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling case 3: 42009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling permutationEncoding |= 20 * RenumRegs[3] + 4 * RenumRegs[4] 42109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling + RenumRegs[5]; 42209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling break; 42309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling case 2: 42409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling permutationEncoding |= 5 * RenumRegs[4] + RenumRegs[5]; 42509b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling break; 42609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling case 1: 
42709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling permutationEncoding |= RenumRegs[5]; 42809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling break; 42909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling } 43009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 43109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling assert((permutationEncoding & 0x3FF) == permutationEncoding && 43209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling "Invalid compact register encoding!"); 43309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling return permutationEncoding; 43409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling} 43509b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 43609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling/// encodeCompactUnwindRegistersWithFrame - Return the registers encoded for a 43709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling/// compact encoding with a frame pointer. 43809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendlingstatic uint32_t encodeCompactUnwindRegistersWithFrame(unsigned SavedRegs[6], 43909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling bool Is64Bit) { 44009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling static const unsigned CU32BitRegs[] = { 44109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling X86::EBX, X86::ECX, X86::EDX, X86::EDI, X86::ESI, X86::EBP, 0 44209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling }; 44309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling static const unsigned CU64BitRegs[] = { 44409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling X86::RBX, X86::R12, X86::R13, X86::R14, X86::R15, X86::RBP, 0 44509b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling }; 44609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling const unsigned *CURegs = (Is64Bit ? CU64BitRegs : CU32BitRegs); 44709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 44809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // Encode the registers in the order they were saved, 3-bits per register. 
The 44909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // registers are numbered from 1 to 6. 45009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling uint32_t RegEnc = 0; 45109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling for (int I = 5; I >= 0; --I) { 45209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling unsigned Reg = SavedRegs[I]; 45309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling if (Reg == 0) break; 45409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling int CURegNum = getCompactUnwindRegNum(CURegs, Reg); 45509b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling if (CURegNum == -1) 45609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling return ~0U; 45709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling RegEnc |= (CURegNum & 0x7) << (5 - I); 45809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling } 45909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 46009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling assert((RegEnc & 0x7FFF) == RegEnc && "Invalid compact register encoding!"); 46109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling return RegEnc; 46209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling} 46309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 46409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendlinguint32_t X86FrameLowering::getCompactUnwindEncoding(MachineFunction &MF) const { 46509b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling const X86RegisterInfo *RegInfo = TM.getRegisterInfo(); 46609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling unsigned FramePtr = RegInfo->getFrameRegister(MF); 46709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling unsigned StackPtr = RegInfo->getStackRegister(); 46809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 46909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling X86MachineFunctionInfo *X86FI = MF.getInfo<X86MachineFunctionInfo>(); 47009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling int TailCallReturnAddrDelta = X86FI->getTCReturnAddrDelta(); 
47109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 47209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling bool Is64Bit = STI.is64Bit(); 47309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling bool HasFP = hasFP(MF); 47409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 47509b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling unsigned SavedRegs[6] = { 0, 0, 0, 0, 0, 0 }; 47609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling int SavedRegIdx = 6; 47709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 47809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling unsigned OffsetSize = (Is64Bit ? 8 : 4); 47909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 48009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling unsigned PushInstr = (Is64Bit ? X86::PUSH64r : X86::PUSH32r); 48109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling unsigned PushInstrSize = 1; 48209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling unsigned MoveInstr = (Is64Bit ? X86::MOV64rr : X86::MOV32rr); 48309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling unsigned MoveInstrSize = (Is64Bit ? 3 : 2); 48409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling unsigned SubtractInstr = getSUBriOpcode(Is64Bit, -TailCallReturnAddrDelta); 48509b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling unsigned SubtractInstrIdx = (Is64Bit ? 3 : 2); 48609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 487de77055a68a3fc495e01b682f00059af3e38822eBill Wendling unsigned StackDivide = (Is64Bit ? 8 : 4); 488de77055a68a3fc495e01b682f00059af3e38822eBill Wendling 48909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling unsigned InstrOffset = 0; 49009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling unsigned CFAOffset = 0; 49109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling unsigned StackAdjust = 0; 49209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 49309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling MachineBasicBlock &MBB = MF.front(); // Prologue is in entry BB. 
49409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling bool ExpectEnd = false; 49509b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling for (MachineBasicBlock::iterator 49609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling MBBI = MBB.begin(), MBBE = MBB.end(); MBBI != MBBE; ++MBBI) { 49709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling MachineInstr &MI = *MBBI; 49809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling unsigned Opc = MI.getOpcode(); 49909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling if (Opc == X86::PROLOG_LABEL) continue; 50009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling if (!MI.getFlag(MachineInstr::FrameSetup)) break; 50109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 50209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // We don't exect any more prolog instructions. 50309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling if (ExpectEnd) return 0; 50409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 50509b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling if (Opc == PushInstr) { 50609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // If there are too many saved registers, we cannot use compact encoding. 
50709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling if (--SavedRegIdx < 0) return 0; 50809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 50909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling SavedRegs[SavedRegIdx] = MI.getOperand(0).getReg(); 51009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling CFAOffset += OffsetSize; 51109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling InstrOffset += PushInstrSize; 51209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling } else if (Opc == MoveInstr) { 51309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling unsigned SrcReg = MI.getOperand(1).getReg(); 51409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling unsigned DstReg = MI.getOperand(0).getReg(); 51509b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 51609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling if (DstReg != FramePtr || SrcReg != StackPtr) 51709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling return 0; 51809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 51909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling CFAOffset = 0; 52009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling memset(SavedRegs, 0, sizeof(SavedRegs)); 52109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling InstrOffset += MoveInstrSize; 52209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling } else if (Opc == SubtractInstr) { 52309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling if (StackAdjust) 52409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // We all ready have a stack pointer adjustment. 
52509b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling return 0; 52609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 52709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling if (!MI.getOperand(0).isReg() || 52809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling MI.getOperand(0).getReg() != MI.getOperand(1).getReg() || 52909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling MI.getOperand(0).getReg() != StackPtr || !MI.getOperand(2).isImm()) 53009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // We need this to be a stack adjustment pointer. Something like: 53109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // 53209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // %RSP<def> = SUB64ri8 %RSP, 48 53309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling return 0; 53409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 535de77055a68a3fc495e01b682f00059af3e38822eBill Wendling StackAdjust = MI.getOperand(2).getImm() / StackDivide; 53609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling SubtractInstrIdx += InstrOffset; 53709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling ExpectEnd = true; 53809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling } 53909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling } 54009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 54109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // Encode that we are using EBP/RBP as the frame pointer. 54209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling uint32_t CompactUnwindEncoding = 0; 543de77055a68a3fc495e01b682f00059af3e38822eBill Wendling CFAOffset /= StackDivide; 54409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling if (HasFP) { 54509b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling if ((CFAOffset & 0xFF) != CFAOffset) 54609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // Offset was too big for compact encoding. 
54709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling return 0; 54809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 54909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // Get the encoding of the saved registers when we have a frame pointer. 55009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling uint32_t RegEnc = encodeCompactUnwindRegistersWithFrame(SavedRegs, Is64Bit); 55109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling if (RegEnc == ~0U) 55209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling return 0; 55309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 55409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling CompactUnwindEncoding |= 0x01000000; 55509b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling CompactUnwindEncoding |= (CFAOffset & 0xFF) << 16; 55609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling CompactUnwindEncoding |= RegEnc & 0x7FFF; 55709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling } else { 55809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling unsigned FullOffset = CFAOffset + StackAdjust; 55909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling if ((FullOffset & 0xFF) == FullOffset) { 56009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // Frameless stack. 56109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling CompactUnwindEncoding |= 0x02000000; 56209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling CompactUnwindEncoding |= (FullOffset & 0xFF) << 16; 56309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling } else { 56409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling if ((CFAOffset & 0x7) != CFAOffset) 56509b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // The extra stack adjustments are too big for us to handle. 56609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling return 0; 56709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 56809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // Frameless stack with an offset too large for us to encode compactly. 
56909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling CompactUnwindEncoding |= 0x03000000; 57009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 57109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // Encode the offset to the nnnnnn value in the 'subl $nnnnnn, ESP' 57209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // instruction. 57309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling CompactUnwindEncoding |= (SubtractInstrIdx & 0xFF) << 16; 57409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 57509b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // Encode any extra stack stack changes (done via push instructions). 57609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling CompactUnwindEncoding |= (CFAOffset & 0x7) << 13; 57709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling } 57809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 57909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // Get the encoding of the saved registers when we don't have a frame 58009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // pointer. 
58109b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling uint32_t RegEnc = encodeCompactUnwindRegistersWithoutFrame(SavedRegs, 58209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 6 - SavedRegIdx, 58309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling Is64Bit); 58409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling if (RegEnc == ~0U) return 0; 58509b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling CompactUnwindEncoding |= RegEnc & 0x3FF; 58609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling } 58709b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 58809b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling return CompactUnwindEncoding; 58909b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling} 59009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 59133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov/// emitPrologue - Push callee-saved registers onto the stack, which 59233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov/// automatically adjust the stack pointer. Adjust the stack pointer to allocate 59333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov/// space for local variables. Also emit labels used by the exception handler to 59433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov/// generate the exception handling frames. 59516c29b5f285f375be53dabaa73e3e91107485fe4Anton Korobeynikovvoid X86FrameLowering::emitPrologue(MachineFunction &MF) const { 59633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineBasicBlock &MBB = MF.front(); // Prologue goes in entry BB. 
59733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineBasicBlock::iterator MBBI = MBB.begin(); 59833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineFrameInfo *MFI = MF.getFrameInfo(); 59933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov const Function *Fn = MF.getFunction(); 600d9e3385ced2dc887e2fe8e1c071bd2611e4d3edeAnton Korobeynikov const X86RegisterInfo *RegInfo = TM.getRegisterInfo(); 601d9e3385ced2dc887e2fe8e1c071bd2611e4d3edeAnton Korobeynikov const X86InstrInfo &TII = *TM.getInstrInfo(); 60233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineModuleInfo &MMI = MF.getMMI(); 60333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov X86MachineFunctionInfo *X86FI = MF.getInfo<X86MachineFunctionInfo>(); 60433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov bool needsFrameMoves = MMI.hasDebugInfo() || 605fc2bb8c4448fa884d79e437cc2d2627a7d7740a8Rafael Espindola Fn->needsUnwindTableEntry(); 60633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov uint64_t MaxAlign = MFI->getMaxAlignment(); // Desired stack alignment. 60733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov uint64_t StackSize = MFI->getStackSize(); // Number of bytes to allocate. 
608d0c38176690e9602a93a20a43f1bd084564a8116Anton Korobeynikov bool HasFP = hasFP(MF); 60933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov bool Is64Bit = STI.is64Bit(); 61033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov bool IsWin64 = STI.isTargetWin64(); 61133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov unsigned StackAlign = getStackAlignment(); 61233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov unsigned SlotSize = RegInfo->getSlotSize(); 61333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov unsigned FramePtr = RegInfo->getFrameRegister(MF); 61433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov unsigned StackPtr = RegInfo->getStackRegister(); 61533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov DebugLoc DL; 61633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 61733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // If we're forcing a stack realignment we can't rely on just the frame 61833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // info, we need to know the ABI stack alignment as well in case we 61933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // have a call out. Otherwise just make sure we have some alignment - we'll 62033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // go with the minimum SlotSize. 62133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (ForceStackAlign) { 62233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (MFI->hasCalls()) 62333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MaxAlign = (StackAlign > MaxAlign) ? 
StackAlign : MaxAlign; 62433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov else if (MaxAlign < SlotSize) 62533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MaxAlign = SlotSize; 62633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 62733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 62833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Add RETADDR move area to callee saved frame size. 62933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov int TailCallReturnAddrDelta = X86FI->getTCReturnAddrDelta(); 63033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (TailCallReturnAddrDelta < 0) 63133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov X86FI->setCalleeSavedFrameSize( 63233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov X86FI->getCalleeSavedFrameSize() - TailCallReturnAddrDelta); 63333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 63433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // If this is x86-64 and the Red Zone is not disabled, if we are a leaf 63533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // function, and use up to 128 bytes of stack space, don't have a frame 63633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // pointer, calls, or dynamic alloca then we do not need to adjust the 63733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // stack pointer (we fit in the Red Zone). 63833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (Is64Bit && !Fn->hasFnAttr(Attribute::NoRedZone) && 63933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov !RegInfo->needsStackRealignment(MF) && 64033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov !MFI->hasVarSizedObjects() && // No dynamic alloca. 64133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov !MFI->adjustsStack() && // No calls. 
64276927d758657b3a511c73467ec5a7288795c1513Rafael Espindola !IsWin64 && // Win64 has no Red Zone 64376927d758657b3a511c73467ec5a7288795c1513Rafael Espindola !EnableSegmentedStacks) { // Regular stack 64433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov uint64_t MinSize = X86FI->getCalleeSavedFrameSize(); 64533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (HasFP) MinSize += SlotSize; 64633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov StackSize = std::max(MinSize, StackSize > 128 ? StackSize - 128 : 0); 64733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MFI->setStackSize(StackSize); 64833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 64933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 65033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Insert stack pointer adjustment for later moving of return addr. Only 65133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // applies to tail call optimized functions where the callee argument stack 65233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // size is bigger than the callers. 65333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (TailCallReturnAddrDelta < 0) { 65433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineInstr *MI = 65533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov BuildMI(MBB, MBBI, DL, 65633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov TII.get(getSUBriOpcode(Is64Bit, -TailCallReturnAddrDelta)), 65733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov StackPtr) 65833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov .addReg(StackPtr) 659aff232a5941c9ffb7ad52e08f81ad53794fed56bCharles Davis .addImm(-TailCallReturnAddrDelta) 660aff232a5941c9ffb7ad52e08f81ad53794fed56bCharles Davis .setMIFlag(MachineInstr::FrameSetup); 66133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MI->getOperand(3).setIsDead(); // The EFLAGS implicit def is dead. 
66233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 66333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 66433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Mapping for machine moves: 66533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // 66633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // DST: VirtualFP AND 66733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // SRC: VirtualFP => DW_CFA_def_cfa_offset 66833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // ELSE => DW_CFA_def_cfa 66933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // 67033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // SRC: VirtualFP AND 67133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // DST: Register => DW_CFA_def_cfa_register 67233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // 67333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // ELSE 67433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // OFFSET < 0 => DW_CFA_offset_extended_sf 67533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // REG < 64 => DW_CFA_offset + Reg 67633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // ELSE => DW_CFA_offset_extended 67733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 67833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov std::vector<MachineMove> &Moves = MMI.getFrameMoves(); 67933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov const TargetData *TD = MF.getTarget().getTargetData(); 68033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov uint64_t NumBytes = 0; 68133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov int stackGrowth = -TD->getPointerSize(); 68233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 68333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (HasFP) { 68433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Calculate required stack adjustment. 
68533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov uint64_t FrameSize = StackSize - SlotSize; 68633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (RegInfo->needsStackRealignment(MF)) 68733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov FrameSize = (FrameSize + MaxAlign - 1) / MaxAlign * MaxAlign; 68833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 68933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov NumBytes = FrameSize - X86FI->getCalleeSavedFrameSize(); 69033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 69133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Get the offset of the stack slot for the EBP register, which is 69233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // guaranteed to be the last slot by processFunctionBeforeFrameFinalized. 69333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Update the frame offset adjustment. 69433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MFI->setOffsetAdjustment(-NumBytes); 69533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 69633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Save EBP/RBP into the appropriate stack slot. 69733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov BuildMI(MBB, MBBI, DL, TII.get(Is64Bit ? X86::PUSH64r : X86::PUSH32r)) 698aff232a5941c9ffb7ad52e08f81ad53794fed56bCharles Davis .addReg(FramePtr, RegState::Kill) 699aff232a5941c9ffb7ad52e08f81ad53794fed56bCharles Davis .setMIFlag(MachineInstr::FrameSetup); 70033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 70133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (needsFrameMoves) { 70233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Mark the place where EBP/RBP was saved. 
70333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MCSymbol *FrameLabel = MMI.getContext().CreateTempSymbol(); 704fb4eb165d66b8ca5ae09c37d98d3ed937454b6afBill Wendling BuildMI(MBB, MBBI, DL, TII.get(X86::PROLOG_LABEL)) 705fb4eb165d66b8ca5ae09c37d98d3ed937454b6afBill Wendling .addSym(FrameLabel); 70633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 70733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Define the current CFA rule to use the provided offset. 70833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (StackSize) { 70933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineLocation SPDst(MachineLocation::VirtualFP); 71033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineLocation SPSrc(MachineLocation::VirtualFP, 2 * stackGrowth); 71133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov Moves.push_back(MachineMove(FrameLabel, SPDst, SPSrc)); 71233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } else { 71333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineLocation SPDst(StackPtr); 71433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineLocation SPSrc(StackPtr, stackGrowth); 71533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov Moves.push_back(MachineMove(FrameLabel, SPDst, SPSrc)); 71633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 71733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 71833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Change the rule for the FramePtr to be an "offset" rule. 
71933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineLocation FPDst(MachineLocation::VirtualFP, 2 * stackGrowth); 72033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineLocation FPSrc(FramePtr); 72133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov Moves.push_back(MachineMove(FrameLabel, FPDst, FPSrc)); 72233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 72333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 72409b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // Update EBP with the new base value. 72533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov BuildMI(MBB, MBBI, DL, 72633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov TII.get(Is64Bit ? X86::MOV64rr : X86::MOV32rr), FramePtr) 727aff232a5941c9ffb7ad52e08f81ad53794fed56bCharles Davis .addReg(StackPtr) 728aff232a5941c9ffb7ad52e08f81ad53794fed56bCharles Davis .setMIFlag(MachineInstr::FrameSetup); 72933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 73033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (needsFrameMoves) { 73133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Mark effective beginning of when frame pointer becomes valid. 73233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MCSymbol *FrameLabel = MMI.getContext().CreateTempSymbol(); 733fb4eb165d66b8ca5ae09c37d98d3ed937454b6afBill Wendling BuildMI(MBB, MBBI, DL, TII.get(X86::PROLOG_LABEL)) 734fb4eb165d66b8ca5ae09c37d98d3ed937454b6afBill Wendling .addSym(FrameLabel); 73533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 73633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Define the current CFA to use the EBP/RBP register. 
73733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineLocation FPDst(FramePtr); 73833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineLocation FPSrc(MachineLocation::VirtualFP); 73933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov Moves.push_back(MachineMove(FrameLabel, FPDst, FPSrc)); 74033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 74133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 74233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Mark the FramePtr as live-in in every block except the entry. 74333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov for (MachineFunction::iterator I = llvm::next(MF.begin()), E = MF.end(); 74433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov I != E; ++I) 74533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov I->addLiveIn(FramePtr); 74633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 74733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Realign stack 74833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (RegInfo->needsStackRealignment(MF)) { 74933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineInstr *MI = 75033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov BuildMI(MBB, MBBI, DL, 751fb4eb165d66b8ca5ae09c37d98d3ed937454b6afBill Wendling TII.get(Is64Bit ? X86::AND64ri32 : X86::AND32ri), StackPtr) 752fb4eb165d66b8ca5ae09c37d98d3ed937454b6afBill Wendling .addReg(StackPtr) 753fb4eb165d66b8ca5ae09c37d98d3ed937454b6afBill Wendling .addImm(-MaxAlign) 754fb4eb165d66b8ca5ae09c37d98d3ed937454b6afBill Wendling .setMIFlag(MachineInstr::FrameSetup); 75533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 75633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // The EFLAGS implicit def is dead. 
75733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MI->getOperand(3).setIsDead(); 75833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 75933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } else { 76033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov NumBytes = StackSize - X86FI->getCalleeSavedFrameSize(); 76133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 76233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 76333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Skip the callee-saved push instructions. 76433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov bool PushedRegs = false; 76533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov int StackOffset = 2 * stackGrowth; 76633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 76733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov while (MBBI != MBB.end() && 76833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov (MBBI->getOpcode() == X86::PUSH32r || 76933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MBBI->getOpcode() == X86::PUSH64r)) { 77033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov PushedRegs = true; 771fb4eb165d66b8ca5ae09c37d98d3ed937454b6afBill Wendling MBBI->setFlag(MachineInstr::FrameSetup); 77233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov ++MBBI; 77333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 77433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (!HasFP && needsFrameMoves) { 77533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Mark callee-saved push instruction. 
77633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MCSymbol *Label = MMI.getContext().CreateTempSymbol(); 77733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov BuildMI(MBB, MBBI, DL, TII.get(X86::PROLOG_LABEL)).addSym(Label); 77833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 77933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Define the current CFA rule to use the provided offset. 78009b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling unsigned Ptr = StackSize ? MachineLocation::VirtualFP : StackPtr; 78133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineLocation SPDst(Ptr); 78233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineLocation SPSrc(Ptr, StackOffset); 78333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov Moves.push_back(MachineMove(Label, SPDst, SPSrc)); 78433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov StackOffset += stackGrowth; 78533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 78633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 78733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 78833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov DL = MBB.findDebugLoc(MBBI); 78933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 79033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // If there is a SUB32ri of ESP immediately before this instruction, merge 79133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // the two. This can be the case when tail call elimination is enabled and 79233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // the callee has more arguments than the caller. 
79333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov NumBytes -= mergeSPUpdates(MBB, MBBI, StackPtr, true); 79433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 79533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // If there is an ADD32ri or SUB32ri of ESP immediately after this 79633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // instruction, merge the two instructions. 79733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov mergeSPUpdatesDown(MBB, MBBI, StackPtr, &NumBytes); 79833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 79933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Adjust stack pointer: ESP -= numbytes. 80033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 80133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Windows and cygwin/mingw require a prologue helper routine when allocating 80233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // more than 4K bytes on the stack. Windows uses __chkstk and cygwin/mingw 80333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // uses __alloca. __alloca and the 32-bit version of __chkstk will probe the 80433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // stack and adjust the stack pointer in one go. The 64-bit version of 80533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // __chkstk is only responsible for probing the stack. The 64-bit prologue is 80633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // responsible for adjusting the stack pointer. Touching the stack at 4K 80733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // increments is necessary to ensure that the guard pages used by the OS 80833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // virtual memory manager are allocated in correct sequence. 
809a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi if (NumBytes >= 4096 && STI.isTargetCOFF() && !STI.isTargetEnvMacho()) { 810a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi const char *StackProbeSymbol; 811a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi bool isSPUpdateNeeded = false; 812a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi 813a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi if (Is64Bit) { 814a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi if (STI.isTargetCygMing()) 815a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi StackProbeSymbol = "___chkstk"; 816a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi else { 817a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi StackProbeSymbol = "__chkstk"; 818a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi isSPUpdateNeeded = true; 819a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi } 820a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi } else if (STI.isTargetCygMing()) 821a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi StackProbeSymbol = "_alloca"; 822a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi else 823a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi StackProbeSymbol = "_chkstk"; 824a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi 82533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Check whether EAX is livein for this function. 82633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov bool isEAXAlive = isEAXLiveIn(MF); 82733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 828a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi if (isEAXAlive) { 829a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi // Sanity check that EAX is not livein for this function. 830a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi // It should not be, so throw an assert. 
831a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi assert(!Is64Bit && "EAX is livein in x64 case!"); 832a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi 83333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Save EAX 83433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov BuildMI(MBB, MBBI, DL, TII.get(X86::PUSH32r)) 835fb4eb165d66b8ca5ae09c37d98d3ed937454b6afBill Wendling .addReg(X86::EAX, RegState::Kill) 836fb4eb165d66b8ca5ae09c37d98d3ed937454b6afBill Wendling .setMIFlag(MachineInstr::FrameSetup); 837a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi } 83833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 839a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi if (Is64Bit) { 840a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi // Handle the 64-bit Windows ABI case where we need to call __chkstk. 841a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi // Function prologue is responsible for adjusting the stack pointer. 842a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi BuildMI(MBB, MBBI, DL, TII.get(X86::MOV64ri), X86::RAX) 843fb4eb165d66b8ca5ae09c37d98d3ed937454b6afBill Wendling .addImm(NumBytes) 844fb4eb165d66b8ca5ae09c37d98d3ed937454b6afBill Wendling .setMIFlag(MachineInstr::FrameSetup); 845a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi } else { 846a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi // Allocate NumBytes-4 bytes on stack in case of isEAXAlive. 847a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi // We'll also use 4 already allocated bytes for EAX. 84833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov BuildMI(MBB, MBBI, DL, TII.get(X86::MOV32ri), X86::EAX) 849fb4eb165d66b8ca5ae09c37d98d3ed937454b6afBill Wendling .addImm(isEAXAlive ? 
NumBytes - 4 : NumBytes) 850fb4eb165d66b8ca5ae09c37d98d3ed937454b6afBill Wendling .setMIFlag(MachineInstr::FrameSetup); 851a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi } 852a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi 853a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi BuildMI(MBB, MBBI, DL, 854a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi TII.get(Is64Bit ? X86::W64ALLOCA : X86::CALLpcrel32)) 855a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi .addExternalSymbol(StackProbeSymbol) 856a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi .addReg(StackPtr, RegState::Define | RegState::Implicit) 857fb4eb165d66b8ca5ae09c37d98d3ed937454b6afBill Wendling .addReg(X86::EFLAGS, RegState::Define | RegState::Implicit) 858fb4eb165d66b8ca5ae09c37d98d3ed937454b6afBill Wendling .setMIFlag(MachineInstr::FrameSetup); 859a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi 860a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi // MSVC x64's __chkstk only probes the stack, so the prologue must adjust %rsp itself. 861a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi // FIXME: %rax preserves the offset and should be available. 
862a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi if (isSPUpdateNeeded) 863a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi emitSPUpdate(MBB, MBBI, StackPtr, -(int64_t)NumBytes, Is64Bit, 864a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi TII, *RegInfo); 865a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi 866a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi if (isEAXAlive) { 867a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi // Restore EAX 868a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi MachineInstr *MI = addRegOffset(BuildMI(MF, DL, TII.get(X86::MOV32rm), 869a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi X86::EAX), 870a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi StackPtr, false, NumBytes - 4); 871fb4eb165d66b8ca5ae09c37d98d3ed937454b6afBill Wendling MI->setFlag(MachineInstr::FrameSetup); 872a2e0762fae050464494a50c8b5d53ac2f4ba738cNAKAMURA Takumi MBB.insert(MBBI, MI); 87333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 87433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } else if (NumBytes) 8757158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng emitSPUpdate(MBB, MBBI, StackPtr, -(int64_t)NumBytes, Is64Bit, 8767158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng TII, *RegInfo); 87733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 878f0adba9a7ec8a3031876575a6ffb7db5f1b6f855Rafael Espindola if (( (!HasFP && NumBytes) || PushedRegs) && needsFrameMoves) { 87933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Mark end of stack pointer adjustment. 
88033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MCSymbol *Label = MMI.getContext().CreateTempSymbol(); 881fb4eb165d66b8ca5ae09c37d98d3ed937454b6afBill Wendling BuildMI(MBB, MBBI, DL, TII.get(X86::PROLOG_LABEL)) 882fb4eb165d66b8ca5ae09c37d98d3ed937454b6afBill Wendling .addSym(Label); 88333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 88433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (!HasFP && NumBytes) { 88533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Define the current CFA rule to use the provided offset. 88633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (StackSize) { 88733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineLocation SPDst(MachineLocation::VirtualFP); 88833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineLocation SPSrc(MachineLocation::VirtualFP, 88933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov -StackSize + stackGrowth); 89033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov Moves.push_back(MachineMove(Label, SPDst, SPSrc)); 89133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } else { 89233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineLocation SPDst(StackPtr); 89333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineLocation SPSrc(StackPtr, stackGrowth); 89433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov Moves.push_back(MachineMove(Label, SPDst, SPSrc)); 89533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 89633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 89733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 89833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Emit DWARF info specifying the offsets of the callee-saved registers. 89933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (PushedRegs) 90033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov emitCalleeSavedFrameMoves(MF, Label, HasFP ? 
FramePtr : StackPtr); 90133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 90209b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling 90309b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling // Darwin 10.7 and greater has support for compact unwind encoding. 904c8725d11f8756c57bdbceccc61062a9d560261c5Bill Wendling if (STI.getTargetTriple().isMacOSX() && 905ac86d43eae8bbfe5284d8e5fa17c141d1a7b1194Eli Friedman !STI.getTargetTriple().isMacOSXVersionLT(10, 7)) 90609b02c8dddf822e84c30cc08e7759d6ceebb2334Bill Wendling MMI.setCompactUnwindEncoding(getCompactUnwindEncoding(MF)); 90733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov} 90833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 90916c29b5f285f375be53dabaa73e3e91107485fe4Anton Korobeynikovvoid X86FrameLowering::emitEpilogue(MachineFunction &MF, 9103c2f0a11cce5a1e828e20675fa8467b624795e0aNick Lewycky MachineBasicBlock &MBB) const { 91133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov const MachineFrameInfo *MFI = MF.getFrameInfo(); 91233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov X86MachineFunctionInfo *X86FI = MF.getInfo<X86MachineFunctionInfo>(); 913d9e3385ced2dc887e2fe8e1c071bd2611e4d3edeAnton Korobeynikov const X86RegisterInfo *RegInfo = TM.getRegisterInfo(); 914d9e3385ced2dc887e2fe8e1c071bd2611e4d3edeAnton Korobeynikov const X86InstrInfo &TII = *TM.getInstrInfo(); 9154f28c1c71450c711e96aa283de53739d8b4504cdJakob Stoklund Olesen MachineBasicBlock::iterator MBBI = MBB.getLastNonDebugInstr(); 9164f28c1c71450c711e96aa283de53739d8b4504cdJakob Stoklund Olesen assert(MBBI != MBB.end() && "Returning block has no instructions"); 91733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov unsigned RetOpcode = MBBI->getOpcode(); 91833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov DebugLoc DL = MBBI->getDebugLoc(); 91933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov bool Is64Bit = STI.is64Bit(); 92033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 
unsigned StackAlign = getStackAlignment(); 92133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov unsigned SlotSize = RegInfo->getSlotSize(); 92233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov unsigned FramePtr = RegInfo->getFrameRegister(MF); 92333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov unsigned StackPtr = RegInfo->getStackRegister(); 92433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 92533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov switch (RetOpcode) { 92633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov default: 92733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov llvm_unreachable("Can only insert epilog into returning blocks"); 92833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov case X86::RET: 92933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov case X86::RETI: 93033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov case X86::TCRETURNdi: 93133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov case X86::TCRETURNri: 93233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov case X86::TCRETURNmi: 93333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov case X86::TCRETURNdi64: 93433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov case X86::TCRETURNri64: 93533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov case X86::TCRETURNmi64: 93633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov case X86::EH_RETURN: 93733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov case X86::EH_RETURN64: 93833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov break; // These are ok 93933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 94033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 94133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Get the number of bytes to allocate from the FrameInfo. 
94233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov uint64_t StackSize = MFI->getStackSize(); 94333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov uint64_t MaxAlign = MFI->getMaxAlignment(); 94433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov unsigned CSSize = X86FI->getCalleeSavedFrameSize(); 94533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov uint64_t NumBytes = 0; 94633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 94733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // If we're forcing a stack realignment we can't rely on just the frame 94833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // info, we need to know the ABI stack alignment as well in case we 94933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // have a call out. Otherwise just make sure we have some alignment - we'll 95033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // go with the minimum. 95133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (ForceStackAlign) { 95233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (MFI->hasCalls()) 95333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MaxAlign = (StackAlign > MaxAlign) ? StackAlign : MaxAlign; 95433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov else 95533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MaxAlign = MaxAlign ? MaxAlign : 4; 95633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 95733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 958d0c38176690e9602a93a20a43f1bd084564a8116Anton Korobeynikov if (hasFP(MF)) { 95933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Calculate required stack adjustment. 
96033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov uint64_t FrameSize = StackSize - SlotSize; 96133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (RegInfo->needsStackRealignment(MF)) 96233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov FrameSize = (FrameSize + MaxAlign - 1)/MaxAlign*MaxAlign; 96333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 96433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov NumBytes = FrameSize - CSSize; 96533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 96633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Pop EBP. 96733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov BuildMI(MBB, MBBI, DL, 96833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov TII.get(Is64Bit ? X86::POP64r : X86::POP32r), FramePtr); 96933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } else { 97033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov NumBytes = StackSize - CSSize; 97133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 97233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 97333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Skip the callee-saved pop instructions. 
97433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineBasicBlock::iterator LastCSPop = MBBI; 97533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov while (MBBI != MBB.begin()) { 97633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineBasicBlock::iterator PI = prior(MBBI); 97733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov unsigned Opc = PI->getOpcode(); 97833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 9794f28c1c71450c711e96aa283de53739d8b4504cdJakob Stoklund Olesen if (Opc != X86::POP32r && Opc != X86::POP64r && Opc != X86::DBG_VALUE && 98033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov !PI->getDesc().isTerminator()) 98133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov break; 98233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 98333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov --MBBI; 98433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 98533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 98633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov DL = MBBI->getDebugLoc(); 98733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 98833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // If there is an ADD32ri or SUB32ri of ESP immediately before this 98933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // instruction, merge the two instructions. 99033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (NumBytes || MFI->hasVarSizedObjects()) 99133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov mergeSPUpdatesUp(MBB, MBBI, StackPtr, &NumBytes); 99233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 99333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // If dynamic alloca is used, then reset esp to point to the last callee-saved 99433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // slot before popping them off! 
Same applies for the case, when stack was 99533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // realigned. 99633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (RegInfo->needsStackRealignment(MF)) { 99733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // We cannot use LEA here, because stack pointer was realigned. We need to 99833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // deallocate local frame back. 99933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (CSSize) { 10007158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng emitSPUpdate(MBB, MBBI, StackPtr, NumBytes, Is64Bit, TII, *RegInfo); 100133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MBBI = prior(LastCSPop); 100233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 100333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 100433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov BuildMI(MBB, MBBI, DL, 100533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov TII.get(Is64Bit ? X86::MOV64rr : X86::MOV32rr), 100633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov StackPtr).addReg(FramePtr); 100733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } else if (MFI->hasVarSizedObjects()) { 100833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (CSSize) { 100933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov unsigned Opc = Is64Bit ? 
X86::LEA64r : X86::LEA32r; 101033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineInstr *MI = 101133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov addRegOffset(BuildMI(MF, DL, TII.get(Opc), StackPtr), 101233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov FramePtr, false, -CSSize); 101333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MBB.insert(MBBI, MI); 101433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } else { 101533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov BuildMI(MBB, MBBI, DL, 101633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov TII.get(Is64Bit ? X86::MOV64rr : X86::MOV32rr), StackPtr) 101733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov .addReg(FramePtr); 101833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 101933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } else if (NumBytes) { 102033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Adjust stack pointer back: ESP += numbytes. 10217158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng emitSPUpdate(MBB, MBBI, StackPtr, NumBytes, Is64Bit, TII, *RegInfo); 102233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 102333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 102433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // We're returning from function via eh_return. 
102533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (RetOpcode == X86::EH_RETURN || RetOpcode == X86::EH_RETURN64) { 10264f28c1c71450c711e96aa283de53739d8b4504cdJakob Stoklund Olesen MBBI = MBB.getLastNonDebugInstr(); 102733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineOperand &DestAddr = MBBI->getOperand(0); 102833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov assert(DestAddr.isReg() && "Offset should be in register!"); 102933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov BuildMI(MBB, MBBI, DL, 103033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov TII.get(Is64Bit ? X86::MOV64rr : X86::MOV32rr), 103133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov StackPtr).addReg(DestAddr.getReg()); 103233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } else if (RetOpcode == X86::TCRETURNri || RetOpcode == X86::TCRETURNdi || 103333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov RetOpcode == X86::TCRETURNmi || 103433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov RetOpcode == X86::TCRETURNri64 || RetOpcode == X86::TCRETURNdi64 || 103533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov RetOpcode == X86::TCRETURNmi64) { 103633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov bool isMem = RetOpcode == X86::TCRETURNmi || RetOpcode == X86::TCRETURNmi64; 103733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Tail call return: adjust the stack pointer and jump to callee. 1038f7ca976e74eafeeab0e9097f0fb07d6bb447415bJakob Stoklund Olesen MBBI = MBB.getLastNonDebugInstr(); 103933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineOperand &JumpTarget = MBBI->getOperand(0); 104033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineOperand &StackAdjust = MBBI->getOperand(isMem ? 
5 : 1); 104133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov assert(StackAdjust.isImm() && "Expecting immediate value."); 104233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 104333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Adjust stack pointer. 104433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov int StackAdj = StackAdjust.getImm(); 104533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov int MaxTCDelta = X86FI->getTCReturnAddrDelta(); 104633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov int Offset = 0; 104733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov assert(MaxTCDelta <= 0 && "MaxTCDelta should never be positive"); 104833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 104933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Incorporate the retaddr area. 105033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov Offset = StackAdj-MaxTCDelta; 105133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov assert(Offset >= 0 && "Offset should never be negative"); 105233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 105333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (Offset) { 10547a2bdde0a0eebcd2125055e0eacaca040f0b766cChris Lattner // Check for possible merge with preceding ADD instruction. 105533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov Offset += mergeSPUpdates(MBB, MBBI, StackPtr, true); 10567158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng emitSPUpdate(MBB, MBBI, StackPtr, Offset, Is64Bit, TII, *RegInfo); 105733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 105833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 105933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Jump to label or value in register. 
106033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov if (RetOpcode == X86::TCRETURNdi || RetOpcode == X86::TCRETURNdi64) { 10613d2125c9dbac695c93f42c0f59fd040e413fd711Evan Cheng MachineInstrBuilder MIB = 10623d2125c9dbac695c93f42c0f59fd040e413fd711Evan Cheng BuildMI(MBB, MBBI, DL, TII.get((RetOpcode == X86::TCRETURNdi) 10633d2125c9dbac695c93f42c0f59fd040e413fd711Evan Cheng ? X86::TAILJMPd : X86::TAILJMPd64)); 10643d2125c9dbac695c93f42c0f59fd040e413fd711Evan Cheng if (JumpTarget.isGlobal()) 10653d2125c9dbac695c93f42c0f59fd040e413fd711Evan Cheng MIB.addGlobalAddress(JumpTarget.getGlobal(), JumpTarget.getOffset(), 10663d2125c9dbac695c93f42c0f59fd040e413fd711Evan Cheng JumpTarget.getTargetFlags()); 10673d2125c9dbac695c93f42c0f59fd040e413fd711Evan Cheng else { 10683d2125c9dbac695c93f42c0f59fd040e413fd711Evan Cheng assert(JumpTarget.isSymbol()); 10693d2125c9dbac695c93f42c0f59fd040e413fd711Evan Cheng MIB.addExternalSymbol(JumpTarget.getSymbolName(), 10703d2125c9dbac695c93f42c0f59fd040e413fd711Evan Cheng JumpTarget.getTargetFlags()); 10713d2125c9dbac695c93f42c0f59fd040e413fd711Evan Cheng } 107233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } else if (RetOpcode == X86::TCRETURNmi || RetOpcode == X86::TCRETURNmi64) { 107333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineInstrBuilder MIB = 107433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov BuildMI(MBB, MBBI, DL, TII.get((RetOpcode == X86::TCRETURNmi) 107533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov ? X86::TAILJMPm : X86::TAILJMPm64)); 107633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov for (unsigned i = 0; i != 5; ++i) 107733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MIB.addOperand(MBBI->getOperand(i)); 107833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } else if (RetOpcode == X86::TCRETURNri64) { 107933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov BuildMI(MBB, MBBI, DL, TII.get(X86::TAILJMPr64)). 
108033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov addReg(JumpTarget.getReg(), RegState::Kill); 108133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } else { 108233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov BuildMI(MBB, MBBI, DL, TII.get(X86::TAILJMPr)). 108333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov addReg(JumpTarget.getReg(), RegState::Kill); 108433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 108533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 108633464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MachineInstr *NewMI = prior(MBBI); 108733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov for (unsigned i = 2, e = MBBI->getNumOperands(); i != e; ++i) 108833464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov NewMI->addOperand(MBBI->getOperand(i)); 108933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 109033464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Delete the pseudo instruction TCRETURN. 109133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov MBB.erase(MBBI); 109233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } else if ((RetOpcode == X86::RET || RetOpcode == X86::RETI) && 109333464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov (X86FI->getTCReturnAddrDelta() < 0)) { 109433464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov // Add the return addr area delta back since we are not tail calling. 109533464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov int delta = -1*X86FI->getTCReturnAddrDelta(); 10964f28c1c71450c711e96aa283de53739d8b4504cdJakob Stoklund Olesen MBBI = MBB.getLastNonDebugInstr(); 109733464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov 10987a2bdde0a0eebcd2125055e0eacaca040f0b766cChris Lattner // Check for possible merge with preceding ADD instruction. 
109933464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov delta += mergeSPUpdates(MBB, MBBI, StackPtr, true); 11007158e08b8e619f4dcac9834c57f5f8afd6eea2ebEvan Cheng emitSPUpdate(MBB, MBBI, StackPtr, delta, Is64Bit, TII, *RegInfo); 110133464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov } 110233464912237efaa0ed7060829e66b59055bdd48bAnton Korobeynikov} 1103d9e3385ced2dc887e2fe8e1c071bd2611e4d3edeAnton Korobeynikov 110416c29b5f285f375be53dabaa73e3e91107485fe4Anton Korobeynikovint X86FrameLowering::getFrameIndexOffset(const MachineFunction &MF, int FI) const { 110582f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov const X86RegisterInfo *RI = 110682f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov static_cast<const X86RegisterInfo*>(MF.getTarget().getRegisterInfo()); 110782f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov const MachineFrameInfo *MFI = MF.getFrameInfo(); 110882f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov int Offset = MFI->getObjectOffset(FI) - getOffsetOfLocalArea(); 110982f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov uint64_t StackSize = MFI->getStackSize(); 111082f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov 111182f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov if (RI->needsStackRealignment(MF)) { 111282f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov if (FI < 0) { 111382f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov // Skip the saved EBP. 
111482f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov Offset += RI->getSlotSize(); 111582f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov } else { 111617001ce25cc205ac1cd2604492c2bce310964220Duncan Sands assert((-(Offset + StackSize)) % MFI->getObjectAlignment(FI) == 0); 111782f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov return Offset + StackSize; 111882f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov } 111982f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov // FIXME: Support tail calls 112082f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov } else { 112182f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov if (!hasFP(MF)) 112282f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov return Offset + StackSize; 112382f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov 112482f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov // Skip the saved EBP. 112582f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov Offset += RI->getSlotSize(); 112682f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov 112782f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov // Skip the RETADDR move area 112882f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov const X86MachineFunctionInfo *X86FI = MF.getInfo<X86MachineFunctionInfo>(); 112982f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov int TailCallReturnAddrDelta = X86FI->getTCReturnAddrDelta(); 113082f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov if (TailCallReturnAddrDelta < 0) 113182f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov Offset -= TailCallReturnAddrDelta; 113282f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov } 113382f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov 113482f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov return Offset; 113582f58740c76b42af8370247b23677a0318f6dde8Anton Korobeynikov} 1136cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov 
113716c29b5f285f375be53dabaa73e3e91107485fe4Anton Korobeynikovbool X86FrameLowering::spillCalleeSavedRegisters(MachineBasicBlock &MBB, 1138cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov MachineBasicBlock::iterator MI, 1139cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov const std::vector<CalleeSavedInfo> &CSI, 1140cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov const TargetRegisterInfo *TRI) const { 1141cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov if (CSI.empty()) 1142cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov return false; 1143cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov 1144cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov DebugLoc DL = MBB.findDebugLoc(MI); 1145cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov 1146cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov MachineFunction &MF = *MBB.getParent(); 1147cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov 1148cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov unsigned SlotSize = STI.is64Bit() ? 8 : 4; 1149cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov unsigned FPReg = TRI->getFrameRegister(MF); 1150cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov unsigned CalleeFrameSize = 0; 1151cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov 1152cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov const TargetInstrInfo &TII = *MF.getTarget().getInstrInfo(); 1153cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov X86MachineFunctionInfo *X86FI = MF.getInfo<X86MachineFunctionInfo>(); 1154cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov 1155419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi // Push GPRs. It increases frame size. 1156cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov unsigned Opc = STI.is64Bit() ? 
X86::PUSH64r : X86::PUSH32r; 1157cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov for (unsigned i = CSI.size(); i != 0; --i) { 1158cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov unsigned Reg = CSI[i-1].getReg(); 1159419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi if (!X86::GR64RegClass.contains(Reg) && 1160419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi !X86::GR32RegClass.contains(Reg)) 1161419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi continue; 1162cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov // Add the callee-saved register as live-in. It's killed at the spill. 1163cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov MBB.addLiveIn(Reg); 1164cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov if (Reg == FPReg) 1165cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov // X86RegisterInfo::emitPrologue will handle spilling of frame register. 1166cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov continue; 1167419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi CalleeFrameSize += SlotSize; 1168aff232a5941c9ffb7ad52e08f81ad53794fed56bCharles Davis BuildMI(MBB, MI, DL, TII.get(Opc)).addReg(Reg, RegState::Kill) 1169aff232a5941c9ffb7ad52e08f81ad53794fed56bCharles Davis .setMIFlag(MachineInstr::FrameSetup); 1170cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov } 1171cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov 1172cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov X86FI->setCalleeSavedFrameSize(CalleeFrameSize); 1173419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi 1174419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi // Make XMM regs spilled. X86 does not have ability of push/pop XMM. 1175419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi // It can be done by spilling XMMs to stack frame. 1176419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi // Note that only Win64 ABI might spill XMMs. 
1177419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi for (unsigned i = CSI.size(); i != 0; --i) { 1178419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi unsigned Reg = CSI[i-1].getReg(); 1179419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi if (X86::GR64RegClass.contains(Reg) || 1180419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi X86::GR32RegClass.contains(Reg)) 1181419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi continue; 1182419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi // Add the callee-saved register as live-in. It's killed at the spill. 1183419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi MBB.addLiveIn(Reg); 1184419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi const TargetRegisterClass *RC = TRI->getMinimalPhysRegClass(Reg); 1185419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi TII.storeRegToStackSlot(MBB, MI, Reg, true, CSI[i-1].getFrameIdx(), 1186419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi RC, TRI); 1187419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi } 1188419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi 1189cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov return true; 1190cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov} 1191cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov 119216c29b5f285f375be53dabaa73e3e91107485fe4Anton Korobeynikovbool X86FrameLowering::restoreCalleeSavedRegisters(MachineBasicBlock &MBB, 1193cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov MachineBasicBlock::iterator MI, 1194cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov const std::vector<CalleeSavedInfo> &CSI, 1195cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov const TargetRegisterInfo *TRI) const { 1196cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov if (CSI.empty()) 1197cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov return false; 1198cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov 
1199cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov DebugLoc DL = MBB.findDebugLoc(MI); 1200cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov 1201cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov MachineFunction &MF = *MBB.getParent(); 1202cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov const TargetInstrInfo &TII = *MF.getTarget().getInstrInfo(); 1203419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi 1204419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi // Reload XMMs from stack frame. 1205419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi for (unsigned i = 0, e = CSI.size(); i != e; ++i) { 1206419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi unsigned Reg = CSI[i].getReg(); 1207419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi if (X86::GR64RegClass.contains(Reg) || 1208419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi X86::GR32RegClass.contains(Reg)) 1209419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi continue; 1210419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi const TargetRegisterClass *RC = TRI->getMinimalPhysRegClass(Reg); 1211419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi TII.loadRegFromStackSlot(MBB, MI, Reg, CSI[i].getFrameIdx(), 1212419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi RC, TRI); 1213419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi } 1214419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi 1215419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi // POP GPRs. 1216cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov unsigned FPReg = TRI->getFrameRegister(MF); 1217cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov unsigned Opc = STI.is64Bit() ? 
X86::POP64r : X86::POP32r; 1218cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov for (unsigned i = 0, e = CSI.size(); i != e; ++i) { 1219cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov unsigned Reg = CSI[i].getReg(); 1220419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi if (!X86::GR64RegClass.contains(Reg) && 1221419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi !X86::GR32RegClass.contains(Reg)) 1222419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi continue; 1223cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov if (Reg == FPReg) 1224cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov // X86RegisterInfo::emitEpilogue will handle restoring of frame register. 1225cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov continue; 1226419f23278388a8999b5c0bbe73ce823f63747f28NAKAMURA Takumi BuildMI(MBB, MI, DL, TII.get(Opc), Reg); 1227cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov } 1228cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov return true; 1229cd775ceff0b25a0b026f643a7990c2924bd310a3Anton Korobeynikov} 123094c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov 123194c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikovvoid 123216c29b5f285f375be53dabaa73e3e91107485fe4Anton KorobeynikovX86FrameLowering::processFunctionBeforeCalleeSavedScan(MachineFunction &MF, 123394c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov RegScavenger *RS) const { 123494c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov MachineFrameInfo *MFI = MF.getFrameInfo(); 123594c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov const X86RegisterInfo *RegInfo = TM.getRegisterInfo(); 123694c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov unsigned SlotSize = RegInfo->getSlotSize(); 123794c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov 123894c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov X86MachineFunctionInfo *X86FI = MF.getInfo<X86MachineFunctionInfo>(); 
123994c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov int32_t TailCallReturnAddrDelta = X86FI->getTCReturnAddrDelta(); 124094c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov 124194c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov if (TailCallReturnAddrDelta < 0) { 124294c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov // create RETURNADDR area 124394c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov // arg 124494c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov // arg 124594c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov // RETADDR 124694c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov // { ... 124794c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov // RETADDR area 124894c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov // ... 124994c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov // } 125094c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov // [EBP] 125194c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov MFI->CreateFixedObject(-TailCallReturnAddrDelta, 125294c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov (-1U*SlotSize)+TailCallReturnAddrDelta, true); 125394c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov } 125494c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov 125594c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov if (hasFP(MF)) { 125694c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov assert((TailCallReturnAddrDelta <= 0) && 125794c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov "The Delta should always be zero or negative"); 125816c29b5f285f375be53dabaa73e3e91107485fe4Anton Korobeynikov const TargetFrameLowering &TFI = *MF.getTarget().getFrameLowering(); 125994c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov 126094c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov // Create a frame entry for the EBP register that must be saved. 
126194c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov int FrameIdx = MFI->CreateFixedObject(SlotSize, 126294c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov -(int)SlotSize + 126394c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov TFI.getOffsetOfLocalArea() + 126494c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov TailCallReturnAddrDelta, 126594c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov true); 126694c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov assert(FrameIdx == MFI->getObjectIndexBegin() && 126794c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov "Slot for EBP register must be last in order to be found!"); 126817001ce25cc205ac1cd2604492c2bce310964220Duncan Sands (void)FrameIdx; 126994c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov } 127094c5ae08750f314bc3cf1bf882b686244a3927d9Anton Korobeynikov} 127176927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 127276927d758657b3a511c73467ec5a7288795c1513Rafael Espindolastatic bool 127376927d758657b3a511c73467ec5a7288795c1513Rafael EspindolaHasNestArgument(const MachineFunction *MF) { 127476927d758657b3a511c73467ec5a7288795c1513Rafael Espindola const Function *F = MF->getFunction(); 127576927d758657b3a511c73467ec5a7288795c1513Rafael Espindola for (Function::const_arg_iterator I = F->arg_begin(), E = F->arg_end(); 127676927d758657b3a511c73467ec5a7288795c1513Rafael Espindola I != E; I++) { 127776927d758657b3a511c73467ec5a7288795c1513Rafael Espindola if (I->hasNestAttr()) 127876927d758657b3a511c73467ec5a7288795c1513Rafael Espindola return true; 127976927d758657b3a511c73467ec5a7288795c1513Rafael Espindola } 128076927d758657b3a511c73467ec5a7288795c1513Rafael Espindola return false; 128176927d758657b3a511c73467ec5a7288795c1513Rafael Espindola} 128276927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 128376927d758657b3a511c73467ec5a7288795c1513Rafael Espindolastatic unsigned 128476927d758657b3a511c73467ec5a7288795c1513Rafael 
EspindolaGetScratchRegister(bool Is64Bit, const MachineFunction &MF) { 128576927d758657b3a511c73467ec5a7288795c1513Rafael Espindola if (Is64Bit) { 128676927d758657b3a511c73467ec5a7288795c1513Rafael Espindola return X86::R11; 128776927d758657b3a511c73467ec5a7288795c1513Rafael Espindola } else { 128876927d758657b3a511c73467ec5a7288795c1513Rafael Espindola CallingConv::ID CallingConvention = MF.getFunction()->getCallingConv(); 128976927d758657b3a511c73467ec5a7288795c1513Rafael Espindola bool IsNested = HasNestArgument(&MF); 129076927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 129176927d758657b3a511c73467ec5a7288795c1513Rafael Espindola if (CallingConvention == CallingConv::X86_FastCall) { 129276927d758657b3a511c73467ec5a7288795c1513Rafael Espindola if (IsNested) { 1293e81abfd30b7c81735e9f3d79006c2653690aa592Rafael Espindola report_fatal_error("Segmented stacks does not support fastcall with " 1294e81abfd30b7c81735e9f3d79006c2653690aa592Rafael Espindola "nested function."); 129576927d758657b3a511c73467ec5a7288795c1513Rafael Espindola return -1; 129676927d758657b3a511c73467ec5a7288795c1513Rafael Espindola } else { 129776927d758657b3a511c73467ec5a7288795c1513Rafael Espindola return X86::EAX; 129876927d758657b3a511c73467ec5a7288795c1513Rafael Espindola } 129976927d758657b3a511c73467ec5a7288795c1513Rafael Espindola } else { 130076927d758657b3a511c73467ec5a7288795c1513Rafael Espindola if (IsNested) 130176927d758657b3a511c73467ec5a7288795c1513Rafael Espindola return X86::EDX; 130276927d758657b3a511c73467ec5a7288795c1513Rafael Espindola else 130376927d758657b3a511c73467ec5a7288795c1513Rafael Espindola return X86::ECX; 130476927d758657b3a511c73467ec5a7288795c1513Rafael Espindola } 130576927d758657b3a511c73467ec5a7288795c1513Rafael Espindola } 130676927d758657b3a511c73467ec5a7288795c1513Rafael Espindola} 130776927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 130876927d758657b3a511c73467ec5a7288795c1513Rafael Espindolavoid 
130976927d758657b3a511c73467ec5a7288795c1513Rafael EspindolaX86FrameLowering::adjustForSegmentedStacks(MachineFunction &MF) const { 131076927d758657b3a511c73467ec5a7288795c1513Rafael Espindola MachineBasicBlock &prologueMBB = MF.front(); 131176927d758657b3a511c73467ec5a7288795c1513Rafael Espindola MachineFrameInfo *MFI = MF.getFrameInfo(); 131276927d758657b3a511c73467ec5a7288795c1513Rafael Espindola const X86InstrInfo &TII = *TM.getInstrInfo(); 131376927d758657b3a511c73467ec5a7288795c1513Rafael Espindola uint64_t StackSize; 131476927d758657b3a511c73467ec5a7288795c1513Rafael Espindola bool Is64Bit = STI.is64Bit(); 131576927d758657b3a511c73467ec5a7288795c1513Rafael Espindola unsigned TlsReg, TlsOffset; 131676927d758657b3a511c73467ec5a7288795c1513Rafael Espindola DebugLoc DL; 131776927d758657b3a511c73467ec5a7288795c1513Rafael Espindola const X86Subtarget *ST = &MF.getTarget().getSubtarget<X86Subtarget>(); 131876927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 131976927d758657b3a511c73467ec5a7288795c1513Rafael Espindola unsigned ScratchReg = GetScratchRegister(Is64Bit, MF); 132076927d758657b3a511c73467ec5a7288795c1513Rafael Espindola assert(!MF.getRegInfo().isLiveIn(ScratchReg) && 132176927d758657b3a511c73467ec5a7288795c1513Rafael Espindola "Scratch register is live-in"); 132276927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 132376927d758657b3a511c73467ec5a7288795c1513Rafael Espindola if (MF.getFunction()->isVarArg()) 132476927d758657b3a511c73467ec5a7288795c1513Rafael Espindola report_fatal_error("Segmented stacks do not support vararg functions."); 132576927d758657b3a511c73467ec5a7288795c1513Rafael Espindola if (!ST->isTargetLinux()) 132676927d758657b3a511c73467ec5a7288795c1513Rafael Espindola report_fatal_error("Segmented stacks supported only on linux."); 132776927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 132876927d758657b3a511c73467ec5a7288795c1513Rafael Espindola MachineBasicBlock *allocMBB = MF.CreateMachineBasicBlock(); 
132976927d758657b3a511c73467ec5a7288795c1513Rafael Espindola MachineBasicBlock *checkMBB = MF.CreateMachineBasicBlock(); 133076927d758657b3a511c73467ec5a7288795c1513Rafael Espindola X86MachineFunctionInfo *X86FI = MF.getInfo<X86MachineFunctionInfo>(); 133176927d758657b3a511c73467ec5a7288795c1513Rafael Espindola bool IsNested = false; 133276927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 133376927d758657b3a511c73467ec5a7288795c1513Rafael Espindola // We need to know if the function has a nest argument only in 64 bit mode. 133476927d758657b3a511c73467ec5a7288795c1513Rafael Espindola if (Is64Bit) 133576927d758657b3a511c73467ec5a7288795c1513Rafael Espindola IsNested = HasNestArgument(&MF); 133676927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 13374e68054b20725f6ec1cac33630258f749fe5debeBill Wendling // The MOV R10, RAX needs to be in a different block, since the RET we emit in 13384e68054b20725f6ec1cac33630258f749fe5debeBill Wendling // allocMBB needs to be last (terminating) instruction. 
13394e68054b20725f6ec1cac33630258f749fe5debeBill Wendling MachineBasicBlock *restoreR10MBB = NULL; 13404e68054b20725f6ec1cac33630258f749fe5debeBill Wendling if (IsNested) 13414e68054b20725f6ec1cac33630258f749fe5debeBill Wendling restoreR10MBB = MF.CreateMachineBasicBlock(); 13424e68054b20725f6ec1cac33630258f749fe5debeBill Wendling 134376927d758657b3a511c73467ec5a7288795c1513Rafael Espindola for (MachineBasicBlock::livein_iterator i = prologueMBB.livein_begin(), 134476927d758657b3a511c73467ec5a7288795c1513Rafael Espindola e = prologueMBB.livein_end(); i != e; i++) { 134576927d758657b3a511c73467ec5a7288795c1513Rafael Espindola allocMBB->addLiveIn(*i); 134676927d758657b3a511c73467ec5a7288795c1513Rafael Espindola checkMBB->addLiveIn(*i); 13474e68054b20725f6ec1cac33630258f749fe5debeBill Wendling 13484e68054b20725f6ec1cac33630258f749fe5debeBill Wendling if (IsNested) 13494e68054b20725f6ec1cac33630258f749fe5debeBill Wendling restoreR10MBB->addLiveIn(*i); 135076927d758657b3a511c73467ec5a7288795c1513Rafael Espindola } 135176927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 13524e68054b20725f6ec1cac33630258f749fe5debeBill Wendling if (IsNested) { 135376927d758657b3a511c73467ec5a7288795c1513Rafael Espindola allocMBB->addLiveIn(X86::R10); 13544e68054b20725f6ec1cac33630258f749fe5debeBill Wendling restoreR10MBB->addLiveIn(X86::RAX); 13554e68054b20725f6ec1cac33630258f749fe5debeBill Wendling } 135676927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 13574e68054b20725f6ec1cac33630258f749fe5debeBill Wendling if (IsNested) 13584e68054b20725f6ec1cac33630258f749fe5debeBill Wendling MF.push_front(restoreR10MBB); 135976927d758657b3a511c73467ec5a7288795c1513Rafael Espindola MF.push_front(allocMBB); 136076927d758657b3a511c73467ec5a7288795c1513Rafael Espindola MF.push_front(checkMBB); 136176927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 136276927d758657b3a511c73467ec5a7288795c1513Rafael Espindola // Eventually StackSize will be calculated by a link-time pass; which will 
136376927d758657b3a511c73467ec5a7288795c1513Rafael Espindola // also decide whether checking code needs to be injected into this particular 136476927d758657b3a511c73467ec5a7288795c1513Rafael Espindola // prologue. 136576927d758657b3a511c73467ec5a7288795c1513Rafael Espindola StackSize = MFI->getStackSize(); 136676927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 136776927d758657b3a511c73467ec5a7288795c1513Rafael Espindola // Read the limit off the current stacklet off the stack_guard location. 136876927d758657b3a511c73467ec5a7288795c1513Rafael Espindola if (Is64Bit) { 136976927d758657b3a511c73467ec5a7288795c1513Rafael Espindola TlsReg = X86::FS; 137076927d758657b3a511c73467ec5a7288795c1513Rafael Espindola TlsOffset = 0x70; 137176927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 137276927d758657b3a511c73467ec5a7288795c1513Rafael Espindola BuildMI(checkMBB, DL, TII.get(X86::LEA64r), ScratchReg).addReg(X86::RSP) 137376927d758657b3a511c73467ec5a7288795c1513Rafael Espindola .addImm(0).addReg(0).addImm(-StackSize).addReg(0); 137476927d758657b3a511c73467ec5a7288795c1513Rafael Espindola BuildMI(checkMBB, DL, TII.get(X86::CMP64rm)).addReg(ScratchReg) 137576927d758657b3a511c73467ec5a7288795c1513Rafael Espindola .addReg(0).addImm(0).addReg(0).addImm(TlsOffset).addReg(TlsReg); 137676927d758657b3a511c73467ec5a7288795c1513Rafael Espindola } else { 137776927d758657b3a511c73467ec5a7288795c1513Rafael Espindola TlsReg = X86::GS; 137876927d758657b3a511c73467ec5a7288795c1513Rafael Espindola TlsOffset = 0x30; 137976927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 138076927d758657b3a511c73467ec5a7288795c1513Rafael Espindola BuildMI(checkMBB, DL, TII.get(X86::LEA32r), ScratchReg).addReg(X86::ESP) 138176927d758657b3a511c73467ec5a7288795c1513Rafael Espindola .addImm(0).addReg(0).addImm(-StackSize).addReg(0); 138276927d758657b3a511c73467ec5a7288795c1513Rafael Espindola BuildMI(checkMBB, DL, TII.get(X86::CMP32rm)).addReg(ScratchReg) 
138376927d758657b3a511c73467ec5a7288795c1513Rafael Espindola .addReg(0).addImm(0).addReg(0).addImm(TlsOffset).addReg(TlsReg); 138476927d758657b3a511c73467ec5a7288795c1513Rafael Espindola } 138576927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 138676927d758657b3a511c73467ec5a7288795c1513Rafael Espindola // This jump is taken if SP >= (Stacklet Limit + Stack Space required). 138776927d758657b3a511c73467ec5a7288795c1513Rafael Espindola // It jumps to normal execution of the function body. 138876927d758657b3a511c73467ec5a7288795c1513Rafael Espindola BuildMI(checkMBB, DL, TII.get(X86::JG_4)).addMBB(&prologueMBB); 138976927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 139076927d758657b3a511c73467ec5a7288795c1513Rafael Espindola // On 32 bit we first push the arguments size and then the frame size. On 64 139176927d758657b3a511c73467ec5a7288795c1513Rafael Espindola // bit, we pass the stack frame size in r10 and the argument size in r11. 139276927d758657b3a511c73467ec5a7288795c1513Rafael Espindola if (Is64Bit) { 139376927d758657b3a511c73467ec5a7288795c1513Rafael Espindola // Functions with nested arguments use R10, so it needs to be saved across 139476927d758657b3a511c73467ec5a7288795c1513Rafael Espindola // the call to _morestack 139576927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 139676927d758657b3a511c73467ec5a7288795c1513Rafael Espindola if (IsNested) 139776927d758657b3a511c73467ec5a7288795c1513Rafael Espindola BuildMI(allocMBB, DL, TII.get(X86::MOV64rr), X86::RAX).addReg(X86::R10); 139876927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 139976927d758657b3a511c73467ec5a7288795c1513Rafael Espindola BuildMI(allocMBB, DL, TII.get(X86::MOV64ri), X86::R10) 140076927d758657b3a511c73467ec5a7288795c1513Rafael Espindola .addImm(StackSize); 140176927d758657b3a511c73467ec5a7288795c1513Rafael Espindola BuildMI(allocMBB, DL, TII.get(X86::MOV64ri), X86::R11) 140276927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 
.addImm(X86FI->getArgumentStackSize()); 140376927d758657b3a511c73467ec5a7288795c1513Rafael Espindola MF.getRegInfo().setPhysRegUsed(X86::R10); 140476927d758657b3a511c73467ec5a7288795c1513Rafael Espindola MF.getRegInfo().setPhysRegUsed(X86::R11); 140576927d758657b3a511c73467ec5a7288795c1513Rafael Espindola } else { 140676927d758657b3a511c73467ec5a7288795c1513Rafael Espindola // Since we'll call __morestack, stack alignment needs to be preserved. 140776927d758657b3a511c73467ec5a7288795c1513Rafael Espindola BuildMI(allocMBB, DL, TII.get(X86::SUB32ri), X86::ESP).addReg(X86::ESP) 140876927d758657b3a511c73467ec5a7288795c1513Rafael Espindola .addImm(8); 140976927d758657b3a511c73467ec5a7288795c1513Rafael Espindola BuildMI(allocMBB, DL, TII.get(X86::PUSHi32)) 141076927d758657b3a511c73467ec5a7288795c1513Rafael Espindola .addImm(X86FI->getArgumentStackSize()); 141176927d758657b3a511c73467ec5a7288795c1513Rafael Espindola BuildMI(allocMBB, DL, TII.get(X86::PUSHi32)) 141276927d758657b3a511c73467ec5a7288795c1513Rafael Espindola .addImm(StackSize); 141376927d758657b3a511c73467ec5a7288795c1513Rafael Espindola } 141476927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 141576927d758657b3a511c73467ec5a7288795c1513Rafael Espindola // __morestack is in libgcc 141676927d758657b3a511c73467ec5a7288795c1513Rafael Espindola if (Is64Bit) 141776927d758657b3a511c73467ec5a7288795c1513Rafael Espindola BuildMI(allocMBB, DL, TII.get(X86::CALL64pcrel32)) 141876927d758657b3a511c73467ec5a7288795c1513Rafael Espindola .addExternalSymbol("__morestack"); 141976927d758657b3a511c73467ec5a7288795c1513Rafael Espindola else 142076927d758657b3a511c73467ec5a7288795c1513Rafael Espindola BuildMI(allocMBB, DL, TII.get(X86::CALLpcrel32)) 142176927d758657b3a511c73467ec5a7288795c1513Rafael Espindola .addExternalSymbol("__morestack"); 142276927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 142376927d758657b3a511c73467ec5a7288795c1513Rafael Espindola // __morestack only seems to remove 8 bytes off the stack. 
Add back the 142476927d758657b3a511c73467ec5a7288795c1513Rafael Espindola // additional 8 bytes we added before pushing the arguments. 142576927d758657b3a511c73467ec5a7288795c1513Rafael Espindola if (!Is64Bit) 142676927d758657b3a511c73467ec5a7288795c1513Rafael Espindola BuildMI(allocMBB, DL, TII.get(X86::ADD32ri), X86::ESP).addReg(X86::ESP) 142776927d758657b3a511c73467ec5a7288795c1513Rafael Espindola .addImm(8); 14284e68054b20725f6ec1cac33630258f749fe5debeBill Wendling BuildMI(allocMBB, DL, TII.get(X86::RET)); 142976927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 14304e68054b20725f6ec1cac33630258f749fe5debeBill Wendling if (IsNested) 14314e68054b20725f6ec1cac33630258f749fe5debeBill Wendling BuildMI(restoreR10MBB, DL, TII.get(X86::MOV64rr), X86::R10) 14324e68054b20725f6ec1cac33630258f749fe5debeBill Wendling .addReg(X86::RAX); 143376927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 14344e68054b20725f6ec1cac33630258f749fe5debeBill Wendling if (IsNested) { 14354e68054b20725f6ec1cac33630258f749fe5debeBill Wendling allocMBB->addSuccessor(restoreR10MBB); 14364e68054b20725f6ec1cac33630258f749fe5debeBill Wendling restoreR10MBB->addSuccessor(&prologueMBB); 14374e68054b20725f6ec1cac33630258f749fe5debeBill Wendling } else { 14384e68054b20725f6ec1cac33630258f749fe5debeBill Wendling allocMBB->addSuccessor(&prologueMBB); 14394e68054b20725f6ec1cac33630258f749fe5debeBill Wendling } 144082222c20be24adda7c218f3fdaf2e0ae049c955bBill Wendling 144176927d758657b3a511c73467ec5a7288795c1513Rafael Espindola checkMBB->addSuccessor(allocMBB); 144276927d758657b3a511c73467ec5a7288795c1513Rafael Espindola checkMBB->addSuccessor(&prologueMBB); 144376927d758657b3a511c73467ec5a7288795c1513Rafael Espindola 144451f0c7641983469cbd29f8862a121645471a885aJakob Stoklund Olesen#ifdef XDEBUG 144576927d758657b3a511c73467ec5a7288795c1513Rafael Espindola MF.verify(); 144676927d758657b3a511c73467ec5a7288795c1513Rafael Espindola#endif 144776927d758657b3a511c73467ec5a7288795c1513Rafael Espindola} 1448