Jia Liu | 31d157a | 2012-02-18 12:03:15 +0000 | [diff] [blame] | 1 | //===-- HexagonFrameLowering.cpp - Define frame lowering ------------------===// |
Tony Linthicum | b4b5415 | 2011-12-12 21:14:40 +0000 | [diff] [blame] | 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | // |
| 9 | //===----------------------------------------------------------------------===// |
Benjamin Kramer | f3fd7ee | 2012-02-06 10:19:29 +0000 | [diff] [blame] | 10 | |
Craig Topper | 79aa341 | 2012-03-17 18:46:09 +0000 | [diff] [blame] | 11 | #include "HexagonFrameLowering.h" |
Tony Linthicum | b4b5415 | 2011-12-12 21:14:40 +0000 | [diff] [blame] | 12 | #include "Hexagon.h" |
| 13 | #include "HexagonInstrInfo.h" |
| 14 | #include "HexagonRegisterInfo.h" |
| 15 | #include "HexagonSubtarget.h" |
| 16 | #include "HexagonTargetMachine.h" |
| 17 | #include "HexagonMachineFunctionInfo.h" |
Benjamin Kramer | f3fd7ee | 2012-02-06 10:19:29 +0000 | [diff] [blame] | 18 | #include "llvm/Function.h" |
Tony Linthicum | b4b5415 | 2011-12-12 21:14:40 +0000 | [diff] [blame] | 19 | #include "llvm/Type.h" |
| 20 | #include "llvm/ADT/BitVector.h" |
| 21 | #include "llvm/ADT/STLExtras.h" |
Benjamin Kramer | f3fd7ee | 2012-02-06 10:19:29 +0000 | [diff] [blame] | 22 | #include "llvm/CodeGen/AsmPrinter.h" |
| 23 | #include "llvm/CodeGen/MachineInstrBuilder.h" |
| 24 | #include "llvm/CodeGen/MachineFunction.h" |
| 25 | #include "llvm/CodeGen/MachineFunctionPass.h" |
| 26 | #include "llvm/CodeGen/MachineFrameInfo.h" |
| 27 | #include "llvm/CodeGen/MachineModuleInfo.h" |
| 28 | #include "llvm/CodeGen/MachineRegisterInfo.h" |
| 29 | #include "llvm/CodeGen/RegisterScavenging.h" |
| 30 | #include "llvm/MC/MachineLocation.h" |
| 31 | #include "llvm/MC/MCAsmInfo.h" |
| 32 | #include "llvm/Target/TargetInstrInfo.h" |
Tony Linthicum | b4b5415 | 2011-12-12 21:14:40 +0000 | [diff] [blame] | 33 | #include "llvm/Target/TargetMachine.h" |
| 34 | #include "llvm/Target/TargetOptions.h" |
Benjamin Kramer | f3fd7ee | 2012-02-06 10:19:29 +0000 | [diff] [blame] | 35 | #include "llvm/Support/CommandLine.h" |
Tony Linthicum | b4b5415 | 2011-12-12 21:14:40 +0000 | [diff] [blame] | 36 | |
Tony Linthicum | b4b5415 | 2011-12-12 21:14:40 +0000 | [diff] [blame] | 37 | using namespace llvm; |
| 38 | |
| 39 | static cl::opt<bool> DisableDeallocRet( |
| 40 | "disable-hexagon-dealloc-ret", |
| 41 | cl::Hidden, |
| 42 | cl::desc("Disable Dealloc Return for Hexagon target")); |
| 43 | |
| 44 | /// determineFrameLayout - Determine the size of the frame and maximum call |
| 45 | /// frame size. |
| 46 | void HexagonFrameLowering::determineFrameLayout(MachineFunction &MF) const { |
| 47 | MachineFrameInfo *MFI = MF.getFrameInfo(); |
| 48 | |
| 49 | // Get the number of bytes to allocate from the FrameInfo. |
| 50 | unsigned FrameSize = MFI->getStackSize(); |
| 51 | |
| 52 | // Get the alignments provided by the target. |
| 53 | unsigned TargetAlign = MF.getTarget().getFrameLowering()->getStackAlignment(); |
| 54 | // Get the maximum call frame size of all the calls. |
| 55 | unsigned maxCallFrameSize = MFI->getMaxCallFrameSize(); |
| 56 | |
| 57 | // If we have dynamic alloca then maxCallFrameSize needs to be aligned so |
| 58 | // that allocations will be aligned. |
| 59 | if (MFI->hasVarSizedObjects()) |
| 60 | maxCallFrameSize = RoundUpToAlignment(maxCallFrameSize, TargetAlign); |
| 61 | |
| 62 | // Update maximum call frame size. |
| 63 | MFI->setMaxCallFrameSize(maxCallFrameSize); |
| 64 | |
| 65 | // Include call frame size in total. |
| 66 | FrameSize += maxCallFrameSize; |
| 67 | |
| 68 | // Make sure the frame is aligned. |
| 69 | FrameSize = RoundUpToAlignment(FrameSize, TargetAlign); |
| 70 | |
| 71 | // Update frame info. |
| 72 | MFI->setStackSize(FrameSize); |
| 73 | } |
| 74 | |
| 75 | |
| 76 | void HexagonFrameLowering::emitPrologue(MachineFunction &MF) const { |
| 77 | MachineBasicBlock &MBB = MF.front(); |
| 78 | MachineFrameInfo *MFI = MF.getFrameInfo(); |
| 79 | MachineModuleInfo &MMI = MF.getMMI(); |
| 80 | MachineBasicBlock::iterator MBBI = MBB.begin(); |
| 81 | const HexagonRegisterInfo *QRI = |
| 82 | static_cast<const HexagonRegisterInfo *>(MF.getTarget().getRegisterInfo()); |
| 83 | DebugLoc dl = MBBI != MBB.end() ? MBBI->getDebugLoc() : DebugLoc(); |
| 84 | determineFrameLayout(MF); |
| 85 | |
| 86 | // Check if frame moves are needed for EH. |
| 87 | bool needsFrameMoves = MMI.hasDebugInfo() || |
| 88 | !MF.getFunction()->needsUnwindTableEntry(); |
| 89 | |
| 90 | // Get the number of bytes to allocate from the FrameInfo. |
| 91 | int NumBytes = (int) MFI->getStackSize(); |
| 92 | |
| 93 | // LLVM expects allocframe not to be the first instruction in the |
| 94 | // basic block. |
| 95 | MachineBasicBlock::iterator InsertPt = MBB.begin(); |
| 96 | |
| 97 | // |
| 98 | // ALLOCA adjust regs. Iterate over ADJDYNALLOC nodes and change the offset. |
| 99 | // |
| 100 | HexagonMachineFunctionInfo *FuncInfo = |
| 101 | MF.getInfo<HexagonMachineFunctionInfo>(); |
| 102 | const std::vector<MachineInstr*>& AdjustRegs = |
| 103 | FuncInfo->getAllocaAdjustInsts(); |
| 104 | for (std::vector<MachineInstr*>::const_iterator i = AdjustRegs.begin(), |
| 105 | e = AdjustRegs.end(); |
| 106 | i != e; ++i) { |
| 107 | MachineInstr* MI = *i; |
| 108 | assert((MI->getOpcode() == Hexagon::ADJDYNALLOC) && |
| 109 | "Expected adjust alloca node"); |
| 110 | |
| 111 | MachineOperand& MO = MI->getOperand(2); |
| 112 | assert(MO.isImm() && "Expected immediate"); |
| 113 | MO.setImm(MFI->getMaxCallFrameSize()); |
| 114 | } |
| 115 | |
| 116 | std::vector<MachineMove> &Moves = MMI.getFrameMoves(); |
| 117 | |
| 118 | if (needsFrameMoves) { |
| 119 | // Advance CFA. DW_CFA_def_cfa |
| 120 | unsigned FPReg = QRI->getFrameRegister(); |
| 121 | unsigned RAReg = QRI->getRARegister(); |
| 122 | |
| 123 | MachineLocation Dst(MachineLocation::VirtualFP); |
| 124 | MachineLocation Src(FPReg, -8); |
| 125 | Moves.push_back(MachineMove(0, Dst, Src)); |
| 126 | |
| 127 | // R31 = (R31 - #4) |
| 128 | MachineLocation LRDst(RAReg, -4); |
| 129 | MachineLocation LRSrc(RAReg); |
| 130 | Moves.push_back(MachineMove(0, LRDst, LRSrc)); |
| 131 | |
| 132 | // R30 = (R30 - #8) |
| 133 | MachineLocation SPDst(FPReg, -8); |
| 134 | MachineLocation SPSrc(FPReg); |
| 135 | Moves.push_back(MachineMove(0, SPDst, SPSrc)); |
| 136 | } |
| 137 | |
| 138 | // |
| 139 | // Only insert ALLOCFRAME if we need to. |
| 140 | // |
| 141 | if (hasFP(MF)) { |
| 142 | // Check for overflow. |
| 143 | // Hexagon_TODO: Ugh! hardcoding. Is there an API that can be used? |
Tony Linthicum | 22614a0 | 2011-12-12 21:52:59 +0000 | [diff] [blame] | 144 | const int ALLOCFRAME_MAX = 16384; |
Tony Linthicum | b4b5415 | 2011-12-12 21:14:40 +0000 | [diff] [blame] | 145 | const TargetInstrInfo &TII = *MF.getTarget().getInstrInfo(); |
| 146 | |
| 147 | if (NumBytes >= ALLOCFRAME_MAX) { |
| 148 | // Emit allocframe(#0). |
| 149 | BuildMI(MBB, InsertPt, dl, TII.get(Hexagon::ALLOCFRAME)).addImm(0); |
| 150 | |
| 151 | // Subtract offset from frame pointer. |
| 152 | BuildMI(MBB, InsertPt, dl, TII.get(Hexagon::CONST32_Int_Real), |
| 153 | HEXAGON_RESERVED_REG_1).addImm(NumBytes); |
| 154 | BuildMI(MBB, InsertPt, dl, TII.get(Hexagon::SUB_rr), |
| 155 | QRI->getStackRegister()). |
| 156 | addReg(QRI->getStackRegister()). |
| 157 | addReg(HEXAGON_RESERVED_REG_1); |
| 158 | } else { |
| 159 | BuildMI(MBB, InsertPt, dl, TII.get(Hexagon::ALLOCFRAME)).addImm(NumBytes); |
| 160 | } |
| 161 | } |
| 162 | } |
| 163 | // Returns true if MBB has a machine instructions that indicates a tail call |
| 164 | // in the block. |
| 165 | bool HexagonFrameLowering::hasTailCall(MachineBasicBlock &MBB) const { |
| 166 | MachineBasicBlock::iterator MBBI = MBB.getLastNonDebugInstr(); |
| 167 | unsigned RetOpcode = MBBI->getOpcode(); |
| 168 | |
| 169 | return RetOpcode == Hexagon::TCRETURNtg || RetOpcode == Hexagon::TCRETURNtext;} |
| 170 | |
| 171 | void HexagonFrameLowering::emitEpilogue(MachineFunction &MF, |
| 172 | MachineBasicBlock &MBB) const { |
| 173 | MachineBasicBlock::iterator MBBI = prior(MBB.end()); |
| 174 | DebugLoc dl = MBBI->getDebugLoc(); |
| 175 | // |
| 176 | // Only insert deallocframe if we need to. |
| 177 | // |
| 178 | if (hasFP(MF)) { |
| 179 | MachineBasicBlock::iterator MBBI = prior(MBB.end()); |
| 180 | MachineBasicBlock::iterator MBBI_end = MBB.end(); |
| 181 | // |
| 182 | // For Hexagon, we don't need the frame size. |
| 183 | // |
| 184 | MachineFrameInfo *MFI = MF.getFrameInfo(); |
| 185 | int NumBytes = (int) MFI->getStackSize(); |
| 186 | |
| 187 | const TargetInstrInfo &TII = *MF.getTarget().getInstrInfo(); |
| 188 | |
| 189 | // Replace 'jumpr r31' instruction with dealloc_return for V4 and higher |
| 190 | // versions. |
| 191 | if (STI.hasV4TOps() && MBBI->getOpcode() == Hexagon::JMPR |
| 192 | && !DisableDeallocRet) { |
| 193 | // Remove jumpr node. |
| 194 | MBB.erase(MBBI); |
| 195 | // Add dealloc_return. |
| 196 | BuildMI(MBB, MBBI_end, dl, TII.get(Hexagon::DEALLOC_RET_V4)) |
| 197 | .addImm(NumBytes); |
| 198 | } else { // Add deallocframe for V2 and V3. |
| 199 | BuildMI(MBB, MBBI, dl, TII.get(Hexagon::DEALLOCFRAME)).addImm(NumBytes); |
| 200 | } |
| 201 | } |
| 202 | } |
| 203 | |
| 204 | bool HexagonFrameLowering::hasFP(const MachineFunction &MF) const { |
| 205 | const MachineFrameInfo *MFI = MF.getFrameInfo(); |
| 206 | const HexagonMachineFunctionInfo *FuncInfo = |
| 207 | MF.getInfo<HexagonMachineFunctionInfo>(); |
| 208 | return (MFI->hasCalls() || (MFI->getStackSize() > 0) || |
| 209 | FuncInfo->hasClobberLR() ); |
| 210 | } |
| 211 | |
Jakob Stoklund Olesen | 4aecc76 | 2012-05-30 22:40:03 +0000 | [diff] [blame^] | 212 | static inline |
| 213 | unsigned uniqueSuperReg(unsigned Reg, const TargetRegisterInfo *TRI) { |
| 214 | MCSuperRegIterator SRI(Reg, TRI); |
| 215 | assert(SRI.isValid() && "Expected a superreg"); |
| 216 | unsigned SuperReg = *SRI; |
| 217 | ++SRI; |
| 218 | assert(!SRI.isValid() && "Expected exactly one superreg"); |
| 219 | return SuperReg; |
| 220 | } |
| 221 | |
Tony Linthicum | b4b5415 | 2011-12-12 21:14:40 +0000 | [diff] [blame] | 222 | bool |
| 223 | HexagonFrameLowering::spillCalleeSavedRegisters( |
| 224 | MachineBasicBlock &MBB, |
| 225 | MachineBasicBlock::iterator MI, |
| 226 | const std::vector<CalleeSavedInfo> &CSI, |
| 227 | const TargetRegisterInfo *TRI) const { |
| 228 | MachineFunction *MF = MBB.getParent(); |
| 229 | const TargetInstrInfo &TII = *MF->getTarget().getInstrInfo(); |
| 230 | |
| 231 | if (CSI.empty()) { |
| 232 | return false; |
| 233 | } |
| 234 | |
| 235 | // We can only schedule double loads if we spill contiguous callee-saved regs |
| 236 | // For instance, we cannot scheduled double-word loads if we spill r24, |
| 237 | // r26, and r27. |
| 238 | // Hexagon_TODO: We can try to double-word align odd registers for -O2 and |
| 239 | // above. |
| 240 | bool ContiguousRegs = true; |
| 241 | |
| 242 | for (unsigned i = 0; i < CSI.size(); ++i) { |
| 243 | unsigned Reg = CSI[i].getReg(); |
| 244 | |
| 245 | // |
| 246 | // Check if we can use a double-word store. |
| 247 | // |
Jakob Stoklund Olesen | 4aecc76 | 2012-05-30 22:40:03 +0000 | [diff] [blame^] | 248 | unsigned SuperReg = uniqueSuperReg(Reg, TRI); |
Tony Linthicum | b4b5415 | 2011-12-12 21:14:40 +0000 | [diff] [blame] | 249 | bool CanUseDblStore = false; |
| 250 | const TargetRegisterClass* SuperRegClass = 0; |
| 251 | |
| 252 | if (ContiguousRegs && (i < CSI.size()-1)) { |
Jakob Stoklund Olesen | 4aecc76 | 2012-05-30 22:40:03 +0000 | [diff] [blame^] | 253 | unsigned SuperRegNext = uniqueSuperReg(CSI[i+1].getReg(), TRI); |
| 254 | SuperRegClass = TRI->getMinimalPhysRegClass(SuperReg); |
| 255 | CanUseDblStore = (SuperRegNext == SuperReg); |
Tony Linthicum | b4b5415 | 2011-12-12 21:14:40 +0000 | [diff] [blame] | 256 | } |
| 257 | |
| 258 | |
| 259 | if (CanUseDblStore) { |
Jakob Stoklund Olesen | 4aecc76 | 2012-05-30 22:40:03 +0000 | [diff] [blame^] | 260 | TII.storeRegToStackSlot(MBB, MI, SuperReg, true, |
Tony Linthicum | b4b5415 | 2011-12-12 21:14:40 +0000 | [diff] [blame] | 261 | CSI[i+1].getFrameIdx(), SuperRegClass, TRI); |
Jakob Stoklund Olesen | 4aecc76 | 2012-05-30 22:40:03 +0000 | [diff] [blame^] | 262 | MBB.addLiveIn(SuperReg); |
Tony Linthicum | b4b5415 | 2011-12-12 21:14:40 +0000 | [diff] [blame] | 263 | ++i; |
| 264 | } else { |
| 265 | // Cannot use a double-word store. |
| 266 | ContiguousRegs = false; |
| 267 | const TargetRegisterClass *RC = TRI->getMinimalPhysRegClass(Reg); |
| 268 | TII.storeRegToStackSlot(MBB, MI, Reg, true, CSI[i].getFrameIdx(), RC, |
| 269 | TRI); |
| 270 | MBB.addLiveIn(Reg); |
| 271 | } |
| 272 | } |
| 273 | return true; |
| 274 | } |
| 275 | |
| 276 | |
| 277 | bool HexagonFrameLowering::restoreCalleeSavedRegisters( |
| 278 | MachineBasicBlock &MBB, |
| 279 | MachineBasicBlock::iterator MI, |
| 280 | const std::vector<CalleeSavedInfo> &CSI, |
| 281 | const TargetRegisterInfo *TRI) const { |
| 282 | |
| 283 | MachineFunction *MF = MBB.getParent(); |
| 284 | const TargetInstrInfo &TII = *MF->getTarget().getInstrInfo(); |
| 285 | |
| 286 | if (CSI.empty()) { |
| 287 | return false; |
| 288 | } |
| 289 | |
| 290 | // We can only schedule double loads if we spill contiguous callee-saved regs |
| 291 | // For instance, we cannot scheduled double-word loads if we spill r24, |
| 292 | // r26, and r27. |
| 293 | // Hexagon_TODO: We can try to double-word align odd registers for -O2 and |
| 294 | // above. |
| 295 | bool ContiguousRegs = true; |
| 296 | |
| 297 | for (unsigned i = 0; i < CSI.size(); ++i) { |
| 298 | unsigned Reg = CSI[i].getReg(); |
| 299 | |
| 300 | // |
| 301 | // Check if we can use a double-word load. |
| 302 | // |
Jakob Stoklund Olesen | 4aecc76 | 2012-05-30 22:40:03 +0000 | [diff] [blame^] | 303 | unsigned SuperReg = uniqueSuperReg(Reg, TRI); |
Tony Linthicum | b4b5415 | 2011-12-12 21:14:40 +0000 | [diff] [blame] | 304 | const TargetRegisterClass* SuperRegClass = 0; |
Tony Linthicum | b4b5415 | 2011-12-12 21:14:40 +0000 | [diff] [blame] | 305 | bool CanUseDblLoad = false; |
| 306 | if (ContiguousRegs && (i < CSI.size()-1)) { |
Jakob Stoklund Olesen | 4aecc76 | 2012-05-30 22:40:03 +0000 | [diff] [blame^] | 307 | unsigned SuperRegNext = uniqueSuperReg(CSI[i+1].getReg(), TRI); |
| 308 | SuperRegClass = TRI->getMinimalPhysRegClass(SuperReg); |
| 309 | CanUseDblLoad = (SuperRegNext == SuperReg); |
Tony Linthicum | b4b5415 | 2011-12-12 21:14:40 +0000 | [diff] [blame] | 310 | } |
| 311 | |
| 312 | |
| 313 | if (CanUseDblLoad) { |
Jakob Stoklund Olesen | 4aecc76 | 2012-05-30 22:40:03 +0000 | [diff] [blame^] | 314 | TII.loadRegFromStackSlot(MBB, MI, SuperReg, CSI[i+1].getFrameIdx(), |
Tony Linthicum | b4b5415 | 2011-12-12 21:14:40 +0000 | [diff] [blame] | 315 | SuperRegClass, TRI); |
Jakob Stoklund Olesen | 4aecc76 | 2012-05-30 22:40:03 +0000 | [diff] [blame^] | 316 | MBB.addLiveIn(SuperReg); |
Tony Linthicum | b4b5415 | 2011-12-12 21:14:40 +0000 | [diff] [blame] | 317 | ++i; |
| 318 | } else { |
| 319 | // Cannot use a double-word load. |
| 320 | ContiguousRegs = false; |
| 321 | const TargetRegisterClass *RC = TRI->getMinimalPhysRegClass(Reg); |
| 322 | TII.loadRegFromStackSlot(MBB, MI, Reg, CSI[i].getFrameIdx(), RC, TRI); |
| 323 | MBB.addLiveIn(Reg); |
| 324 | } |
| 325 | } |
| 326 | return true; |
| 327 | } |
| 328 | |
| 329 | int HexagonFrameLowering::getFrameIndexOffset(const MachineFunction &MF, |
| 330 | int FI) const { |
| 331 | return MF.getFrameInfo()->getObjectOffset(FI); |
| 332 | } |