//===-- HexagonPeephole.cpp - Hexagon Peephole Optimizations --------------===//
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | // This peephole pass optimizes in the following cases. |
| 9 | // 1. Optimizes redundant sign extends for the following case |
| 10 | // Transform the following pattern |
| 11 | // %vreg170<def> = SXTW %vreg166 |
| 12 | // ... |
| 13 | // %vreg176<def> = COPY %vreg170:subreg_loreg |
| 14 | // |
| 15 | // Into |
| 16 | // %vreg176<def> = COPY vreg166 |
| 17 | // |
| 18 | // 2. Optimizes redundant negation of predicates. |
| 19 | // %vreg15<def> = CMPGTrr %vreg6, %vreg2 |
| 20 | // ... |
| 21 | // %vreg16<def> = NOT_p %vreg15<kill> |
| 22 | // ... |
| 23 | // JMP_c %vreg16<kill>, <BB#1>, %PC<imp-def,dead> |
| 24 | // |
| 25 | // Into |
| 26 | // %vreg15<def> = CMPGTrr %vreg6, %vreg2; |
| 27 | // ... |
| 28 | // JMP_cNot %vreg15<kill>, <BB#1>, %PC<imp-def,dead>; |
| 29 | // |
// Note: The peephole pass makes instructions like
//       %vreg170<def> = SXTW %vreg166 or %vreg16<def> = NOT_p %vreg15<kill>
//       redundant and relies on some form of dead instruction removal, like
//       DCE or DIE, to actually eliminate them.
| 34 | |
| 35 | |
| 36 | //===----------------------------------------------------------------------===// |
| 37 | |
Craig Topper | b25fda9 | 2012-03-17 18:46:09 +0000 | [diff] [blame] | 38 | #include "Hexagon.h" |
| 39 | #include "HexagonTargetMachine.h" |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 40 | #include "llvm/ADT/DenseMap.h" |
| 41 | #include "llvm/ADT/Statistic.h" |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 42 | #include "llvm/CodeGen/MachineFunction.h" |
| 43 | #include "llvm/CodeGen/MachineFunctionPass.h" |
| 44 | #include "llvm/CodeGen/MachineInstrBuilder.h" |
| 45 | #include "llvm/CodeGen/MachineRegisterInfo.h" |
Chandler Carruth | ed0881b | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 46 | #include "llvm/CodeGen/Passes.h" |
Chandler Carruth | 9fb823b | 2013-01-02 11:36:10 +0000 | [diff] [blame] | 47 | #include "llvm/IR/Constants.h" |
Chandler Carruth | ed0881b | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 48 | #include "llvm/PassSupport.h" |
Craig Topper | b25fda9 | 2012-03-17 18:46:09 +0000 | [diff] [blame] | 49 | #include "llvm/Support/CommandLine.h" |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 50 | #include "llvm/Support/Debug.h" |
| 51 | #include "llvm/Support/raw_ostream.h" |
Chandler Carruth | ed0881b | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 52 | #include "llvm/Target/TargetInstrInfo.h" |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 53 | #include "llvm/Target/TargetMachine.h" |
| 54 | #include "llvm/Target/TargetRegisterInfo.h" |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 55 | #include <algorithm> |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 56 | |
| 57 | using namespace llvm; |
| 58 | |
Chandler Carruth | 84e68b2 | 2014-04-22 02:41:26 +0000 | [diff] [blame] | 59 | #define DEBUG_TYPE "hexagon-peephole" |
| 60 | |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 61 | static cl::opt<bool> DisableHexagonPeephole("disable-hexagon-peephole", |
| 62 | cl::Hidden, cl::ZeroOrMore, cl::init(false), |
| 63 | cl::desc("Disable Peephole Optimization")); |
| 64 | |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 65 | static cl::opt<bool> DisablePNotP("disable-hexagon-pnotp", |
| 66 | cl::Hidden, cl::ZeroOrMore, cl::init(false), |
| 67 | cl::desc("Disable Optimization of PNotP")); |
| 68 | |
| 69 | static cl::opt<bool> DisableOptSZExt("disable-hexagon-optszext", |
| 70 | cl::Hidden, cl::ZeroOrMore, cl::init(false), |
| 71 | cl::desc("Disable Optimization of Sign/Zero Extends")); |
| 72 | |
Pranav Bhandarkar | 7dda912 | 2013-05-02 20:22:51 +0000 | [diff] [blame] | 73 | static cl::opt<bool> DisableOptExtTo64("disable-hexagon-opt-ext-to-64", |
| 74 | cl::Hidden, cl::ZeroOrMore, cl::init(false), |
| 75 | cl::desc("Disable Optimization of extensions to i64.")); |
| 76 | |
Krzysztof Parzyszek | 18ee119 | 2013-05-06 21:58:00 +0000 | [diff] [blame] | 77 | namespace llvm { |
| 78 | void initializeHexagonPeepholePass(PassRegistry&); |
| 79 | } |
| 80 | |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 81 | namespace { |
| 82 | struct HexagonPeephole : public MachineFunctionPass { |
| 83 | const HexagonInstrInfo *QII; |
| 84 | const HexagonRegisterInfo *QRI; |
| 85 | const MachineRegisterInfo *MRI; |
| 86 | |
| 87 | public: |
| 88 | static char ID; |
Krzysztof Parzyszek | 18ee119 | 2013-05-06 21:58:00 +0000 | [diff] [blame] | 89 | HexagonPeephole() : MachineFunctionPass(ID) { |
| 90 | initializeHexagonPeepholePass(*PassRegistry::getPassRegistry()); |
| 91 | } |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 92 | |
Craig Topper | 906c2cd | 2014-04-29 07:58:16 +0000 | [diff] [blame] | 93 | bool runOnMachineFunction(MachineFunction &MF) override; |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 94 | |
Craig Topper | 906c2cd | 2014-04-29 07:58:16 +0000 | [diff] [blame] | 95 | const char *getPassName() const override { |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 96 | return "Hexagon optimize redundant zero and size extends"; |
| 97 | } |
| 98 | |
Craig Topper | 906c2cd | 2014-04-29 07:58:16 +0000 | [diff] [blame] | 99 | void getAnalysisUsage(AnalysisUsage &AU) const override { |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 100 | MachineFunctionPass::getAnalysisUsage(AU); |
| 101 | } |
| 102 | |
| 103 | private: |
| 104 | void ChangeOpInto(MachineOperand &Dst, MachineOperand &Src); |
| 105 | }; |
| 106 | } |
| 107 | |
| 108 | char HexagonPeephole::ID = 0; |
| 109 | |
Krzysztof Parzyszek | 18ee119 | 2013-05-06 21:58:00 +0000 | [diff] [blame] | 110 | INITIALIZE_PASS(HexagonPeephole, "hexagon-peephole", "Hexagon Peephole", |
| 111 | false, false) |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 112 | |
Krzysztof Parzyszek | 18ee119 | 2013-05-06 21:58:00 +0000 | [diff] [blame] | 113 | bool HexagonPeephole::runOnMachineFunction(MachineFunction &MF) { |
Eric Christopher | fc6de42 | 2014-08-05 02:39:49 +0000 | [diff] [blame] | 114 | QII = static_cast<const HexagonInstrInfo *>(MF.getSubtarget().getInstrInfo()); |
Eric Christopher | d913448 | 2014-08-04 21:25:23 +0000 | [diff] [blame] | 115 | QRI = MF.getTarget().getSubtarget<HexagonSubtarget>().getRegisterInfo(); |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 116 | MRI = &MF.getRegInfo(); |
| 117 | |
| 118 | DenseMap<unsigned, unsigned> PeepholeMap; |
Pranav Bhandarkar | 823f9eb | 2012-09-05 16:01:40 +0000 | [diff] [blame] | 119 | DenseMap<unsigned, std::pair<unsigned, unsigned> > PeepholeDoubleRegsMap; |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 120 | |
| 121 | if (DisableHexagonPeephole) return false; |
| 122 | |
| 123 | // Loop over all of the basic blocks. |
| 124 | for (MachineFunction::iterator MBBb = MF.begin(), MBBe = MF.end(); |
| 125 | MBBb != MBBe; ++MBBb) { |
| 126 | MachineBasicBlock* MBB = MBBb; |
| 127 | PeepholeMap.clear(); |
Pranav Bhandarkar | 823f9eb | 2012-09-05 16:01:40 +0000 | [diff] [blame] | 128 | PeepholeDoubleRegsMap.clear(); |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 129 | |
| 130 | // Traverse the basic block. |
| 131 | for (MachineBasicBlock::iterator MII = MBB->begin(); MII != MBB->end(); |
| 132 | ++MII) { |
| 133 | MachineInstr *MI = MII; |
| 134 | // Look for sign extends: |
| 135 | // %vreg170<def> = SXTW %vreg166 |
Colin LeMahieu | eb52f69 | 2014-12-11 16:43:06 +0000 | [diff] [blame] | 136 | if (!DisableOptSZExt && MI->getOpcode() == Hexagon::A2_sxtw) { |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 137 | assert (MI->getNumOperands() == 2); |
| 138 | MachineOperand &Dst = MI->getOperand(0); |
| 139 | MachineOperand &Src = MI->getOperand(1); |
| 140 | unsigned DstReg = Dst.getReg(); |
| 141 | unsigned SrcReg = Src.getReg(); |
| 142 | // Just handle virtual registers. |
| 143 | if (TargetRegisterInfo::isVirtualRegister(DstReg) && |
| 144 | TargetRegisterInfo::isVirtualRegister(SrcReg)) { |
| 145 | // Map the following: |
| 146 | // %vreg170<def> = SXTW %vreg166 |
| 147 | // PeepholeMap[170] = vreg166 |
| 148 | PeepholeMap[DstReg] = SrcReg; |
| 149 | } |
| 150 | } |
| 151 | |
Pranav Bhandarkar | 7dda912 | 2013-05-02 20:22:51 +0000 | [diff] [blame] | 152 | // Look for %vreg170<def> = COMBINE_ir_V4 (0, %vreg169) |
| 153 | // %vreg170:DoublRegs, %vreg169:IntRegs |
| 154 | if (!DisableOptExtTo64 && |
| 155 | MI->getOpcode () == Hexagon::COMBINE_Ir_V4) { |
| 156 | assert (MI->getNumOperands() == 3); |
| 157 | MachineOperand &Dst = MI->getOperand(0); |
| 158 | MachineOperand &Src1 = MI->getOperand(1); |
| 159 | MachineOperand &Src2 = MI->getOperand(2); |
| 160 | if (Src1.getImm() != 0) |
| 161 | continue; |
| 162 | unsigned DstReg = Dst.getReg(); |
| 163 | unsigned SrcReg = Src2.getReg(); |
| 164 | PeepholeMap[DstReg] = SrcReg; |
| 165 | } |
| 166 | |
Pranav Bhandarkar | 823f9eb | 2012-09-05 16:01:40 +0000 | [diff] [blame] | 167 | // Look for this sequence below |
| 168 | // %vregDoubleReg1 = LSRd_ri %vregDoubleReg0, 32 |
| 169 | // %vregIntReg = COPY %vregDoubleReg1:subreg_loreg. |
| 170 | // and convert into |
| 171 | // %vregIntReg = COPY %vregDoubleReg0:subreg_hireg. |
Colin LeMahieu | aa1bade | 2014-12-16 23:36:15 +0000 | [diff] [blame^] | 172 | if (MI->getOpcode() == Hexagon::S2_lsr_i_p) { |
Pranav Bhandarkar | 823f9eb | 2012-09-05 16:01:40 +0000 | [diff] [blame] | 173 | assert(MI->getNumOperands() == 3); |
| 174 | MachineOperand &Dst = MI->getOperand(0); |
| 175 | MachineOperand &Src1 = MI->getOperand(1); |
| 176 | MachineOperand &Src2 = MI->getOperand(2); |
| 177 | if (Src2.getImm() != 32) |
| 178 | continue; |
| 179 | unsigned DstReg = Dst.getReg(); |
| 180 | unsigned SrcReg = Src1.getReg(); |
| 181 | PeepholeDoubleRegsMap[DstReg] = |
| 182 | std::make_pair(*&SrcReg, 1/*Hexagon::subreg_hireg*/); |
| 183 | } |
| 184 | |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 185 | // Look for P=NOT(P). |
| 186 | if (!DisablePNotP && |
Colin LeMahieu | 5cf5632 | 2014-12-08 23:55:43 +0000 | [diff] [blame] | 187 | (MI->getOpcode() == Hexagon::C2_not)) { |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 188 | assert (MI->getNumOperands() == 2); |
| 189 | MachineOperand &Dst = MI->getOperand(0); |
| 190 | MachineOperand &Src = MI->getOperand(1); |
| 191 | unsigned DstReg = Dst.getReg(); |
| 192 | unsigned SrcReg = Src.getReg(); |
| 193 | // Just handle virtual registers. |
| 194 | if (TargetRegisterInfo::isVirtualRegister(DstReg) && |
| 195 | TargetRegisterInfo::isVirtualRegister(SrcReg)) { |
| 196 | // Map the following: |
| 197 | // %vreg170<def> = NOT_xx %vreg166 |
| 198 | // PeepholeMap[170] = vreg166 |
| 199 | PeepholeMap[DstReg] = SrcReg; |
| 200 | } |
| 201 | } |
| 202 | |
| 203 | // Look for copy: |
| 204 | // %vreg176<def> = COPY %vreg170:subreg_loreg |
| 205 | if (!DisableOptSZExt && MI->isCopy()) { |
| 206 | assert (MI->getNumOperands() == 2); |
| 207 | MachineOperand &Dst = MI->getOperand(0); |
| 208 | MachineOperand &Src = MI->getOperand(1); |
| 209 | |
| 210 | // Make sure we are copying the lower 32 bits. |
| 211 | if (Src.getSubReg() != Hexagon::subreg_loreg) |
| 212 | continue; |
| 213 | |
| 214 | unsigned DstReg = Dst.getReg(); |
| 215 | unsigned SrcReg = Src.getReg(); |
| 216 | if (TargetRegisterInfo::isVirtualRegister(DstReg) && |
| 217 | TargetRegisterInfo::isVirtualRegister(SrcReg)) { |
| 218 | // Try to find in the map. |
| 219 | if (unsigned PeepholeSrc = PeepholeMap.lookup(SrcReg)) { |
| 220 | // Change the 1st operand. |
| 221 | MI->RemoveOperand(1); |
| 222 | MI->addOperand(MachineOperand::CreateReg(PeepholeSrc, false)); |
Pranav Bhandarkar | 823f9eb | 2012-09-05 16:01:40 +0000 | [diff] [blame] | 223 | } else { |
| 224 | DenseMap<unsigned, std::pair<unsigned, unsigned> >::iterator DI = |
| 225 | PeepholeDoubleRegsMap.find(SrcReg); |
| 226 | if (DI != PeepholeDoubleRegsMap.end()) { |
| 227 | std::pair<unsigned,unsigned> PeepholeSrc = DI->second; |
| 228 | MI->RemoveOperand(1); |
| 229 | MI->addOperand(MachineOperand::CreateReg(PeepholeSrc.first, |
| 230 | false /*isDef*/, |
| 231 | false /*isImp*/, |
| 232 | false /*isKill*/, |
| 233 | false /*isDead*/, |
| 234 | false /*isUndef*/, |
| 235 | false /*isEarlyClobber*/, |
| 236 | PeepholeSrc.second)); |
| 237 | } |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 238 | } |
| 239 | } |
| 240 | } |
| 241 | |
| 242 | // Look for Predicated instructions. |
| 243 | if (!DisablePNotP) { |
| 244 | bool Done = false; |
| 245 | if (QII->isPredicated(MI)) { |
| 246 | MachineOperand &Op0 = MI->getOperand(0); |
| 247 | unsigned Reg0 = Op0.getReg(); |
| 248 | const TargetRegisterClass *RC0 = MRI->getRegClass(Reg0); |
| 249 | if (RC0->getID() == Hexagon::PredRegsRegClassID) { |
| 250 | // Handle instructions that have a prediate register in op0 |
| 251 | // (most cases of predicable instructions). |
| 252 | if (TargetRegisterInfo::isVirtualRegister(Reg0)) { |
| 253 | // Try to find in the map. |
| 254 | if (unsigned PeepholeSrc = PeepholeMap.lookup(Reg0)) { |
| 255 | // Change the 1st operand and, flip the opcode. |
| 256 | MI->getOperand(0).setReg(PeepholeSrc); |
| 257 | int NewOp = QII->getInvertedPredicatedOpcode(MI->getOpcode()); |
| 258 | MI->setDesc(QII->get(NewOp)); |
| 259 | Done = true; |
| 260 | } |
| 261 | } |
| 262 | } |
| 263 | } |
| 264 | |
| 265 | if (!Done) { |
| 266 | // Handle special instructions. |
| 267 | unsigned Op = MI->getOpcode(); |
| 268 | unsigned NewOp = 0; |
| 269 | unsigned PR = 1, S1 = 2, S2 = 3; // Operand indices. |
| 270 | |
| 271 | switch (Op) { |
Colin LeMahieu | e83bc74 | 2014-11-25 20:20:09 +0000 | [diff] [blame] | 272 | case Hexagon::C2_mux: |
Colin LeMahieu | 9665f98 | 2014-12-05 21:09:27 +0000 | [diff] [blame] | 273 | case Hexagon::C2_muxii: |
Colin LeMahieu | e83bc74 | 2014-11-25 20:20:09 +0000 | [diff] [blame] | 274 | case Hexagon::TFR_condset_ii: |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 275 | NewOp = Op; |
| 276 | break; |
| 277 | case Hexagon::TFR_condset_ri: |
| 278 | NewOp = Hexagon::TFR_condset_ir; |
| 279 | break; |
| 280 | case Hexagon::TFR_condset_ir: |
| 281 | NewOp = Hexagon::TFR_condset_ri; |
| 282 | break; |
Colin LeMahieu | 9665f98 | 2014-12-05 21:09:27 +0000 | [diff] [blame] | 283 | case Hexagon::C2_muxri: |
| 284 | NewOp = Hexagon::C2_muxir; |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 285 | break; |
Colin LeMahieu | 9665f98 | 2014-12-05 21:09:27 +0000 | [diff] [blame] | 286 | case Hexagon::C2_muxir: |
| 287 | NewOp = Hexagon::C2_muxri; |
Sirish Pande | 30804c2 | 2012-02-15 18:52:27 +0000 | [diff] [blame] | 288 | break; |
| 289 | } |
| 290 | if (NewOp) { |
| 291 | unsigned PSrc = MI->getOperand(PR).getReg(); |
| 292 | if (unsigned POrig = PeepholeMap.lookup(PSrc)) { |
| 293 | MI->getOperand(PR).setReg(POrig); |
| 294 | MI->setDesc(QII->get(NewOp)); |
| 295 | // Swap operands S1 and S2. |
| 296 | MachineOperand Op1 = MI->getOperand(S1); |
| 297 | MachineOperand Op2 = MI->getOperand(S2); |
| 298 | ChangeOpInto(MI->getOperand(S1), Op2); |
| 299 | ChangeOpInto(MI->getOperand(S2), Op1); |
| 300 | } |
| 301 | } // if (NewOp) |
| 302 | } // if (!Done) |
| 303 | |
| 304 | } // if (!DisablePNotP) |
| 305 | |
| 306 | } // Instruction |
| 307 | } // Basic Block |
| 308 | return true; |
| 309 | } |
| 310 | |
| 311 | void HexagonPeephole::ChangeOpInto(MachineOperand &Dst, MachineOperand &Src) { |
| 312 | assert (&Dst != &Src && "Cannot duplicate into itself"); |
| 313 | switch (Dst.getType()) { |
| 314 | case MachineOperand::MO_Register: |
| 315 | if (Src.isReg()) { |
| 316 | Dst.setReg(Src.getReg()); |
| 317 | } else if (Src.isImm()) { |
| 318 | Dst.ChangeToImmediate(Src.getImm()); |
| 319 | } else { |
| 320 | llvm_unreachable("Unexpected src operand type"); |
| 321 | } |
| 322 | break; |
| 323 | |
| 324 | case MachineOperand::MO_Immediate: |
| 325 | if (Src.isImm()) { |
| 326 | Dst.setImm(Src.getImm()); |
| 327 | } else if (Src.isReg()) { |
| 328 | Dst.ChangeToRegister(Src.getReg(), Src.isDef(), Src.isImplicit(), |
| 329 | Src.isKill(), Src.isDead(), Src.isUndef(), |
| 330 | Src.isDebug()); |
| 331 | } else { |
| 332 | llvm_unreachable("Unexpected src operand type"); |
| 333 | } |
| 334 | break; |
| 335 | |
| 336 | default: |
| 337 | llvm_unreachable("Unexpected dst operand type"); |
| 338 | break; |
| 339 | } |
| 340 | } |
| 341 | |
| 342 | FunctionPass *llvm::createHexagonPeephole() { |
| 343 | return new HexagonPeephole(); |
| 344 | } |