Bob Wilson | 70cd88f | 2009-08-05 23:12:45 +0000 | [diff] [blame] | 1 | //===-- NEONPreAllocPass.cpp - Allocate adjacent NEON registers--*- C++ -*-===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | |
| 10 | #define DEBUG_TYPE "neon-prealloc" |
| 11 | #include "ARM.h" |
| 12 | #include "ARMInstrInfo.h" |
| 13 | #include "llvm/CodeGen/MachineInstr.h" |
| 14 | #include "llvm/CodeGen/MachineInstrBuilder.h" |
Evan Cheng | 826bdfa | 2010-05-04 20:38:12 +0000 | [diff] [blame] | 15 | #include "llvm/CodeGen/MachineRegisterInfo.h" |
Bob Wilson | 70cd88f | 2009-08-05 23:12:45 +0000 | [diff] [blame] | 16 | #include "llvm/CodeGen/MachineFunctionPass.h" |
| 17 | using namespace llvm; |
| 18 | |
| 19 | namespace { |
Nick Lewycky | 6726b6d | 2009-10-25 06:33:48 +0000 | [diff] [blame] | 20 | class NEONPreAllocPass : public MachineFunctionPass { |
Bob Wilson | 70cd88f | 2009-08-05 23:12:45 +0000 | [diff] [blame] | 21 | const TargetInstrInfo *TII; |
Evan Cheng | 826bdfa | 2010-05-04 20:38:12 +0000 | [diff] [blame] | 22 | MachineRegisterInfo *MRI; |
Bob Wilson | 70cd88f | 2009-08-05 23:12:45 +0000 | [diff] [blame] | 23 | |
| 24 | public: |
| 25 | static char ID; |
| 26 | NEONPreAllocPass() : MachineFunctionPass(&ID) {} |
| 27 | |
| 28 | virtual bool runOnMachineFunction(MachineFunction &MF); |
| 29 | |
| 30 | virtual const char *getPassName() const { |
| 31 | return "NEON register pre-allocation pass"; |
| 32 | } |
| 33 | |
| 34 | private: |
Evan Cheng | 826bdfa | 2010-05-04 20:38:12 +0000 | [diff] [blame] | 35 | bool FormsRegSequence(MachineInstr *MI, |
Evan Cheng | 5c6aba2 | 2010-05-14 18:54:59 +0000 | [diff] [blame] | 36 | unsigned FirstOpnd, unsigned NumRegs, |
| 37 | unsigned Offset, unsigned Stride) const; |
Bob Wilson | 70cd88f | 2009-08-05 23:12:45 +0000 | [diff] [blame] | 38 | bool PreAllocNEONRegisters(MachineBasicBlock &MBB); |
| 39 | }; |
| 40 | |
| 41 | char NEONPreAllocPass::ID = 0; |
| 42 | } |
| 43 | |
Bob Wilson | ff8952e | 2009-10-07 17:24:55 +0000 | [diff] [blame] | 44 | static bool isNEONMultiRegOp(int Opcode, unsigned &FirstOpnd, unsigned &NumRegs, |
| 45 | unsigned &Offset, unsigned &Stride) { |
| 46 | // Default to unit stride with no offset. |
| 47 | Stride = 1; |
| 48 | Offset = 0; |
| 49 | |
Bob Wilson | 70cd88f | 2009-08-05 23:12:45 +0000 | [diff] [blame] | 50 | switch (Opcode) { |
| 51 | default: |
| 52 | break; |
| 53 | |
Bob Wilson | 621f195 | 2010-03-23 05:25:43 +0000 | [diff] [blame] | 54 | case ARM::VLD1q8: |
| 55 | case ARM::VLD1q16: |
| 56 | case ARM::VLD1q32: |
| 57 | case ARM::VLD1q64: |
Bob Wilson | 70cd88f | 2009-08-05 23:12:45 +0000 | [diff] [blame] | 58 | case ARM::VLD2d8: |
| 59 | case ARM::VLD2d16: |
| 60 | case ARM::VLD2d32: |
Bob Wilson | 243fcc5 | 2009-09-01 04:26:28 +0000 | [diff] [blame] | 61 | case ARM::VLD2LNd8: |
| 62 | case ARM::VLD2LNd16: |
| 63 | case ARM::VLD2LNd32: |
Bob Wilson | 70cd88f | 2009-08-05 23:12:45 +0000 | [diff] [blame] | 64 | FirstOpnd = 0; |
| 65 | NumRegs = 2; |
| 66 | return true; |
| 67 | |
Bob Wilson | 0bf7d99 | 2009-10-08 22:27:33 +0000 | [diff] [blame] | 68 | case ARM::VLD2q8: |
| 69 | case ARM::VLD2q16: |
| 70 | case ARM::VLD2q32: |
| 71 | FirstOpnd = 0; |
| 72 | NumRegs = 4; |
| 73 | return true; |
| 74 | |
Bob Wilson | 95ffecd | 2010-03-20 18:35:24 +0000 | [diff] [blame] | 75 | case ARM::VLD2LNq16: |
| 76 | case ARM::VLD2LNq32: |
Bob Wilson | 30aea9d | 2009-10-08 18:56:10 +0000 | [diff] [blame] | 77 | FirstOpnd = 0; |
| 78 | NumRegs = 2; |
| 79 | Offset = 0; |
| 80 | Stride = 2; |
| 81 | return true; |
| 82 | |
Bob Wilson | 95ffecd | 2010-03-20 18:35:24 +0000 | [diff] [blame] | 83 | case ARM::VLD2LNq16odd: |
| 84 | case ARM::VLD2LNq32odd: |
Bob Wilson | 30aea9d | 2009-10-08 18:56:10 +0000 | [diff] [blame] | 85 | FirstOpnd = 0; |
| 86 | NumRegs = 2; |
| 87 | Offset = 1; |
| 88 | Stride = 2; |
| 89 | return true; |
| 90 | |
Bob Wilson | 70cd88f | 2009-08-05 23:12:45 +0000 | [diff] [blame] | 91 | case ARM::VLD3d8: |
| 92 | case ARM::VLD3d16: |
| 93 | case ARM::VLD3d32: |
Bob Wilson | a697975 | 2010-03-22 18:13:18 +0000 | [diff] [blame] | 94 | case ARM::VLD1d64T: |
Bob Wilson | 243fcc5 | 2009-09-01 04:26:28 +0000 | [diff] [blame] | 95 | case ARM::VLD3LNd8: |
| 96 | case ARM::VLD3LNd16: |
| 97 | case ARM::VLD3LNd32: |
Bob Wilson | 70cd88f | 2009-08-05 23:12:45 +0000 | [diff] [blame] | 98 | FirstOpnd = 0; |
| 99 | NumRegs = 3; |
| 100 | return true; |
| 101 | |
Bob Wilson | 95ffecd | 2010-03-20 18:35:24 +0000 | [diff] [blame] | 102 | case ARM::VLD3q8_UPD: |
| 103 | case ARM::VLD3q16_UPD: |
| 104 | case ARM::VLD3q32_UPD: |
Bob Wilson | ff8952e | 2009-10-07 17:24:55 +0000 | [diff] [blame] | 105 | FirstOpnd = 0; |
| 106 | NumRegs = 3; |
| 107 | Offset = 0; |
| 108 | Stride = 2; |
| 109 | return true; |
| 110 | |
Bob Wilson | 95ffecd | 2010-03-20 18:35:24 +0000 | [diff] [blame] | 111 | case ARM::VLD3q8odd_UPD: |
| 112 | case ARM::VLD3q16odd_UPD: |
| 113 | case ARM::VLD3q32odd_UPD: |
Bob Wilson | ff8952e | 2009-10-07 17:24:55 +0000 | [diff] [blame] | 114 | FirstOpnd = 0; |
| 115 | NumRegs = 3; |
| 116 | Offset = 1; |
| 117 | Stride = 2; |
| 118 | return true; |
| 119 | |
Bob Wilson | 95ffecd | 2010-03-20 18:35:24 +0000 | [diff] [blame] | 120 | case ARM::VLD3LNq16: |
| 121 | case ARM::VLD3LNq32: |
Bob Wilson | 0bf7d99 | 2009-10-08 22:27:33 +0000 | [diff] [blame] | 122 | FirstOpnd = 0; |
| 123 | NumRegs = 3; |
| 124 | Offset = 0; |
| 125 | Stride = 2; |
| 126 | return true; |
| 127 | |
Bob Wilson | 95ffecd | 2010-03-20 18:35:24 +0000 | [diff] [blame] | 128 | case ARM::VLD3LNq16odd: |
| 129 | case ARM::VLD3LNq32odd: |
Bob Wilson | 0bf7d99 | 2009-10-08 22:27:33 +0000 | [diff] [blame] | 130 | FirstOpnd = 0; |
| 131 | NumRegs = 3; |
| 132 | Offset = 1; |
| 133 | Stride = 2; |
| 134 | return true; |
| 135 | |
Bob Wilson | 70cd88f | 2009-08-05 23:12:45 +0000 | [diff] [blame] | 136 | case ARM::VLD4d8: |
| 137 | case ARM::VLD4d16: |
| 138 | case ARM::VLD4d32: |
Bob Wilson | a697975 | 2010-03-22 18:13:18 +0000 | [diff] [blame] | 139 | case ARM::VLD1d64Q: |
Bob Wilson | 243fcc5 | 2009-09-01 04:26:28 +0000 | [diff] [blame] | 140 | case ARM::VLD4LNd8: |
| 141 | case ARM::VLD4LNd16: |
| 142 | case ARM::VLD4LNd32: |
Bob Wilson | 70cd88f | 2009-08-05 23:12:45 +0000 | [diff] [blame] | 143 | FirstOpnd = 0; |
| 144 | NumRegs = 4; |
| 145 | return true; |
Bob Wilson | b36ec86 | 2009-08-06 18:47:44 +0000 | [diff] [blame] | 146 | |
Bob Wilson | 95ffecd | 2010-03-20 18:35:24 +0000 | [diff] [blame] | 147 | case ARM::VLD4q8_UPD: |
| 148 | case ARM::VLD4q16_UPD: |
| 149 | case ARM::VLD4q32_UPD: |
Bob Wilson | 7708c22 | 2009-10-07 18:09:32 +0000 | [diff] [blame] | 150 | FirstOpnd = 0; |
| 151 | NumRegs = 4; |
| 152 | Offset = 0; |
| 153 | Stride = 2; |
| 154 | return true; |
| 155 | |
Bob Wilson | 95ffecd | 2010-03-20 18:35:24 +0000 | [diff] [blame] | 156 | case ARM::VLD4q8odd_UPD: |
| 157 | case ARM::VLD4q16odd_UPD: |
| 158 | case ARM::VLD4q32odd_UPD: |
Bob Wilson | 7708c22 | 2009-10-07 18:09:32 +0000 | [diff] [blame] | 159 | FirstOpnd = 0; |
| 160 | NumRegs = 4; |
| 161 | Offset = 1; |
| 162 | Stride = 2; |
| 163 | return true; |
| 164 | |
Bob Wilson | 95ffecd | 2010-03-20 18:35:24 +0000 | [diff] [blame] | 165 | case ARM::VLD4LNq16: |
| 166 | case ARM::VLD4LNq32: |
Bob Wilson | 62e053e | 2009-10-08 22:53:57 +0000 | [diff] [blame] | 167 | FirstOpnd = 0; |
| 168 | NumRegs = 4; |
| 169 | Offset = 0; |
| 170 | Stride = 2; |
| 171 | return true; |
| 172 | |
Bob Wilson | 95ffecd | 2010-03-20 18:35:24 +0000 | [diff] [blame] | 173 | case ARM::VLD4LNq16odd: |
| 174 | case ARM::VLD4LNq32odd: |
Bob Wilson | 62e053e | 2009-10-08 22:53:57 +0000 | [diff] [blame] | 175 | FirstOpnd = 0; |
| 176 | NumRegs = 4; |
| 177 | Offset = 1; |
| 178 | Stride = 2; |
| 179 | return true; |
| 180 | |
Bob Wilson | 11d9899 | 2010-03-23 06:20:33 +0000 | [diff] [blame] | 181 | case ARM::VST1q8: |
| 182 | case ARM::VST1q16: |
| 183 | case ARM::VST1q32: |
| 184 | case ARM::VST1q64: |
Bob Wilson | b36ec86 | 2009-08-06 18:47:44 +0000 | [diff] [blame] | 185 | case ARM::VST2d8: |
| 186 | case ARM::VST2d16: |
| 187 | case ARM::VST2d32: |
Bob Wilson | 8a3198b | 2009-09-01 18:51:56 +0000 | [diff] [blame] | 188 | case ARM::VST2LNd8: |
| 189 | case ARM::VST2LNd16: |
| 190 | case ARM::VST2LNd32: |
Bob Wilson | 226036e | 2010-03-20 22:13:40 +0000 | [diff] [blame] | 191 | FirstOpnd = 2; |
Bob Wilson | b36ec86 | 2009-08-06 18:47:44 +0000 | [diff] [blame] | 192 | NumRegs = 2; |
| 193 | return true; |
| 194 | |
Bob Wilson | d285575 | 2009-10-07 18:47:39 +0000 | [diff] [blame] | 195 | case ARM::VST2q8: |
| 196 | case ARM::VST2q16: |
| 197 | case ARM::VST2q32: |
Bob Wilson | 226036e | 2010-03-20 22:13:40 +0000 | [diff] [blame] | 198 | FirstOpnd = 2; |
Bob Wilson | d285575 | 2009-10-07 18:47:39 +0000 | [diff] [blame] | 199 | NumRegs = 4; |
| 200 | return true; |
| 201 | |
Bob Wilson | 95ffecd | 2010-03-20 18:35:24 +0000 | [diff] [blame] | 202 | case ARM::VST2LNq16: |
| 203 | case ARM::VST2LNq32: |
Bob Wilson | 226036e | 2010-03-20 22:13:40 +0000 | [diff] [blame] | 204 | FirstOpnd = 2; |
Bob Wilson | c5c6edb | 2009-10-08 23:38:24 +0000 | [diff] [blame] | 205 | NumRegs = 2; |
| 206 | Offset = 0; |
| 207 | Stride = 2; |
| 208 | return true; |
| 209 | |
Bob Wilson | 95ffecd | 2010-03-20 18:35:24 +0000 | [diff] [blame] | 210 | case ARM::VST2LNq16odd: |
| 211 | case ARM::VST2LNq32odd: |
Bob Wilson | 226036e | 2010-03-20 22:13:40 +0000 | [diff] [blame] | 212 | FirstOpnd = 2; |
Bob Wilson | c5c6edb | 2009-10-08 23:38:24 +0000 | [diff] [blame] | 213 | NumRegs = 2; |
| 214 | Offset = 1; |
| 215 | Stride = 2; |
| 216 | return true; |
| 217 | |
Bob Wilson | b36ec86 | 2009-08-06 18:47:44 +0000 | [diff] [blame] | 218 | case ARM::VST3d8: |
| 219 | case ARM::VST3d16: |
| 220 | case ARM::VST3d32: |
Bob Wilson | a697975 | 2010-03-22 18:13:18 +0000 | [diff] [blame] | 221 | case ARM::VST1d64T: |
Bob Wilson | 8a3198b | 2009-09-01 18:51:56 +0000 | [diff] [blame] | 222 | case ARM::VST3LNd8: |
| 223 | case ARM::VST3LNd16: |
| 224 | case ARM::VST3LNd32: |
Bob Wilson | 226036e | 2010-03-20 22:13:40 +0000 | [diff] [blame] | 225 | FirstOpnd = 2; |
Bob Wilson | b36ec86 | 2009-08-06 18:47:44 +0000 | [diff] [blame] | 226 | NumRegs = 3; |
| 227 | return true; |
| 228 | |
Bob Wilson | 95ffecd | 2010-03-20 18:35:24 +0000 | [diff] [blame] | 229 | case ARM::VST3q8_UPD: |
| 230 | case ARM::VST3q16_UPD: |
| 231 | case ARM::VST3q32_UPD: |
Bob Wilson | 226036e | 2010-03-20 22:13:40 +0000 | [diff] [blame] | 232 | FirstOpnd = 4; |
Bob Wilson | 66a7063 | 2009-10-07 20:30:08 +0000 | [diff] [blame] | 233 | NumRegs = 3; |
| 234 | Offset = 0; |
| 235 | Stride = 2; |
| 236 | return true; |
| 237 | |
Bob Wilson | 95ffecd | 2010-03-20 18:35:24 +0000 | [diff] [blame] | 238 | case ARM::VST3q8odd_UPD: |
| 239 | case ARM::VST3q16odd_UPD: |
| 240 | case ARM::VST3q32odd_UPD: |
Bob Wilson | 226036e | 2010-03-20 22:13:40 +0000 | [diff] [blame] | 241 | FirstOpnd = 4; |
Bob Wilson | 66a7063 | 2009-10-07 20:30:08 +0000 | [diff] [blame] | 242 | NumRegs = 3; |
| 243 | Offset = 1; |
| 244 | Stride = 2; |
| 245 | return true; |
| 246 | |
Bob Wilson | 95ffecd | 2010-03-20 18:35:24 +0000 | [diff] [blame] | 247 | case ARM::VST3LNq16: |
| 248 | case ARM::VST3LNq32: |
Bob Wilson | 226036e | 2010-03-20 22:13:40 +0000 | [diff] [blame] | 249 | FirstOpnd = 2; |
Bob Wilson | 8cdb269 | 2009-10-08 23:51:31 +0000 | [diff] [blame] | 250 | NumRegs = 3; |
| 251 | Offset = 0; |
| 252 | Stride = 2; |
| 253 | return true; |
| 254 | |
Bob Wilson | 95ffecd | 2010-03-20 18:35:24 +0000 | [diff] [blame] | 255 | case ARM::VST3LNq16odd: |
| 256 | case ARM::VST3LNq32odd: |
Bob Wilson | 226036e | 2010-03-20 22:13:40 +0000 | [diff] [blame] | 257 | FirstOpnd = 2; |
Bob Wilson | 8cdb269 | 2009-10-08 23:51:31 +0000 | [diff] [blame] | 258 | NumRegs = 3; |
| 259 | Offset = 1; |
| 260 | Stride = 2; |
| 261 | return true; |
| 262 | |
Bob Wilson | b36ec86 | 2009-08-06 18:47:44 +0000 | [diff] [blame] | 263 | case ARM::VST4d8: |
| 264 | case ARM::VST4d16: |
| 265 | case ARM::VST4d32: |
Bob Wilson | a697975 | 2010-03-22 18:13:18 +0000 | [diff] [blame] | 266 | case ARM::VST1d64Q: |
Bob Wilson | 8a3198b | 2009-09-01 18:51:56 +0000 | [diff] [blame] | 267 | case ARM::VST4LNd8: |
| 268 | case ARM::VST4LNd16: |
| 269 | case ARM::VST4LNd32: |
Bob Wilson | 226036e | 2010-03-20 22:13:40 +0000 | [diff] [blame] | 270 | FirstOpnd = 2; |
Bob Wilson | b36ec86 | 2009-08-06 18:47:44 +0000 | [diff] [blame] | 271 | NumRegs = 4; |
| 272 | return true; |
Bob Wilson | 114a266 | 2009-08-12 20:51:55 +0000 | [diff] [blame] | 273 | |
Bob Wilson | 95ffecd | 2010-03-20 18:35:24 +0000 | [diff] [blame] | 274 | case ARM::VST4q8_UPD: |
| 275 | case ARM::VST4q16_UPD: |
| 276 | case ARM::VST4q32_UPD: |
Bob Wilson | 226036e | 2010-03-20 22:13:40 +0000 | [diff] [blame] | 277 | FirstOpnd = 4; |
Bob Wilson | 63c9063 | 2009-10-07 20:49:18 +0000 | [diff] [blame] | 278 | NumRegs = 4; |
| 279 | Offset = 0; |
| 280 | Stride = 2; |
| 281 | return true; |
| 282 | |
Bob Wilson | 95ffecd | 2010-03-20 18:35:24 +0000 | [diff] [blame] | 283 | case ARM::VST4q8odd_UPD: |
| 284 | case ARM::VST4q16odd_UPD: |
| 285 | case ARM::VST4q32odd_UPD: |
Bob Wilson | 226036e | 2010-03-20 22:13:40 +0000 | [diff] [blame] | 286 | FirstOpnd = 4; |
Bob Wilson | 63c9063 | 2009-10-07 20:49:18 +0000 | [diff] [blame] | 287 | NumRegs = 4; |
| 288 | Offset = 1; |
| 289 | Stride = 2; |
| 290 | return true; |
| 291 | |
Bob Wilson | 95ffecd | 2010-03-20 18:35:24 +0000 | [diff] [blame] | 292 | case ARM::VST4LNq16: |
| 293 | case ARM::VST4LNq32: |
Bob Wilson | 226036e | 2010-03-20 22:13:40 +0000 | [diff] [blame] | 294 | FirstOpnd = 2; |
Bob Wilson | 5631139 | 2009-10-09 00:01:36 +0000 | [diff] [blame] | 295 | NumRegs = 4; |
| 296 | Offset = 0; |
| 297 | Stride = 2; |
| 298 | return true; |
| 299 | |
Bob Wilson | 95ffecd | 2010-03-20 18:35:24 +0000 | [diff] [blame] | 300 | case ARM::VST4LNq16odd: |
| 301 | case ARM::VST4LNq32odd: |
Bob Wilson | 226036e | 2010-03-20 22:13:40 +0000 | [diff] [blame] | 302 | FirstOpnd = 2; |
Bob Wilson | 5631139 | 2009-10-09 00:01:36 +0000 | [diff] [blame] | 303 | NumRegs = 4; |
| 304 | Offset = 1; |
| 305 | Stride = 2; |
| 306 | return true; |
| 307 | |
Bob Wilson | 114a266 | 2009-08-12 20:51:55 +0000 | [diff] [blame] | 308 | case ARM::VTBL2: |
| 309 | FirstOpnd = 1; |
| 310 | NumRegs = 2; |
| 311 | return true; |
| 312 | |
| 313 | case ARM::VTBL3: |
| 314 | FirstOpnd = 1; |
| 315 | NumRegs = 3; |
| 316 | return true; |
| 317 | |
| 318 | case ARM::VTBL4: |
| 319 | FirstOpnd = 1; |
| 320 | NumRegs = 4; |
| 321 | return true; |
| 322 | |
| 323 | case ARM::VTBX2: |
| 324 | FirstOpnd = 2; |
| 325 | NumRegs = 2; |
| 326 | return true; |
| 327 | |
| 328 | case ARM::VTBX3: |
| 329 | FirstOpnd = 2; |
| 330 | NumRegs = 3; |
| 331 | return true; |
| 332 | |
| 333 | case ARM::VTBX4: |
| 334 | FirstOpnd = 2; |
| 335 | NumRegs = 4; |
| 336 | return true; |
Bob Wilson | 70cd88f | 2009-08-05 23:12:45 +0000 | [diff] [blame] | 337 | } |
| 338 | |
| 339 | return false; |
| 340 | } |
| 341 | |
Evan Cheng | e9e2ba0 | 2010-05-10 21:26:24 +0000 | [diff] [blame] | 342 | bool |
| 343 | NEONPreAllocPass::FormsRegSequence(MachineInstr *MI, |
Evan Cheng | 5c6aba2 | 2010-05-14 18:54:59 +0000 | [diff] [blame] | 344 | unsigned FirstOpnd, unsigned NumRegs, |
| 345 | unsigned Offset, unsigned Stride) const { |
Evan Cheng | e9e2ba0 | 2010-05-10 21:26:24 +0000 | [diff] [blame] | 346 | MachineOperand &FMO = MI->getOperand(FirstOpnd); |
| 347 | assert(FMO.isReg() && FMO.getSubReg() == 0 && "unexpected operand"); |
| 348 | unsigned VirtReg = FMO.getReg(); |
Daniel Dunbar | 1860e7d | 2010-05-13 03:19:36 +0000 | [diff] [blame] | 349 | (void)VirtReg; |
Evan Cheng | e9e2ba0 | 2010-05-10 21:26:24 +0000 | [diff] [blame] | 350 | assert(TargetRegisterInfo::isVirtualRegister(VirtReg) && |
| 351 | "expected a virtual register"); |
Evan Cheng | 5c6aba2 | 2010-05-14 18:54:59 +0000 | [diff] [blame] | 352 | |
| 353 | unsigned LastSubIdx = 0; |
Evan Cheng | e9e2ba0 | 2010-05-10 21:26:24 +0000 | [diff] [blame] | 354 | if (FMO.isDef()) { |
| 355 | MachineInstr *RegSeq = 0; |
| 356 | for (unsigned R = 0; R < NumRegs; ++R) { |
| 357 | const MachineOperand &MO = MI->getOperand(FirstOpnd + R); |
| 358 | assert(MO.isReg() && MO.getSubReg() == 0 && "unexpected operand"); |
| 359 | unsigned VirtReg = MO.getReg(); |
| 360 | assert(TargetRegisterInfo::isVirtualRegister(VirtReg) && |
| 361 | "expected a virtual register"); |
Evan Cheng | 676b2df | 2010-05-05 22:15:40 +0000 | [diff] [blame] | 362 | // Feeding into a REG_SEQUENCE. |
| 363 | if (!MRI->hasOneNonDBGUse(VirtReg)) |
| 364 | return false; |
| 365 | MachineInstr *UseMI = &*MRI->use_nodbg_begin(VirtReg); |
| 366 | if (!UseMI->isRegSequence()) |
| 367 | return false; |
| 368 | if (RegSeq && RegSeq != UseMI) |
| 369 | return false; |
Evan Cheng | 5c6aba2 | 2010-05-14 18:54:59 +0000 | [diff] [blame] | 370 | unsigned OpIdx = 1 + (Offset + R * Stride) * 2; |
| 371 | if (UseMI->getOperand(OpIdx).getReg() != VirtReg) |
| 372 | llvm_unreachable("Malformed REG_SEQUENCE instruction!"); |
| 373 | unsigned SubIdx = UseMI->getOperand(OpIdx + 1).getImm(); |
| 374 | if (LastSubIdx) { |
| 375 | if (LastSubIdx != SubIdx-Stride) |
| 376 | return false; |
| 377 | } else { |
Jakob Stoklund Olesen | 558661d | 2010-05-24 16:54:32 +0000 | [diff] [blame] | 378 | // Must start from dsub_0 or qsub_0. |
| 379 | if (SubIdx != (ARM::dsub_0+Offset) && |
| 380 | SubIdx != (ARM::qsub_0+Offset)) |
Evan Cheng | 5c6aba2 | 2010-05-14 18:54:59 +0000 | [diff] [blame] | 381 | return false; |
| 382 | } |
Evan Cheng | 676b2df | 2010-05-05 22:15:40 +0000 | [diff] [blame] | 383 | RegSeq = UseMI; |
Evan Cheng | 5c6aba2 | 2010-05-14 18:54:59 +0000 | [diff] [blame] | 384 | LastSubIdx = SubIdx; |
Evan Cheng | 676b2df | 2010-05-05 22:15:40 +0000 | [diff] [blame] | 385 | } |
Evan Cheng | e9e2ba0 | 2010-05-10 21:26:24 +0000 | [diff] [blame] | 386 | |
Evan Cheng | 5c6aba2 | 2010-05-14 18:54:59 +0000 | [diff] [blame] | 387 | // In the case of vld3, etc., make sure the trailing operand of |
| 388 | // REG_SEQUENCE is an undef. |
| 389 | if (NumRegs == 3) { |
| 390 | unsigned OpIdx = 1 + (Offset + 3 * Stride) * 2; |
| 391 | const MachineOperand &MO = RegSeq->getOperand(OpIdx); |
Evan Cheng | e9e2ba0 | 2010-05-10 21:26:24 +0000 | [diff] [blame] | 392 | unsigned VirtReg = MO.getReg(); |
| 393 | MachineInstr *DefMI = MRI->getVRegDef(VirtReg); |
| 394 | if (!DefMI || !DefMI->isImplicitDef()) |
| 395 | return false; |
| 396 | } |
| 397 | return true; |
| 398 | } |
| 399 | |
| 400 | unsigned LastSrcReg = 0; |
Evan Cheng | 5bdc2aa | 2010-05-12 01:42:50 +0000 | [diff] [blame] | 401 | SmallVector<unsigned, 4> SubIds; |
Evan Cheng | e9e2ba0 | 2010-05-10 21:26:24 +0000 | [diff] [blame] | 402 | for (unsigned R = 0; R < NumRegs; ++R) { |
| 403 | const MachineOperand &MO = MI->getOperand(FirstOpnd + R); |
| 404 | assert(MO.isReg() && MO.getSubReg() == 0 && "unexpected operand"); |
| 405 | unsigned VirtReg = MO.getReg(); |
| 406 | assert(TargetRegisterInfo::isVirtualRegister(VirtReg) && |
| 407 | "expected a virtual register"); |
| 408 | // Extracting from a Q or QQ register. |
| 409 | MachineInstr *DefMI = MRI->getVRegDef(VirtReg); |
Jakob Stoklund Olesen | 0bc25f4 | 2010-07-08 16:40:22 +0000 | [diff] [blame] | 410 | if (!DefMI || !DefMI->isCopy() || !DefMI->getOperand(1).getSubReg()) |
Evan Cheng | e9e2ba0 | 2010-05-10 21:26:24 +0000 | [diff] [blame] | 411 | return false; |
| 412 | VirtReg = DefMI->getOperand(1).getReg(); |
| 413 | if (LastSrcReg && LastSrcReg != VirtReg) |
| 414 | return false; |
Evan Cheng | 0ce537a | 2010-05-11 01:19:40 +0000 | [diff] [blame] | 415 | LastSrcReg = VirtReg; |
Evan Cheng | e9e2ba0 | 2010-05-10 21:26:24 +0000 | [diff] [blame] | 416 | const TargetRegisterClass *RC = MRI->getRegClass(VirtReg); |
Evan Cheng | b990a2f | 2010-05-14 23:21:14 +0000 | [diff] [blame] | 417 | if (RC != ARM::QPRRegisterClass && |
| 418 | RC != ARM::QQPRRegisterClass && |
| 419 | RC != ARM::QQQQPRRegisterClass) |
Evan Cheng | e9e2ba0 | 2010-05-10 21:26:24 +0000 | [diff] [blame] | 420 | return false; |
Jakob Stoklund Olesen | 0bc25f4 | 2010-07-08 16:40:22 +0000 | [diff] [blame] | 421 | unsigned SubIdx = DefMI->getOperand(1).getSubReg(); |
Evan Cheng | 0ce537a | 2010-05-11 01:19:40 +0000 | [diff] [blame] | 422 | if (LastSubIdx) { |
Evan Cheng | 5c6aba2 | 2010-05-14 18:54:59 +0000 | [diff] [blame] | 423 | if (LastSubIdx != SubIdx-Stride) |
Evan Cheng | 0ce537a | 2010-05-11 01:19:40 +0000 | [diff] [blame] | 424 | return false; |
| 425 | } else { |
Jakob Stoklund Olesen | 558661d | 2010-05-24 16:54:32 +0000 | [diff] [blame] | 426 | // Must start from dsub_0 or qsub_0. |
| 427 | if (SubIdx != (ARM::dsub_0+Offset) && |
| 428 | SubIdx != (ARM::qsub_0+Offset)) |
Evan Cheng | 0ce537a | 2010-05-11 01:19:40 +0000 | [diff] [blame] | 429 | return false; |
| 430 | } |
Evan Cheng | 5bdc2aa | 2010-05-12 01:42:50 +0000 | [diff] [blame] | 431 | SubIds.push_back(SubIdx); |
Evan Cheng | e9e2ba0 | 2010-05-10 21:26:24 +0000 | [diff] [blame] | 432 | LastSubIdx = SubIdx; |
Evan Cheng | 826bdfa | 2010-05-04 20:38:12 +0000 | [diff] [blame] | 433 | } |
Evan Cheng | 5bdc2aa | 2010-05-12 01:42:50 +0000 | [diff] [blame] | 434 | |
| 435 | // FIXME: Update the uses of EXTRACT_SUBREG from REG_SEQUENCE is |
| 436 | // currently required for correctness. e.g. |
Bob Wilson | dd726e5 | 2010-06-08 00:42:08 +0000 | [diff] [blame] | 437 | // %reg1041<def> = REG_SEQUENCE %reg1040<kill>, 5, %reg1035<kill>, 6 |
Evan Cheng | 5bdc2aa | 2010-05-12 01:42:50 +0000 | [diff] [blame] | 438 | // %reg1042<def> = EXTRACT_SUBREG %reg1041, 6 |
| 439 | // %reg1043<def> = EXTRACT_SUBREG %reg1041, 5 |
| 440 | // VST1q16 %reg1025<kill>, 0, %reg1043<kill>, %reg1042<kill>, |
Bob Wilson | dd726e5 | 2010-06-08 00:42:08 +0000 | [diff] [blame] | 441 | // reg1042 and reg1043 should be replaced with reg1041:6 and reg1041:5 |
Evan Cheng | 5bdc2aa | 2010-05-12 01:42:50 +0000 | [diff] [blame] | 442 | // respectively. |
| 443 | // We need to change how we model uses of REG_SEQUENCE. |
| 444 | for (unsigned R = 0; R < NumRegs; ++R) { |
| 445 | MachineOperand &MO = MI->getOperand(FirstOpnd + R); |
| 446 | unsigned OldReg = MO.getReg(); |
| 447 | MachineInstr *DefMI = MRI->getVRegDef(OldReg); |
Jakob Stoklund Olesen | 0bc25f4 | 2010-07-08 16:40:22 +0000 | [diff] [blame] | 448 | assert(DefMI->isCopy()); |
Evan Cheng | 5bdc2aa | 2010-05-12 01:42:50 +0000 | [diff] [blame] | 449 | MO.setReg(LastSrcReg); |
| 450 | MO.setSubReg(SubIds[R]); |
Jakob Stoklund Olesen | a2846b4 | 2010-06-16 22:11:08 +0000 | [diff] [blame] | 451 | MO.setIsKill(false); |
Evan Cheng | 5bdc2aa | 2010-05-12 01:42:50 +0000 | [diff] [blame] | 452 | // Delete the EXTRACT_SUBREG if its result is now dead. |
| 453 | if (MRI->use_empty(OldReg)) |
| 454 | DefMI->eraseFromParent(); |
| 455 | } |
| 456 | |
Evan Cheng | 826bdfa | 2010-05-04 20:38:12 +0000 | [diff] [blame] | 457 | return true; |
| 458 | } |
| 459 | |
Bob Wilson | 70cd88f | 2009-08-05 23:12:45 +0000 | [diff] [blame] | 460 | bool NEONPreAllocPass::PreAllocNEONRegisters(MachineBasicBlock &MBB) { |
| 461 | bool Modified = false; |
| 462 | |
| 463 | MachineBasicBlock::iterator MBBI = MBB.begin(), E = MBB.end(); |
| 464 | for (; MBBI != E; ++MBBI) { |
| 465 | MachineInstr *MI = &*MBBI; |
Bob Wilson | ff8952e | 2009-10-07 17:24:55 +0000 | [diff] [blame] | 466 | unsigned FirstOpnd, NumRegs, Offset, Stride; |
| 467 | if (!isNEONMultiRegOp(MI->getOpcode(), FirstOpnd, NumRegs, Offset, Stride)) |
Bob Wilson | 70cd88f | 2009-08-05 23:12:45 +0000 | [diff] [blame] | 468 | continue; |
Bob Wilson | 07f6e80 | 2010-06-16 21:34:01 +0000 | [diff] [blame] | 469 | if (FormsRegSequence(MI, FirstOpnd, NumRegs, Offset, Stride)) |
Evan Cheng | 826bdfa | 2010-05-04 20:38:12 +0000 | [diff] [blame] | 470 | continue; |
Bob Wilson | 70cd88f | 2009-08-05 23:12:45 +0000 | [diff] [blame] | 471 | |
Chris Lattner | 7896c9f | 2009-12-03 00:50:42 +0000 | [diff] [blame] | 472 | MachineBasicBlock::iterator NextI = llvm::next(MBBI); |
Bob Wilson | 70cd88f | 2009-08-05 23:12:45 +0000 | [diff] [blame] | 473 | for (unsigned R = 0; R < NumRegs; ++R) { |
| 474 | MachineOperand &MO = MI->getOperand(FirstOpnd + R); |
| 475 | assert(MO.isReg() && MO.getSubReg() == 0 && "unexpected operand"); |
| 476 | unsigned VirtReg = MO.getReg(); |
| 477 | assert(TargetRegisterInfo::isVirtualRegister(VirtReg) && |
| 478 | "expected a virtual register"); |
| 479 | |
| 480 | // For now, just assign a fixed set of adjacent registers. |
| 481 | // This leaves plenty of room for future improvements. |
| 482 | static const unsigned NEONDRegs[] = { |
Bob Wilson | ff8952e | 2009-10-07 17:24:55 +0000 | [diff] [blame] | 483 | ARM::D0, ARM::D1, ARM::D2, ARM::D3, |
| 484 | ARM::D4, ARM::D5, ARM::D6, ARM::D7 |
Bob Wilson | 70cd88f | 2009-08-05 23:12:45 +0000 | [diff] [blame] | 485 | }; |
Bob Wilson | ff8952e | 2009-10-07 17:24:55 +0000 | [diff] [blame] | 486 | MO.setReg(NEONDRegs[Offset + R * Stride]); |
Bob Wilson | 70cd88f | 2009-08-05 23:12:45 +0000 | [diff] [blame] | 487 | |
| 488 | if (MO.isUse()) { |
| 489 | // Insert a copy from VirtReg. |
Bob Wilson | 349d82d | 2009-10-06 22:01:15 +0000 | [diff] [blame] | 490 | TII->copyRegToReg(MBB, MBBI, MO.getReg(), VirtReg, |
Dan Gohman | 34dcc6f | 2010-05-06 20:33:48 +0000 | [diff] [blame] | 491 | ARM::DPRRegisterClass, ARM::DPRRegisterClass, |
| 492 | DebugLoc()); |
Bob Wilson | 70cd88f | 2009-08-05 23:12:45 +0000 | [diff] [blame] | 493 | if (MO.isKill()) { |
| 494 | MachineInstr *CopyMI = prior(MBBI); |
| 495 | CopyMI->findRegisterUseOperand(VirtReg)->setIsKill(); |
| 496 | } |
| 497 | MO.setIsKill(); |
| 498 | } else if (MO.isDef() && !MO.isDead()) { |
| 499 | // Add a copy to VirtReg. |
Bob Wilson | 349d82d | 2009-10-06 22:01:15 +0000 | [diff] [blame] | 500 | TII->copyRegToReg(MBB, NextI, VirtReg, MO.getReg(), |
Dan Gohman | 34dcc6f | 2010-05-06 20:33:48 +0000 | [diff] [blame] | 501 | ARM::DPRRegisterClass, ARM::DPRRegisterClass, |
| 502 | DebugLoc()); |
Bob Wilson | 70cd88f | 2009-08-05 23:12:45 +0000 | [diff] [blame] | 503 | } |
| 504 | } |
| 505 | } |
| 506 | |
| 507 | return Modified; |
| 508 | } |
| 509 | |
| 510 | bool NEONPreAllocPass::runOnMachineFunction(MachineFunction &MF) { |
| 511 | TII = MF.getTarget().getInstrInfo(); |
Evan Cheng | 826bdfa | 2010-05-04 20:38:12 +0000 | [diff] [blame] | 512 | MRI = &MF.getRegInfo(); |
Bob Wilson | 70cd88f | 2009-08-05 23:12:45 +0000 | [diff] [blame] | 513 | |
| 514 | bool Modified = false; |
| 515 | for (MachineFunction::iterator MFI = MF.begin(), E = MF.end(); MFI != E; |
| 516 | ++MFI) { |
| 517 | MachineBasicBlock &MBB = *MFI; |
| 518 | Modified |= PreAllocNEONRegisters(MBB); |
| 519 | } |
| 520 | |
| 521 | return Modified; |
| 522 | } |
| 523 | |
| 524 | /// createNEONPreAllocPass - returns an instance of the NEON register |
| 525 | /// pre-allocation pass. |
| 526 | FunctionPass *llvm::createNEONPreAllocPass() { |
| 527 | return new NEONPreAllocPass(); |
| 528 | } |