blob: c85d1e99705aeff3ab1b68970faae4004970611d [file] [log] [blame]
Anton Korobeynikov7aaf94b2009-11-03 01:04:26 +00001//===-- NEONMoveFix.cpp - Convert vfp reg-reg moves into neon ---*- C++ -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
10#define DEBUG_TYPE "neon-mov-fix"
11#include "ARM.h"
12#include "ARMMachineFunctionInfo.h"
13#include "ARMInstrInfo.h"
14#include "llvm/CodeGen/MachineInstr.h"
15#include "llvm/CodeGen/MachineInstrBuilder.h"
16#include "llvm/CodeGen/MachineFunctionPass.h"
17#include "llvm/ADT/Statistic.h"
18#include "llvm/Support/Debug.h"
19#include "llvm/Support/raw_ostream.h"
20using namespace llvm;
21
22STATISTIC(NumVMovs, "Number of reg-reg moves converted");
23
24namespace {
25 struct NEONMoveFixPass : public MachineFunctionPass {
26 static char ID;
Owen Anderson90c579d2010-08-06 18:33:48 +000027 NEONMoveFixPass() : MachineFunctionPass(ID) {}
Anton Korobeynikov7aaf94b2009-11-03 01:04:26 +000028
29 virtual bool runOnMachineFunction(MachineFunction &Fn);
30
31 virtual const char *getPassName() const {
32 return "NEON reg-reg move conversion";
33 }
34
35 private:
36 const TargetRegisterInfo *TRI;
37 const ARMBaseInstrInfo *TII;
Evan Cheng6557bce2011-02-22 19:53:14 +000038 bool isA8;
Anton Korobeynikov7aaf94b2009-11-03 01:04:26 +000039
40 typedef DenseMap<unsigned, const MachineInstr*> RegMap;
41
42 bool InsertMoves(MachineBasicBlock &MBB);
43 };
44 char NEONMoveFixPass::ID = 0;
45}
46
Evan Cheng6557bce2011-02-22 19:53:14 +000047static bool inNEONDomain(unsigned Domain, bool isA8) {
Evan Cheng2b943562011-02-23 02:35:33 +000048 return (Domain & ARMII::DomainNEON) ||
49 (isA8 && (Domain & ARMII::DomainNEONA8));
Evan Cheng6557bce2011-02-22 19:53:14 +000050}
51
Anton Korobeynikov7aaf94b2009-11-03 01:04:26 +000052bool NEONMoveFixPass::InsertMoves(MachineBasicBlock &MBB) {
53 RegMap Defs;
54 bool Modified = false;
55
56 // Walk over MBB tracking the def points of the registers.
57 MachineBasicBlock::iterator MII = MBB.begin(), E = MBB.end();
58 MachineBasicBlock::iterator NextMII;
59 for (; MII != E; MII = NextMII) {
Chris Lattner7896c9f2009-12-03 00:50:42 +000060 NextMII = llvm::next(MII);
Anton Korobeynikov7aaf94b2009-11-03 01:04:26 +000061 MachineInstr *MI = &*MII;
62
Jim Grosbache5165492009-11-09 00:11:35 +000063 if (MI->getOpcode() == ARM::VMOVD &&
Anton Korobeynikov7aaf94b2009-11-03 01:04:26 +000064 !TII->isPredicated(MI)) {
65 unsigned SrcReg = MI->getOperand(1).getReg();
Jim Grosbache5165492009-11-09 00:11:35 +000066 // If we do not find an instruction defining the reg, this means the
Anton Korobeynikov7aaf94b2009-11-03 01:04:26 +000067 // register should be live-in for this BB. It's always to better to use
68 // NEON reg-reg moves.
69 unsigned Domain = ARMII::DomainNEON;
70 RegMap::iterator DefMI = Defs.find(SrcReg);
71 if (DefMI != Defs.end()) {
72 Domain = DefMI->second->getDesc().TSFlags & ARMII::DomainMask;
73 // Instructions in general domain are subreg accesses.
74 // Map them to NEON reg-reg moves.
75 if (Domain == ARMII::DomainGeneral)
76 Domain = ARMII::DomainNEON;
77 }
78
Evan Cheng6557bce2011-02-22 19:53:14 +000079 if (inNEONDomain(Domain, isA8)) {
Owen Anderson43967a92011-07-15 18:46:47 +000080 // Convert VMOVD to VORRd
Anton Korobeynikov7aaf94b2009-11-03 01:04:26 +000081 unsigned DestReg = MI->getOperand(0).getReg();
82
83 DEBUG({errs() << "vmov convert: "; MI->dump();});
84
85 // It's safe to ignore imp-defs / imp-uses here, since:
86 // - We're running late, no intelligent condegen passes should be run
87 // afterwards
88 // - The imp-defs / imp-uses are superregs only, we don't care about
89 // them.
Evan Chengac0869d2009-11-21 06:21:52 +000090 AddDefaultPred(BuildMI(MBB, *MI, MI->getDebugLoc(),
Owen Anderson43967a92011-07-15 18:46:47 +000091 TII->get(ARM::VORRd), DestReg)
92 .addReg(SrcReg).addReg(SrcReg));
Anton Korobeynikov7aaf94b2009-11-03 01:04:26 +000093 MBB.erase(MI);
94 MachineBasicBlock::iterator I = prior(NextMII);
95 MI = &*I;
96
97 DEBUG({errs() << " into: "; MI->dump();});
98
99 Modified = true;
100 ++NumVMovs;
101 } else {
Anton Korobeynikov747409a2009-11-03 18:46:11 +0000102 assert((Domain & ARMII::DomainVFP) && "Invalid domain!");
Anton Korobeynikov7aaf94b2009-11-03 01:04:26 +0000103 // Do nothing.
104 }
105 }
106
107 // Update def information.
108 for (unsigned i = 0, e = MI->getNumOperands(); i != e; ++i) {
109 const MachineOperand& MO = MI->getOperand(i);
110 if (!MO.isReg() || !MO.isDef())
111 continue;
112 unsigned MOReg = MO.getReg();
113
114 Defs[MOReg] = MI;
Jakob Stoklund Olesenfca3a252010-07-06 23:26:23 +0000115 // Catch aliases as well.
116 for (const unsigned *R = TRI->getAliasSet(MOReg); *R; ++R)
Anton Korobeynikov7aaf94b2009-11-03 01:04:26 +0000117 Defs[*R] = MI;
118 }
119 }
120
121 return Modified;
122}
123
124bool NEONMoveFixPass::runOnMachineFunction(MachineFunction &Fn) {
125 ARMFunctionInfo *AFI = Fn.getInfo<ARMFunctionInfo>();
126 const TargetMachine &TM = Fn.getTarget();
127
Evan Cheng9c207ac2010-05-17 01:11:46 +0000128 if (AFI->isThumb1OnlyFunction())
Anton Korobeynikov7aaf94b2009-11-03 01:04:26 +0000129 return false;
130
131 TRI = TM.getRegisterInfo();
Anton Korobeynikov7aaf94b2009-11-03 01:04:26 +0000132 TII = static_cast<const ARMBaseInstrInfo*>(TM.getInstrInfo());
Evan Cheng6557bce2011-02-22 19:53:14 +0000133 isA8 = TM.getSubtarget<ARMSubtarget>().isCortexA8();
Anton Korobeynikov7aaf94b2009-11-03 01:04:26 +0000134
135 bool Modified = false;
136 for (MachineFunction::iterator MFI = Fn.begin(), E = Fn.end(); MFI != E;
137 ++MFI) {
138 MachineBasicBlock &MBB = *MFI;
139 Modified |= InsertMoves(MBB);
140 }
141
142 return Modified;
143}
144
145/// createNEONMoveFixPass - Returns an instance of the NEON reg-reg moves fix
146/// pass.
147FunctionPass *llvm::createNEONMoveFixPass() {
148 return new NEONMoveFixPass();
149}