blob: 7e1ce429ef7d29e4dc22289807df806a7a1150b6 [file] [log] [blame]
Chris Lattner1c08c712005-01-07 07:47:53 +00001//===-- SelectionDAGISel.cpp - Implement the SelectionDAGISel class -------===//
Misha Brukmanedf128a2005-04-21 22:36:52 +00002//
Chris Lattner1c08c712005-01-07 07:47:53 +00003// The LLVM Compiler Infrastructure
4//
Chris Lattner4ee451d2007-12-29 20:36:04 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Misha Brukmanedf128a2005-04-21 22:36:52 +00007//
Chris Lattner1c08c712005-01-07 07:47:53 +00008//===----------------------------------------------------------------------===//
9//
10// This implements the SelectionDAGISel class.
11//
12//===----------------------------------------------------------------------===//
13
14#define DEBUG_TYPE "isel"
Dan Gohman84fbac52009-02-06 17:22:58 +000015#include "ScheduleDAGSDNodes.h"
Dan Gohman2048b852009-11-23 18:04:58 +000016#include "SelectionDAGBuilder.h"
Dan Gohman6277eb22009-11-23 17:16:22 +000017#include "FunctionLoweringInfo.h"
Dan Gohman84fbac52009-02-06 17:22:58 +000018#include "llvm/CodeGen/SelectionDAGISel.h"
Jim Laskeyc7c3f112006-10-16 20:52:31 +000019#include "llvm/Analysis/AliasAnalysis.h"
Devang Patel713f0432009-09-16 21:09:07 +000020#include "llvm/Analysis/DebugInfo.h"
Anton Korobeynikov5502bf62007-04-04 21:14:49 +000021#include "llvm/Constants.h"
Chris Lattneradf6a962005-05-13 18:50:42 +000022#include "llvm/CallingConv.h"
Chris Lattner1c08c712005-01-07 07:47:53 +000023#include "llvm/DerivedTypes.h"
24#include "llvm/Function.h"
Chris Lattner36ce6912005-11-29 06:21:05 +000025#include "llvm/GlobalVariable.h"
Chris Lattnerce7518c2006-01-26 22:24:51 +000026#include "llvm/InlineAsm.h"
Chris Lattner1c08c712005-01-07 07:47:53 +000027#include "llvm/Instructions.h"
28#include "llvm/Intrinsics.h"
Jim Laskey43970fe2006-03-23 18:06:46 +000029#include "llvm/IntrinsicInst.h"
Chris Lattner75c478a2009-10-27 17:02:08 +000030#include "llvm/LLVMContext.h"
Dan Gohman78eca172008-08-19 22:33:34 +000031#include "llvm/CodeGen/FastISel.h"
Gordon Henriksen5a29c9e2008-08-17 12:56:54 +000032#include "llvm/CodeGen/GCStrategy.h"
Gordon Henriksen5eca0752008-08-17 18:44:35 +000033#include "llvm/CodeGen/GCMetadata.h"
Chris Lattner1c08c712005-01-07 07:47:53 +000034#include "llvm/CodeGen/MachineFunction.h"
Dan Gohmanad2afc22009-07-31 18:16:33 +000035#include "llvm/CodeGen/MachineFunctionAnalysis.h"
Chris Lattner1c08c712005-01-07 07:47:53 +000036#include "llvm/CodeGen/MachineFrameInfo.h"
37#include "llvm/CodeGen/MachineInstrBuilder.h"
Chris Lattner84bc5422007-12-31 04:13:23 +000038#include "llvm/CodeGen/MachineJumpTableInfo.h"
39#include "llvm/CodeGen/MachineModuleInfo.h"
40#include "llvm/CodeGen/MachineRegisterInfo.h"
Dan Gohmanfc54c552009-01-15 22:18:12 +000041#include "llvm/CodeGen/ScheduleHazardRecognizer.h"
Jim Laskeyeb577ba2006-08-02 12:30:23 +000042#include "llvm/CodeGen/SchedulerRegistry.h"
Chris Lattner1c08c712005-01-07 07:47:53 +000043#include "llvm/CodeGen/SelectionDAG.h"
Devang Patel6e7a1612009-01-09 19:11:50 +000044#include "llvm/CodeGen/DwarfWriter.h"
Dan Gohman6f0d0242008-02-10 18:45:23 +000045#include "llvm/Target/TargetRegisterInfo.h"
Chris Lattner1c08c712005-01-07 07:47:53 +000046#include "llvm/Target/TargetData.h"
47#include "llvm/Target/TargetFrameInfo.h"
Dan Gohmane1f188f2009-10-29 22:30:23 +000048#include "llvm/Target/TargetIntrinsicInfo.h"
Chris Lattner1c08c712005-01-07 07:47:53 +000049#include "llvm/Target/TargetInstrInfo.h"
50#include "llvm/Target/TargetLowering.h"
51#include "llvm/Target/TargetMachine.h"
Vladimir Prus12472912006-05-23 13:43:15 +000052#include "llvm/Target/TargetOptions.h"
Chris Lattnera4f0b3a2006-08-27 12:54:02 +000053#include "llvm/Support/Compiler.h"
Evan Chengdb8d56b2008-06-30 20:45:06 +000054#include "llvm/Support/Debug.h"
Torok Edwin7d696d82009-07-11 13:10:19 +000055#include "llvm/Support/ErrorHandling.h"
Evan Chengdb8d56b2008-06-30 20:45:06 +000056#include "llvm/Support/MathExtras.h"
57#include "llvm/Support/Timer.h"
Daniel Dunbarce63ffb2009-07-25 00:23:56 +000058#include "llvm/Support/raw_ostream.h"
Jeff Cohen7e881032006-02-24 02:52:40 +000059#include <algorithm>
Chris Lattner1c08c712005-01-07 07:47:53 +000060using namespace llvm;
61
Chris Lattneread0d882008-06-17 06:09:18 +000062static cl::opt<bool>
Dan Gohman293d5f82008-09-09 22:06:46 +000063EnableFastISelVerbose("fast-isel-verbose", cl::Hidden,
Dan Gohmand659d502008-10-20 21:30:12 +000064 cl::desc("Enable verbose messages in the \"fast\" "
Dan Gohman293d5f82008-09-09 22:06:46 +000065 "instruction selector"));
66static cl::opt<bool>
Dan Gohman4344a5d2008-09-09 23:05:00 +000067EnableFastISelAbort("fast-isel-abort", cl::Hidden,
68 cl::desc("Enable abort calls when \"fast\" instruction fails"));
Dan Gohman8a110532008-09-05 22:59:21 +000069static cl::opt<bool>
Evan Chengdf8ed022009-11-09 06:49:37 +000070SchedLiveInCopies("schedule-livein-copies", cl::Hidden,
Dan Gohman8a110532008-09-05 22:59:21 +000071 cl::desc("Schedule copies of livein registers"),
72 cl::init(false));
Chris Lattneread0d882008-06-17 06:09:18 +000073
Chris Lattnerda8abb02005-09-01 18:44:10 +000074#ifndef NDEBUG
Chris Lattner7944d9d2005-01-12 03:41:21 +000075static cl::opt<bool>
Dan Gohman462dc7f2008-07-21 20:00:07 +000076ViewDAGCombine1("view-dag-combine1-dags", cl::Hidden,
77 cl::desc("Pop up a window to show dags before the first "
78 "dag combine pass"));
79static cl::opt<bool>
80ViewLegalizeTypesDAGs("view-legalize-types-dags", cl::Hidden,
81 cl::desc("Pop up a window to show dags before legalize types"));
82static cl::opt<bool>
83ViewLegalizeDAGs("view-legalize-dags", cl::Hidden,
84 cl::desc("Pop up a window to show dags before legalize"));
85static cl::opt<bool>
86ViewDAGCombine2("view-dag-combine2-dags", cl::Hidden,
87 cl::desc("Pop up a window to show dags before the second "
88 "dag combine pass"));
89static cl::opt<bool>
Duncan Sands25cf2272008-11-24 14:53:14 +000090ViewDAGCombineLT("view-dag-combine-lt-dags", cl::Hidden,
91 cl::desc("Pop up a window to show dags before the post legalize types"
92 " dag combine pass"));
93static cl::opt<bool>
Evan Chenga9c20912006-01-21 02:32:06 +000094ViewISelDAGs("view-isel-dags", cl::Hidden,
95 cl::desc("Pop up a window to show isel dags as they are selected"));
96static cl::opt<bool>
97ViewSchedDAGs("view-sched-dags", cl::Hidden,
98 cl::desc("Pop up a window to show sched dags as they are processed"));
Dan Gohman3e1a7ae2007-08-28 20:32:58 +000099static cl::opt<bool>
100ViewSUnitDAGs("view-sunit-dags", cl::Hidden,
Chris Lattner5bab7852008-01-25 17:24:52 +0000101 cl::desc("Pop up a window to show SUnit dags after they are processed"));
Chris Lattner7944d9d2005-01-12 03:41:21 +0000102#else
Dan Gohman462dc7f2008-07-21 20:00:07 +0000103static const bool ViewDAGCombine1 = false,
104 ViewLegalizeTypesDAGs = false, ViewLegalizeDAGs = false,
105 ViewDAGCombine2 = false,
Duncan Sands25cf2272008-11-24 14:53:14 +0000106 ViewDAGCombineLT = false,
Dan Gohman462dc7f2008-07-21 20:00:07 +0000107 ViewISelDAGs = false, ViewSchedDAGs = false,
108 ViewSUnitDAGs = false;
Chris Lattner7944d9d2005-01-12 03:41:21 +0000109#endif
110
Jim Laskeyeb577ba2006-08-02 12:30:23 +0000111//===---------------------------------------------------------------------===//
112///
113/// RegisterScheduler class - Track the registration of instruction schedulers.
114///
115//===---------------------------------------------------------------------===//
116MachinePassRegistry RegisterScheduler::Registry;
117
118//===---------------------------------------------------------------------===//
119///
120/// ISHeuristic command line option for instruction schedulers.
121///
122//===---------------------------------------------------------------------===//
Dan Gohman844731a2008-05-13 00:00:25 +0000123static cl::opt<RegisterScheduler::FunctionPassCtor, false,
124 RegisterPassParser<RegisterScheduler> >
125ISHeuristic("pre-RA-sched",
126 cl::init(&createDefaultScheduler),
127 cl::desc("Instruction schedulers available (before register"
128 " allocation):"));
Jim Laskey13ec7022006-08-01 14:21:23 +0000129
Dan Gohman844731a2008-05-13 00:00:25 +0000130static RegisterScheduler
Dan Gohmanb8cab922008-10-14 20:25:08 +0000131defaultListDAGScheduler("default", "Best scheduler for the target",
Dan Gohman844731a2008-05-13 00:00:25 +0000132 createDefaultScheduler);
Evan Cheng4ef10862006-01-23 07:01:07 +0000133
Chris Lattner1c08c712005-01-07 07:47:53 +0000134namespace llvm {
135 //===--------------------------------------------------------------------===//
Jim Laskey9373beb2006-08-01 19:14:14 +0000136 /// createDefaultScheduler - This creates an instruction scheduler appropriate
137 /// for the target.
Dan Gohman47ac0f02009-02-11 04:27:20 +0000138 ScheduleDAGSDNodes* createDefaultScheduler(SelectionDAGISel *IS,
Bill Wendling98a366d2009-04-29 23:29:43 +0000139 CodeGenOpt::Level OptLevel) {
Dan Gohmane9530ec2009-01-15 16:58:17 +0000140 const TargetLowering &TLI = IS->getTargetLowering();
141
Bill Wendling98a366d2009-04-29 23:29:43 +0000142 if (OptLevel == CodeGenOpt::None)
Bill Wendlingbe8cc2a2009-04-29 00:15:41 +0000143 return createFastDAGScheduler(IS, OptLevel);
Dan Gohman9e76fea2008-11-20 03:11:19 +0000144 if (TLI.getSchedulingPreference() == TargetLowering::SchedulingForLatency)
Bill Wendlingbe8cc2a2009-04-29 00:15:41 +0000145 return createTDListDAGScheduler(IS, OptLevel);
Dan Gohman9e76fea2008-11-20 03:11:19 +0000146 assert(TLI.getSchedulingPreference() ==
Bill Wendling187361b2010-01-23 10:26:57 +0000147 TargetLowering::SchedulingForRegPressure && "Unknown sched type!");
Bill Wendlingbe8cc2a2009-04-29 00:15:41 +0000148 return createBURRListDAGScheduler(IS, OptLevel);
Jim Laskey9373beb2006-08-01 19:14:14 +0000149 }
Chris Lattner1c08c712005-01-07 07:47:53 +0000150}
151
Evan Chengff9b3732008-01-30 18:18:23 +0000152// EmitInstrWithCustomInserter - This method should be implemented by targets
Dan Gohman533297b2009-10-29 18:10:34 +0000153// that mark instructions with the 'usesCustomInserter' flag. These
Chris Lattner025c39b2005-08-26 20:54:47 +0000154// instructions are special in various ways, which require special support to
155// insert. The specified MachineInstr is created but not inserted into any
Dan Gohman533297b2009-10-29 18:10:34 +0000156// basic blocks, and this method is called to expand it into a sequence of
157// instructions, potentially also creating new basic blocks and control flow.
158// When new basic blocks are inserted and the edges from MBB to its successors
159// are modified, the method should insert pairs of <OldSucc, NewSucc> into the
160// DenseMap.
Evan Chengff9b3732008-01-30 18:18:23 +0000161MachineBasicBlock *TargetLowering::EmitInstrWithCustomInserter(MachineInstr *MI,
Evan Chengfb2e7522009-09-18 21:02:19 +0000162 MachineBasicBlock *MBB,
163 DenseMap<MachineBasicBlock*, MachineBasicBlock*> *EM) const {
Torok Edwinf3689232009-07-12 20:07:01 +0000164#ifndef NDEBUG
David Greene1a053232010-01-05 01:26:11 +0000165 dbgs() << "If a target marks an instruction with "
Dan Gohman533297b2009-10-29 18:10:34 +0000166 "'usesCustomInserter', it must implement "
Torok Edwinf3689232009-07-12 20:07:01 +0000167 "TargetLowering::EmitInstrWithCustomInserter!";
168#endif
Torok Edwinc23197a2009-07-14 16:55:14 +0000169 llvm_unreachable(0);
Daniel Dunbara279bc32009-09-20 02:20:51 +0000170 return 0;
Chris Lattner025c39b2005-08-26 20:54:47 +0000171}
172
Dan Gohman8a110532008-09-05 22:59:21 +0000173/// EmitLiveInCopy - Emit a copy for a live in physical register. If the
174/// physical register has only a single copy use, then coalesced the copy
175/// if possible.
176static void EmitLiveInCopy(MachineBasicBlock *MBB,
177 MachineBasicBlock::iterator &InsertPos,
178 unsigned VirtReg, unsigned PhysReg,
179 const TargetRegisterClass *RC,
180 DenseMap<MachineInstr*, unsigned> &CopyRegMap,
181 const MachineRegisterInfo &MRI,
182 const TargetRegisterInfo &TRI,
183 const TargetInstrInfo &TII) {
184 unsigned NumUses = 0;
185 MachineInstr *UseMI = NULL;
186 for (MachineRegisterInfo::use_iterator UI = MRI.use_begin(VirtReg),
187 UE = MRI.use_end(); UI != UE; ++UI) {
188 UseMI = &*UI;
189 if (++NumUses > 1)
190 break;
191 }
192
193 // If the number of uses is not one, or the use is not a move instruction,
194 // don't coalesce. Also, only coalesce away a virtual register to virtual
195 // register copy.
196 bool Coalesced = false;
Evan Cheng04ee5a12009-01-20 19:12:24 +0000197 unsigned SrcReg, DstReg, SrcSubReg, DstSubReg;
Dan Gohman8a110532008-09-05 22:59:21 +0000198 if (NumUses == 1 &&
Evan Cheng04ee5a12009-01-20 19:12:24 +0000199 TII.isMoveInstr(*UseMI, SrcReg, DstReg, SrcSubReg, DstSubReg) &&
Dan Gohman8a110532008-09-05 22:59:21 +0000200 TargetRegisterInfo::isVirtualRegister(DstReg)) {
201 VirtReg = DstReg;
202 Coalesced = true;
203 }
204
205 // Now find an ideal location to insert the copy.
206 MachineBasicBlock::iterator Pos = InsertPos;
207 while (Pos != MBB->begin()) {
208 MachineInstr *PrevMI = prior(Pos);
209 DenseMap<MachineInstr*, unsigned>::iterator RI = CopyRegMap.find(PrevMI);
210 // copyRegToReg might emit multiple instructions to do a copy.
211 unsigned CopyDstReg = (RI == CopyRegMap.end()) ? 0 : RI->second;
212 if (CopyDstReg && !TRI.regsOverlap(CopyDstReg, PhysReg))
213 // This is what the BB looks like right now:
214 // r1024 = mov r0
215 // ...
216 // r1 = mov r1024
217 //
218 // We want to insert "r1025 = mov r1". Inserting this copy below the
219 // move to r1024 makes it impossible for that move to be coalesced.
220 //
221 // r1025 = mov r1
222 // r1024 = mov r0
223 // ...
224 // r1 = mov 1024
225 // r2 = mov 1025
226 break; // Woot! Found a good location.
227 --Pos;
228 }
229
David Goodwinf1daf7d2009-07-08 23:10:31 +0000230 bool Emitted = TII.copyRegToReg(*MBB, Pos, VirtReg, PhysReg, RC, RC);
231 assert(Emitted && "Unable to issue a live-in copy instruction!\n");
232 (void) Emitted;
Daniel Dunbara279bc32009-09-20 02:20:51 +0000233
Zhongxing Xu931424a2009-10-16 05:42:28 +0000234 CopyRegMap.insert(std::make_pair(prior(Pos), VirtReg));
Dan Gohman8a110532008-09-05 22:59:21 +0000235 if (Coalesced) {
236 if (&*InsertPos == UseMI) ++InsertPos;
237 MBB->erase(UseMI);
238 }
239}
240
241/// EmitLiveInCopies - If this is the first basic block in the function,
242/// and if it has live ins that need to be copied into vregs, emit the
243/// copies into the block.
244static void EmitLiveInCopies(MachineBasicBlock *EntryMBB,
245 const MachineRegisterInfo &MRI,
246 const TargetRegisterInfo &TRI,
247 const TargetInstrInfo &TII) {
248 if (SchedLiveInCopies) {
249 // Emit the copies at a heuristically-determined location in the block.
250 DenseMap<MachineInstr*, unsigned> CopyRegMap;
251 MachineBasicBlock::iterator InsertPos = EntryMBB->begin();
252 for (MachineRegisterInfo::livein_iterator LI = MRI.livein_begin(),
253 E = MRI.livein_end(); LI != E; ++LI)
254 if (LI->second) {
255 const TargetRegisterClass *RC = MRI.getRegClass(LI->second);
256 EmitLiveInCopy(EntryMBB, InsertPos, LI->second, LI->first,
257 RC, CopyRegMap, MRI, TRI, TII);
258 }
259 } else {
260 // Emit the copies into the top of the block.
261 for (MachineRegisterInfo::livein_iterator LI = MRI.livein_begin(),
262 E = MRI.livein_end(); LI != E; ++LI)
263 if (LI->second) {
264 const TargetRegisterClass *RC = MRI.getRegClass(LI->second);
David Goodwinf1daf7d2009-07-08 23:10:31 +0000265 bool Emitted = TII.copyRegToReg(*EntryMBB, EntryMBB->begin(),
266 LI->second, LI->first, RC, RC);
267 assert(Emitted && "Unable to issue a live-in copy instruction!\n");
268 (void) Emitted;
Dan Gohman8a110532008-09-05 22:59:21 +0000269 }
270 }
271}
272
Chris Lattner7041ee32005-01-11 05:56:49 +0000273//===----------------------------------------------------------------------===//
274// SelectionDAGISel code
275//===----------------------------------------------------------------------===//
Chris Lattner1c08c712005-01-07 07:47:53 +0000276
Bill Wendling98a366d2009-04-29 23:29:43 +0000277SelectionDAGISel::SelectionDAGISel(TargetMachine &tm, CodeGenOpt::Level OL) :
Dan Gohmanad2afc22009-07-31 18:16:33 +0000278 MachineFunctionPass(&ID), TM(tm), TLI(*tm.getTargetLowering()),
Dan Gohman7c3234c2008-08-27 23:52:12 +0000279 FuncInfo(new FunctionLoweringInfo(TLI)),
280 CurDAG(new SelectionDAG(TLI, *FuncInfo)),
Dan Gohman2048b852009-11-23 18:04:58 +0000281 SDB(new SelectionDAGBuilder(*CurDAG, TLI, *FuncInfo, OL)),
Dan Gohman7c3234c2008-08-27 23:52:12 +0000282 GFI(),
Bill Wendlingbe8cc2a2009-04-29 00:15:41 +0000283 OptLevel(OL),
Dan Gohman7c3234c2008-08-27 23:52:12 +0000284 DAGSize(0)
285{}
286
287SelectionDAGISel::~SelectionDAGISel() {
Dan Gohman2048b852009-11-23 18:04:58 +0000288 delete SDB;
Dan Gohman7c3234c2008-08-27 23:52:12 +0000289 delete CurDAG;
290 delete FuncInfo;
291}
292
Owen Andersone50ed302009-08-10 22:56:29 +0000293unsigned SelectionDAGISel::MakeReg(EVT VT) {
Chris Lattner84bc5422007-12-31 04:13:23 +0000294 return RegInfo->createVirtualRegister(TLI.getRegClassFor(VT));
Chris Lattner1c08c712005-01-07 07:47:53 +0000295}
296
Chris Lattner495a0b52005-08-17 06:37:43 +0000297void SelectionDAGISel::getAnalysisUsage(AnalysisUsage &AU) const {
Jim Laskeyc7c3f112006-10-16 20:52:31 +0000298 AU.addRequired<AliasAnalysis>();
Dan Gohmana3477fe2009-07-31 23:36:22 +0000299 AU.addPreserved<AliasAnalysis>();
Gordon Henriksen5eca0752008-08-17 18:44:35 +0000300 AU.addRequired<GCModuleInfo>();
Dan Gohmana3477fe2009-07-31 23:36:22 +0000301 AU.addPreserved<GCModuleInfo>();
Devang Patel6e7a1612009-01-09 19:11:50 +0000302 AU.addRequired<DwarfWriter>();
Dan Gohmana3477fe2009-07-31 23:36:22 +0000303 AU.addPreserved<DwarfWriter>();
Dan Gohmanad2afc22009-07-31 18:16:33 +0000304 MachineFunctionPass::getAnalysisUsage(AU);
Chris Lattner495a0b52005-08-17 06:37:43 +0000305}
Chris Lattner1c08c712005-01-07 07:47:53 +0000306
Dan Gohmanad2afc22009-07-31 18:16:33 +0000307bool SelectionDAGISel::runOnMachineFunction(MachineFunction &mf) {
308 Function &Fn = *mf.getFunction();
309
Dan Gohman4344a5d2008-09-09 23:05:00 +0000310 // Do some sanity-checking on the command-line options.
311 assert((!EnableFastISelVerbose || EnableFastISel) &&
312 "-fast-isel-verbose requires -fast-isel");
313 assert((!EnableFastISelAbort || EnableFastISel) &&
314 "-fast-isel-abort requires -fast-isel");
315
Dan Gohman5f43f922007-08-27 16:26:13 +0000316 // Get alias analysis for load/store combining.
317 AA = &getAnalysis<AliasAnalysis>();
318
Dan Gohmanad2afc22009-07-31 18:16:33 +0000319 MF = &mf;
Dan Gohman8a110532008-09-05 22:59:21 +0000320 const TargetInstrInfo &TII = *TM.getInstrInfo();
321 const TargetRegisterInfo &TRI = *TM.getRegisterInfo();
322
Dan Gohmanf7d6cd42009-08-01 03:51:09 +0000323 if (Fn.hasGC())
324 GFI = &getAnalysis<GCModuleInfo>().getFunctionInfo(Fn);
Gordon Henriksence224772008-01-07 01:30:38 +0000325 else
Gordon Henriksen5eca0752008-08-17 18:44:35 +0000326 GFI = 0;
Dan Gohman79ce2762009-01-15 19:20:50 +0000327 RegInfo = &MF->getRegInfo();
David Greene1a053232010-01-05 01:26:11 +0000328 DEBUG(dbgs() << "\n\n\n=== " << Fn.getName() << "\n");
Chris Lattner1c08c712005-01-07 07:47:53 +0000329
Duncan Sands1465d612009-01-28 13:14:17 +0000330 MachineModuleInfo *MMI = getAnalysisIfAvailable<MachineModuleInfo>();
331 DwarfWriter *DW = getAnalysisIfAvailable<DwarfWriter>();
Owen Anderson5dcaceb2009-07-09 18:44:09 +0000332 CurDAG->init(*MF, MMI, DW);
Dan Gohman6277eb22009-11-23 17:16:22 +0000333 FuncInfo->set(Fn, *MF, EnableFastISel);
Dan Gohman2048b852009-11-23 18:04:58 +0000334 SDB->init(GFI, *AA);
Chris Lattner1c08c712005-01-07 07:47:53 +0000335
Dale Johannesen1532f3d2008-04-02 00:25:04 +0000336 for (Function::iterator I = Fn.begin(), E = Fn.end(); I != E; ++I)
337 if (InvokeInst *Invoke = dyn_cast<InvokeInst>(I->getTerminator()))
338 // Mark landing pad.
Dan Gohman7c3234c2008-08-27 23:52:12 +0000339 FuncInfo->MBBMap[Invoke->getSuccessor(1)]->setIsLandingPad();
Duncan Sands9fac0b52007-06-06 10:05:18 +0000340
Dan Gohman79ce2762009-01-15 19:20:50 +0000341 SelectAllBasicBlocks(Fn, *MF, MMI, DW, TII);
Misha Brukmanedf128a2005-04-21 22:36:52 +0000342
Dan Gohman8a110532008-09-05 22:59:21 +0000343 // If the first basic block in the function has live ins that need to be
344 // copied into vregs, emit the copies into the top of the block before
345 // emitting the code for the block.
Dan Gohman79ce2762009-01-15 19:20:50 +0000346 EmitLiveInCopies(MF->begin(), *RegInfo, TRI, TII);
Dan Gohman8a110532008-09-05 22:59:21 +0000347
Evan Chengad2070c2007-02-10 02:43:39 +0000348 // Add function live-ins to entry block live-in set.
Dan Gohman8a110532008-09-05 22:59:21 +0000349 for (MachineRegisterInfo::livein_iterator I = RegInfo->livein_begin(),
350 E = RegInfo->livein_end(); I != E; ++I)
Dan Gohman79ce2762009-01-15 19:20:50 +0000351 MF->begin()->addLiveIn(I->first);
Evan Chengad2070c2007-02-10 02:43:39 +0000352
Duncan Sandsf4070822007-06-15 19:04:19 +0000353#ifndef NDEBUG
Dan Gohman7c3234c2008-08-27 23:52:12 +0000354 assert(FuncInfo->CatchInfoFound.size() == FuncInfo->CatchInfoLost.size() &&
Duncan Sandsf4070822007-06-15 19:04:19 +0000355 "Not all catch info was assigned to a landing pad!");
356#endif
357
Dan Gohman7c3234c2008-08-27 23:52:12 +0000358 FuncInfo->clear();
359
Chris Lattner1c08c712005-01-07 07:47:53 +0000360 return true;
361}
362
Dan Gohman07f111e2009-12-05 00:27:08 +0000363/// SetDebugLoc - Update MF's and SDB's DebugLocs if debug information is
364/// attached with this instruction.
Chris Lattner3990b122009-12-28 23:41:32 +0000365static void SetDebugLoc(unsigned MDDbgKind, Instruction *I,
366 SelectionDAGBuilder *SDB,
Chris Lattner0eb41982009-12-28 20:45:51 +0000367 FastISel *FastIS, MachineFunction *MF) {
368 if (isa<DbgInfoIntrinsic>(I)) return;
369
Chris Lattner3990b122009-12-28 23:41:32 +0000370 if (MDNode *Dbg = I->getMetadata(MDDbgKind)) {
Chris Lattner0eb41982009-12-28 20:45:51 +0000371 DILocation DILoc(Dbg);
372 DebugLoc Loc = ExtractDebugLocation(DILoc, MF->getDebugLocInfo());
Dan Gohman07f111e2009-12-05 00:27:08 +0000373
Chris Lattner0eb41982009-12-28 20:45:51 +0000374 SDB->setCurDebugLoc(Loc);
Dan Gohman07f111e2009-12-05 00:27:08 +0000375
Chris Lattner0eb41982009-12-28 20:45:51 +0000376 if (FastIS)
377 FastIS->setCurDebugLoc(Loc);
Dan Gohman07f111e2009-12-05 00:27:08 +0000378
Chris Lattner0eb41982009-12-28 20:45:51 +0000379 // If the function doesn't have a default debug location yet, set
380 // it. This is kind of a hack.
381 if (MF->getDefaultDebugLoc().isUnknown())
382 MF->setDefaultDebugLoc(Loc);
383 }
Dan Gohman07f111e2009-12-05 00:27:08 +0000384}
385
386/// ResetDebugLoc - Set MF's and SDB's DebugLocs to Unknown.
Chris Lattner3990b122009-12-28 23:41:32 +0000387static void ResetDebugLoc(SelectionDAGBuilder *SDB, FastISel *FastIS) {
Dan Gohman07f111e2009-12-05 00:27:08 +0000388 SDB->setCurDebugLoc(DebugLoc::getUnknownLoc());
389 if (FastIS)
Dan Gohman688fb802009-12-14 23:08:09 +0000390 FastIS->setCurDebugLoc(DebugLoc::getUnknownLoc());
Dan Gohman07f111e2009-12-05 00:27:08 +0000391}
392
Dan Gohmanf350b272008-08-23 02:25:05 +0000393void SelectionDAGISel::SelectBasicBlock(BasicBlock *LLVMBB,
394 BasicBlock::iterator Begin,
Dan Gohmanb4afb132009-11-20 02:51:26 +0000395 BasicBlock::iterator End,
396 bool &HadTailCall) {
Dan Gohman2048b852009-11-23 18:04:58 +0000397 SDB->setCurrentBasicBlock(BB);
Chris Lattner08113472009-12-29 09:01:33 +0000398 unsigned MDDbgKind = LLVMBB->getContext().getMDKindID("dbg");
Dan Gohmanf350b272008-08-23 02:25:05 +0000399
Dan Gohman98ca4f22009-08-05 01:29:28 +0000400 // Lower all of the non-terminator instructions. If a call is emitted
401 // as a tail call, cease emitting nodes for this block.
Dan Gohman2048b852009-11-23 18:04:58 +0000402 for (BasicBlock::iterator I = Begin; I != End && !SDB->HasTailCall; ++I) {
Chris Lattner3990b122009-12-28 23:41:32 +0000403 SetDebugLoc(MDDbgKind, I, SDB, 0, MF);
Dan Gohman07f111e2009-12-05 00:27:08 +0000404
405 if (!isa<TerminatorInst>(I)) {
Dan Gohman2048b852009-11-23 18:04:58 +0000406 SDB->visit(*I);
Dan Gohman07f111e2009-12-05 00:27:08 +0000407
408 // Set the current debug location back to "unknown" so that it doesn't
409 // spuriously apply to subsequent instructions.
410 ResetDebugLoc(SDB, 0);
411 }
Devang Patel123eaa72009-09-16 20:39:11 +0000412 }
Dan Gohmanf350b272008-08-23 02:25:05 +0000413
Dan Gohman2048b852009-11-23 18:04:58 +0000414 if (!SDB->HasTailCall) {
Dan Gohman98ca4f22009-08-05 01:29:28 +0000415 // Ensure that all instructions which are used outside of their defining
416 // blocks are available as virtual registers. Invoke is handled elsewhere.
417 for (BasicBlock::iterator I = Begin; I != End; ++I)
418 if (!isa<PHINode>(I) && !isa<InvokeInst>(I))
Dan Gohman2048b852009-11-23 18:04:58 +0000419 SDB->CopyToExportRegsIfNeeded(I);
Dan Gohmanf350b272008-08-23 02:25:05 +0000420
Dan Gohman98ca4f22009-08-05 01:29:28 +0000421 // Handle PHI nodes in successor blocks.
422 if (End == LLVMBB->end()) {
423 HandlePHINodesInSuccessorBlocks(LLVMBB);
Dan Gohman3df24e62008-09-03 23:12:08 +0000424
Dan Gohman98ca4f22009-08-05 01:29:28 +0000425 // Lower the terminator after the copies are emitted.
Chris Lattner3990b122009-12-28 23:41:32 +0000426 SetDebugLoc(MDDbgKind, LLVMBB->getTerminator(), SDB, 0, MF);
Dan Gohman2048b852009-11-23 18:04:58 +0000427 SDB->visit(*LLVMBB->getTerminator());
Dan Gohman07f111e2009-12-05 00:27:08 +0000428 ResetDebugLoc(SDB, 0);
Dan Gohman98ca4f22009-08-05 01:29:28 +0000429 }
Dan Gohman3df24e62008-09-03 23:12:08 +0000430 }
Daniel Dunbara279bc32009-09-20 02:20:51 +0000431
Chris Lattnera651cf62005-01-17 19:43:36 +0000432 // Make sure the root of the DAG is up-to-date.
Dan Gohman2048b852009-11-23 18:04:58 +0000433 CurDAG->setRoot(SDB->getControlRoot());
Arnold Schwaighoferc85e1712007-10-11 19:40:01 +0000434
Dan Gohmanf350b272008-08-23 02:25:05 +0000435 // Final step, emit the lowered DAG as machine code.
436 CodeGenAndEmitDAG();
Dan Gohman2048b852009-11-23 18:04:58 +0000437 HadTailCall = SDB->HasTailCall;
438 SDB->clear();
Chris Lattner1c08c712005-01-07 07:47:53 +0000439}
440
Evan Cheng54e146b2010-01-09 00:21:08 +0000441namespace {
442/// WorkListRemover - This class is a DAGUpdateListener that removes any deleted
443/// nodes from the worklist.
444class SDOPsWorkListRemover : public SelectionDAG::DAGUpdateListener {
445 SmallVector<SDNode*, 128> &Worklist;
446public:
447 SDOPsWorkListRemover(SmallVector<SDNode*, 128> &wl) : Worklist(wl) {}
448
449 virtual void NodeDeleted(SDNode *N, SDNode *E) {
450 Worklist.erase(std::remove(Worklist.begin(), Worklist.end(), N),
451 Worklist.end());
452 }
453
454 virtual void NodeUpdated(SDNode *N) {
455 // Ignore updates.
456 }
457};
458}
459
Evan Cheng046632f2010-02-10 02:17:34 +0000460/// TrivialTruncElim - Eliminate some trivial nops that can result from
461/// ShrinkDemandedOps: (trunc (ext n)) -> n.
462static bool TrivialTruncElim(SDValue Op,
463 TargetLowering::TargetLoweringOpt &TLO) {
464 SDValue N0 = Op.getOperand(0);
465 EVT VT = Op.getValueType();
466 if ((N0.getOpcode() == ISD::ZERO_EXTEND ||
467 N0.getOpcode() == ISD::SIGN_EXTEND ||
468 N0.getOpcode() == ISD::ANY_EXTEND) &&
469 N0.getOperand(0).getValueType() == VT) {
470 return TLO.CombineTo(Op, N0.getOperand(0));
471 }
472 return false;
473}
474
Evan Cheng54eb4c22010-01-06 19:43:21 +0000475/// ShrinkDemandedOps - A late transformation pass that shrink expressions
476/// using TargetLowering::TargetLoweringOpt::ShrinkDemandedOp. It converts
477/// x+y to (VT)((SmallVT)x+(SmallVT)y) if the casts are free.
Evan Chengd40d03e2010-01-06 19:38:29 +0000478void SelectionDAGISel::ShrinkDemandedOps() {
479 SmallVector<SDNode*, 128> Worklist;
480
481 // Add all the dag nodes to the worklist.
482 Worklist.reserve(CurDAG->allnodes_size());
483 for (SelectionDAG::allnodes_iterator I = CurDAG->allnodes_begin(),
484 E = CurDAG->allnodes_end(); I != E; ++I)
485 Worklist.push_back(I);
486
487 APInt Mask;
488 APInt KnownZero;
489 APInt KnownOne;
490
491 TargetLowering::TargetLoweringOpt TLO(*CurDAG, true);
492 while (!Worklist.empty()) {
Benjamin Kramer7b1e2a52010-01-07 17:27:56 +0000493 SDNode *N = Worklist.pop_back_val();
Evan Chengd40d03e2010-01-06 19:38:29 +0000494
495 if (N->use_empty() && N != CurDAG->getRoot().getNode()) {
Evan Cheng54e146b2010-01-09 00:21:08 +0000496 CurDAG->DeleteNode(N);
Evan Chengd40d03e2010-01-06 19:38:29 +0000497 continue;
498 }
499
500 // Run ShrinkDemandedOp on scalar binary operations.
501 if (N->getNumValues() == 1 &&
502 N->getValueType(0).isSimple() && N->getValueType(0).isInteger()) {
Evan Chengd40d03e2010-01-06 19:38:29 +0000503 unsigned BitWidth = N->getValueType(0).getScalarType().getSizeInBits();
504 APInt Demanded = APInt::getAllOnesValue(BitWidth);
505 APInt KnownZero, KnownOne;
506 if (TLI.SimplifyDemandedBits(SDValue(N, 0), Demanded,
Evan Cheng046632f2010-02-10 02:17:34 +0000507 KnownZero, KnownOne, TLO) ||
508 (N->getOpcode() == ISD::TRUNCATE &&
509 TrivialTruncElim(SDValue(N, 0), TLO))) {
Evan Chengd40d03e2010-01-06 19:38:29 +0000510 // Revisit the node.
511 Worklist.erase(std::remove(Worklist.begin(), Worklist.end(), N),
512 Worklist.end());
513 Worklist.push_back(N);
514
515 // Replace the old value with the new one.
516 DEBUG(errs() << "\nReplacing ";
517 TLO.Old.getNode()->dump(CurDAG);
518 errs() << "\nWith: ";
519 TLO.New.getNode()->dump(CurDAG);
520 errs() << '\n');
521
522 Worklist.push_back(TLO.New.getNode());
Evan Cheng54e146b2010-01-09 00:21:08 +0000523
524 SDOPsWorkListRemover DeadNodes(Worklist);
525 CurDAG->ReplaceAllUsesOfValueWith(TLO.Old, TLO.New, &DeadNodes);
Evan Chengd40d03e2010-01-06 19:38:29 +0000526
527 if (TLO.Old.getNode()->use_empty()) {
528 for (unsigned i = 0, e = TLO.Old.getNode()->getNumOperands();
529 i != e; ++i) {
530 SDNode *OpNode = TLO.Old.getNode()->getOperand(i).getNode();
531 if (OpNode->hasOneUse()) {
532 Worklist.erase(std::remove(Worklist.begin(), Worklist.end(),
Evan Cheng54e146b2010-01-09 00:21:08 +0000533 OpNode), Worklist.end());
534 Worklist.push_back(OpNode);
Evan Chengd40d03e2010-01-06 19:38:29 +0000535 }
536 }
537
538 Worklist.erase(std::remove(Worklist.begin(), Worklist.end(),
Evan Cheng54e146b2010-01-09 00:21:08 +0000539 TLO.Old.getNode()), Worklist.end());
Evan Chengd40d03e2010-01-06 19:38:29 +0000540 CurDAG->DeleteNode(TLO.Old.getNode());
541 }
542 }
543 }
544 }
545}
546
Dan Gohmanf350b272008-08-23 02:25:05 +0000547void SelectionDAGISel::ComputeLiveOutVRegInfo() {
Chris Lattneread0d882008-06-17 06:09:18 +0000548 SmallPtrSet<SDNode*, 128> VisitedNodes;
549 SmallVector<SDNode*, 128> Worklist;
Daniel Dunbara279bc32009-09-20 02:20:51 +0000550
Gabor Greifba36cb52008-08-28 21:40:38 +0000551 Worklist.push_back(CurDAG->getRoot().getNode());
Daniel Dunbara279bc32009-09-20 02:20:51 +0000552
Chris Lattneread0d882008-06-17 06:09:18 +0000553 APInt Mask;
554 APInt KnownZero;
555 APInt KnownOne;
Daniel Dunbara279bc32009-09-20 02:20:51 +0000556
Benjamin Kramer7b1e2a52010-01-07 17:27:56 +0000557 do {
558 SDNode *N = Worklist.pop_back_val();
Daniel Dunbara279bc32009-09-20 02:20:51 +0000559
Chris Lattneread0d882008-06-17 06:09:18 +0000560 // If we've already seen this node, ignore it.
561 if (!VisitedNodes.insert(N))
562 continue;
Daniel Dunbara279bc32009-09-20 02:20:51 +0000563
Chris Lattneread0d882008-06-17 06:09:18 +0000564 // Otherwise, add all chain operands to the worklist.
565 for (unsigned i = 0, e = N->getNumOperands(); i != e; ++i)
Owen Anderson825b72b2009-08-11 20:47:22 +0000566 if (N->getOperand(i).getValueType() == MVT::Other)
Gabor Greifba36cb52008-08-28 21:40:38 +0000567 Worklist.push_back(N->getOperand(i).getNode());
Daniel Dunbara279bc32009-09-20 02:20:51 +0000568
Chris Lattneread0d882008-06-17 06:09:18 +0000569 // If this is a CopyToReg with a vreg dest, process it.
570 if (N->getOpcode() != ISD::CopyToReg)
571 continue;
Daniel Dunbara279bc32009-09-20 02:20:51 +0000572
Chris Lattneread0d882008-06-17 06:09:18 +0000573 unsigned DestReg = cast<RegisterSDNode>(N->getOperand(1))->getReg();
574 if (!TargetRegisterInfo::isVirtualRegister(DestReg))
575 continue;
Daniel Dunbara279bc32009-09-20 02:20:51 +0000576
Chris Lattneread0d882008-06-17 06:09:18 +0000577 // Ignore non-scalar or non-integer values.
Dan Gohman475871a2008-07-27 21:46:04 +0000578 SDValue Src = N->getOperand(2);
Owen Andersone50ed302009-08-10 22:56:29 +0000579 EVT SrcVT = Src.getValueType();
Chris Lattneread0d882008-06-17 06:09:18 +0000580 if (!SrcVT.isInteger() || SrcVT.isVector())
581 continue;
Daniel Dunbara279bc32009-09-20 02:20:51 +0000582
Dan Gohmanf350b272008-08-23 02:25:05 +0000583 unsigned NumSignBits = CurDAG->ComputeNumSignBits(Src);
Chris Lattneread0d882008-06-17 06:09:18 +0000584 Mask = APInt::getAllOnesValue(SrcVT.getSizeInBits());
Dan Gohmanf350b272008-08-23 02:25:05 +0000585 CurDAG->ComputeMaskedBits(Src, Mask, KnownZero, KnownOne);
Daniel Dunbara279bc32009-09-20 02:20:51 +0000586
Chris Lattneread0d882008-06-17 06:09:18 +0000587 // Only install this information if it tells us something.
588 if (NumSignBits != 1 || KnownZero != 0 || KnownOne != 0) {
589 DestReg -= TargetRegisterInfo::FirstVirtualRegister;
Dan Gohmanf7d6cd42009-08-01 03:51:09 +0000590 if (DestReg >= FuncInfo->LiveOutRegInfo.size())
591 FuncInfo->LiveOutRegInfo.resize(DestReg+1);
592 FunctionLoweringInfo::LiveOutInfo &LOI =
593 FuncInfo->LiveOutRegInfo[DestReg];
Chris Lattneread0d882008-06-17 06:09:18 +0000594 LOI.NumSignBits = NumSignBits;
Dan Gohmana80efce2009-03-27 23:55:04 +0000595 LOI.KnownOne = KnownOne;
596 LOI.KnownZero = KnownZero;
Chris Lattneread0d882008-06-17 06:09:18 +0000597 }
Benjamin Kramer7b1e2a52010-01-07 17:27:56 +0000598 } while (!Worklist.empty());
Chris Lattneread0d882008-06-17 06:09:18 +0000599}
600
Dan Gohmanf350b272008-08-23 02:25:05 +0000601void SelectionDAGISel::CodeGenAndEmitDAG() {
Dan Gohman462dc7f2008-07-21 20:00:07 +0000602 std::string GroupName;
603 if (TimePassesIsEnabled)
604 GroupName = "Instruction Selection and Scheduling";
605 std::string BlockName;
606 if (ViewDAGCombine1 || ViewLegalizeTypesDAGs || ViewLegalizeDAGs ||
Duncan Sands25cf2272008-11-24 14:53:14 +0000607 ViewDAGCombine2 || ViewDAGCombineLT || ViewISelDAGs || ViewSchedDAGs ||
608 ViewSUnitDAGs)
Dan Gohmanf7d6cd42009-08-01 03:51:09 +0000609 BlockName = MF->getFunction()->getNameStr() + ":" +
Daniel Dunbarf6ccee52009-07-24 08:24:36 +0000610 BB->getBasicBlock()->getNameStr();
Dan Gohman462dc7f2008-07-21 20:00:07 +0000611
David Greene1a053232010-01-05 01:26:11 +0000612 DEBUG(dbgs() << "Initial selection DAG:\n");
Dan Gohmanf350b272008-08-23 02:25:05 +0000613 DEBUG(CurDAG->dump());
Dan Gohman462dc7f2008-07-21 20:00:07 +0000614
Dan Gohmanf350b272008-08-23 02:25:05 +0000615 if (ViewDAGCombine1) CurDAG->viewGraph("dag-combine1 input for " + BlockName);
Dan Gohman417e11b2007-10-08 15:12:17 +0000616
Chris Lattneraf21d552005-10-10 16:47:10 +0000617 // Run the DAG combiner in pre-legalize mode.
Evan Chengebffb662008-07-01 17:59:20 +0000618 if (TimePassesIsEnabled) {
Dan Gohman5e843682008-07-14 18:19:29 +0000619 NamedRegionTimer T("DAG Combining 1", GroupName);
Bill Wendlingbe8cc2a2009-04-29 00:15:41 +0000620 CurDAG->Combine(Unrestricted, *AA, OptLevel);
Evan Chengebffb662008-07-01 17:59:20 +0000621 } else {
Bill Wendlingbe8cc2a2009-04-29 00:15:41 +0000622 CurDAG->Combine(Unrestricted, *AA, OptLevel);
Evan Chengebffb662008-07-01 17:59:20 +0000623 }
Daniel Dunbara279bc32009-09-20 02:20:51 +0000624
David Greene1a053232010-01-05 01:26:11 +0000625 DEBUG(dbgs() << "Optimized lowered selection DAG:\n");
Dan Gohmanf350b272008-08-23 02:25:05 +0000626 DEBUG(CurDAG->dump());
Daniel Dunbara279bc32009-09-20 02:20:51 +0000627
Chris Lattner1c08c712005-01-07 07:47:53 +0000628 // Second step, hack on the DAG until it only uses operations and types that
629 // the target supports.
Dan Gohman714efc62009-12-05 17:51:33 +0000630 if (ViewLegalizeTypesDAGs) CurDAG->viewGraph("legalize-types input for " +
631 BlockName);
Dan Gohman462dc7f2008-07-21 20:00:07 +0000632
Dan Gohman714efc62009-12-05 17:51:33 +0000633 bool Changed;
634 if (TimePassesIsEnabled) {
635 NamedRegionTimer T("Type Legalization", GroupName);
636 Changed = CurDAG->LegalizeTypes();
637 } else {
638 Changed = CurDAG->LegalizeTypes();
639 }
640
David Greene1a053232010-01-05 01:26:11 +0000641 DEBUG(dbgs() << "Type-legalized selection DAG:\n");
Dan Gohman714efc62009-12-05 17:51:33 +0000642 DEBUG(CurDAG->dump());
643
644 if (Changed) {
645 if (ViewDAGCombineLT)
646 CurDAG->viewGraph("dag-combine-lt input for " + BlockName);
647
648 // Run the DAG combiner in post-type-legalize mode.
Dan Gohman462dc7f2008-07-21 20:00:07 +0000649 if (TimePassesIsEnabled) {
Dan Gohman714efc62009-12-05 17:51:33 +0000650 NamedRegionTimer T("DAG Combining after legalize types", GroupName);
651 CurDAG->Combine(NoIllegalTypes, *AA, OptLevel);
Dan Gohman462dc7f2008-07-21 20:00:07 +0000652 } else {
Dan Gohman714efc62009-12-05 17:51:33 +0000653 CurDAG->Combine(NoIllegalTypes, *AA, OptLevel);
Dan Gohman462dc7f2008-07-21 20:00:07 +0000654 }
655
David Greene1a053232010-01-05 01:26:11 +0000656 DEBUG(dbgs() << "Optimized type-legalized selection DAG:\n");
Dan Gohmanf350b272008-08-23 02:25:05 +0000657 DEBUG(CurDAG->dump());
Dan Gohman714efc62009-12-05 17:51:33 +0000658 }
Dan Gohman462dc7f2008-07-21 20:00:07 +0000659
Dan Gohman714efc62009-12-05 17:51:33 +0000660 if (TimePassesIsEnabled) {
661 NamedRegionTimer T("Vector Legalization", GroupName);
662 Changed = CurDAG->LegalizeVectors();
663 } else {
664 Changed = CurDAG->LegalizeVectors();
665 }
Duncan Sands25cf2272008-11-24 14:53:14 +0000666
Dan Gohman714efc62009-12-05 17:51:33 +0000667 if (Changed) {
Eli Friedman5c22c802009-05-23 12:35:30 +0000668 if (TimePassesIsEnabled) {
Dan Gohman714efc62009-12-05 17:51:33 +0000669 NamedRegionTimer T("Type Legalization 2", GroupName);
Bill Wendling98820072009-12-28 01:51:30 +0000670 CurDAG->LegalizeTypes();
Eli Friedman5c22c802009-05-23 12:35:30 +0000671 } else {
Bill Wendling98820072009-12-28 01:51:30 +0000672 CurDAG->LegalizeTypes();
Eli Friedman5c22c802009-05-23 12:35:30 +0000673 }
674
Dan Gohman714efc62009-12-05 17:51:33 +0000675 if (ViewDAGCombineLT)
676 CurDAG->viewGraph("dag-combine-lv input for " + BlockName);
Eli Friedman5c22c802009-05-23 12:35:30 +0000677
Dan Gohman714efc62009-12-05 17:51:33 +0000678 // Run the DAG combiner in post-type-legalize mode.
679 if (TimePassesIsEnabled) {
680 NamedRegionTimer T("DAG Combining after legalize vectors", GroupName);
681 CurDAG->Combine(NoIllegalOperations, *AA, OptLevel);
682 } else {
683 CurDAG->Combine(NoIllegalOperations, *AA, OptLevel);
Eli Friedman5c22c802009-05-23 12:35:30 +0000684 }
Dan Gohman714efc62009-12-05 17:51:33 +0000685
David Greene1a053232010-01-05 01:26:11 +0000686 DEBUG(dbgs() << "Optimized vector-legalized selection DAG:\n");
Dan Gohman714efc62009-12-05 17:51:33 +0000687 DEBUG(CurDAG->dump());
Chris Lattner70587ea2008-07-10 23:37:50 +0000688 }
Daniel Dunbara279bc32009-09-20 02:20:51 +0000689
Dan Gohmanf350b272008-08-23 02:25:05 +0000690 if (ViewLegalizeDAGs) CurDAG->viewGraph("legalize input for " + BlockName);
Dan Gohman462dc7f2008-07-21 20:00:07 +0000691
Evan Chengebffb662008-07-01 17:59:20 +0000692 if (TimePassesIsEnabled) {
Dan Gohman5e843682008-07-14 18:19:29 +0000693 NamedRegionTimer T("DAG Legalization", GroupName);
Dan Gohman714efc62009-12-05 17:51:33 +0000694 CurDAG->Legalize(OptLevel);
Evan Chengebffb662008-07-01 17:59:20 +0000695 } else {
Dan Gohman714efc62009-12-05 17:51:33 +0000696 CurDAG->Legalize(OptLevel);
Evan Chengebffb662008-07-01 17:59:20 +0000697 }
Daniel Dunbara279bc32009-09-20 02:20:51 +0000698
David Greene1a053232010-01-05 01:26:11 +0000699 DEBUG(dbgs() << "Legalized selection DAG:\n");
Dan Gohmanf350b272008-08-23 02:25:05 +0000700 DEBUG(CurDAG->dump());
Daniel Dunbara279bc32009-09-20 02:20:51 +0000701
Dan Gohmanf350b272008-08-23 02:25:05 +0000702 if (ViewDAGCombine2) CurDAG->viewGraph("dag-combine2 input for " + BlockName);
Dan Gohman462dc7f2008-07-21 20:00:07 +0000703
Chris Lattneraf21d552005-10-10 16:47:10 +0000704 // Run the DAG combiner in post-legalize mode.
Evan Chengebffb662008-07-01 17:59:20 +0000705 if (TimePassesIsEnabled) {
Dan Gohman5e843682008-07-14 18:19:29 +0000706 NamedRegionTimer T("DAG Combining 2", GroupName);
Bill Wendlingbe8cc2a2009-04-29 00:15:41 +0000707 CurDAG->Combine(NoIllegalOperations, *AA, OptLevel);
Evan Chengebffb662008-07-01 17:59:20 +0000708 } else {
Bill Wendlingbe8cc2a2009-04-29 00:15:41 +0000709 CurDAG->Combine(NoIllegalOperations, *AA, OptLevel);
Evan Chengebffb662008-07-01 17:59:20 +0000710 }
Daniel Dunbara279bc32009-09-20 02:20:51 +0000711
David Greene1a053232010-01-05 01:26:11 +0000712 DEBUG(dbgs() << "Optimized legalized selection DAG:\n");
Dan Gohmanf350b272008-08-23 02:25:05 +0000713 DEBUG(CurDAG->dump());
Dan Gohman417e11b2007-10-08 15:12:17 +0000714
Dan Gohmanf350b272008-08-23 02:25:05 +0000715 if (ViewISelDAGs) CurDAG->viewGraph("isel input for " + BlockName);
Daniel Dunbara279bc32009-09-20 02:20:51 +0000716
Evan Chengd40d03e2010-01-06 19:38:29 +0000717 if (OptLevel != CodeGenOpt::None) {
718 ShrinkDemandedOps();
Dan Gohmanf350b272008-08-23 02:25:05 +0000719 ComputeLiveOutVRegInfo();
Evan Chengd40d03e2010-01-06 19:38:29 +0000720 }
Evan Cheng552c4a82006-04-28 02:09:19 +0000721
Chris Lattnera33ef482005-03-30 01:10:47 +0000722 // Third, instruction select all of the operations to machine code, adding the
723 // code to the MachineBasicBlock.
Evan Chengebffb662008-07-01 17:59:20 +0000724 if (TimePassesIsEnabled) {
Dan Gohman5e843682008-07-14 18:19:29 +0000725 NamedRegionTimer T("Instruction Selection", GroupName);
Chris Lattner7c306da2010-03-02 06:34:30 +0000726 DoInstructionSelection();
Evan Chengebffb662008-07-01 17:59:20 +0000727 } else {
Chris Lattner7c306da2010-03-02 06:34:30 +0000728 DoInstructionSelection();
Evan Chengebffb662008-07-01 17:59:20 +0000729 }
Evan Chengdb8d56b2008-06-30 20:45:06 +0000730
David Greene1a053232010-01-05 01:26:11 +0000731 DEBUG(dbgs() << "Selected selection DAG:\n");
Dan Gohmanf350b272008-08-23 02:25:05 +0000732 DEBUG(CurDAG->dump());
Dan Gohman462dc7f2008-07-21 20:00:07 +0000733
Dan Gohmanf350b272008-08-23 02:25:05 +0000734 if (ViewSchedDAGs) CurDAG->viewGraph("scheduler input for " + BlockName);
Dan Gohman462dc7f2008-07-21 20:00:07 +0000735
Dan Gohman5e843682008-07-14 18:19:29 +0000736 // Schedule machine code.
Dan Gohman47ac0f02009-02-11 04:27:20 +0000737 ScheduleDAGSDNodes *Scheduler = CreateScheduler();
Dan Gohman5e843682008-07-14 18:19:29 +0000738 if (TimePassesIsEnabled) {
739 NamedRegionTimer T("Instruction Scheduling", GroupName);
Dan Gohman47ac0f02009-02-11 04:27:20 +0000740 Scheduler->Run(CurDAG, BB, BB->end());
Dan Gohman5e843682008-07-14 18:19:29 +0000741 } else {
Dan Gohman47ac0f02009-02-11 04:27:20 +0000742 Scheduler->Run(CurDAG, BB, BB->end());
Dan Gohman5e843682008-07-14 18:19:29 +0000743 }
744
Dan Gohman462dc7f2008-07-21 20:00:07 +0000745 if (ViewSUnitDAGs) Scheduler->viewGraph();
746
Daniel Dunbara279bc32009-09-20 02:20:51 +0000747 // Emit machine code to BB. This can change 'BB' to the last block being
Evan Chengdb8d56b2008-06-30 20:45:06 +0000748 // inserted into.
Evan Chengebffb662008-07-01 17:59:20 +0000749 if (TimePassesIsEnabled) {
Dan Gohman5e843682008-07-14 18:19:29 +0000750 NamedRegionTimer T("Instruction Creation", GroupName);
Dan Gohman2048b852009-11-23 18:04:58 +0000751 BB = Scheduler->EmitSchedule(&SDB->EdgeMapping);
Evan Chengebffb662008-07-01 17:59:20 +0000752 } else {
Dan Gohman2048b852009-11-23 18:04:58 +0000753 BB = Scheduler->EmitSchedule(&SDB->EdgeMapping);
Dan Gohman5e843682008-07-14 18:19:29 +0000754 }
755
756 // Free the scheduler state.
757 if (TimePassesIsEnabled) {
758 NamedRegionTimer T("Instruction Scheduling Cleanup", GroupName);
759 delete Scheduler;
760 } else {
761 delete Scheduler;
Evan Chengebffb662008-07-01 17:59:20 +0000762 }
Evan Chengdb8d56b2008-06-30 20:45:06 +0000763
David Greene1a053232010-01-05 01:26:11 +0000764 DEBUG(dbgs() << "Selected machine code:\n");
Chris Lattner1c08c712005-01-07 07:47:53 +0000765 DEBUG(BB->dump());
Daniel Dunbara279bc32009-09-20 02:20:51 +0000766}
Chris Lattner1c08c712005-01-07 07:47:53 +0000767
Chris Lattner7c306da2010-03-02 06:34:30 +0000768void SelectionDAGISel::DoInstructionSelection() {
769 DEBUG(errs() << "===== Instruction selection begins:\n");
770
771 PreprocessISelDAG();
772
773 // Select target instructions for the DAG.
774 {
775 // Number all nodes with a topological order and set DAGSize.
776 DAGSize = CurDAG->AssignTopologicalOrder();
777
778 // Create a dummy node (which is not added to allnodes), that adds
779 // a reference to the root node, preventing it from being deleted,
780 // and tracking any changes of the root.
781 HandleSDNode Dummy(CurDAG->getRoot());
782 ISelPosition = SelectionDAG::allnodes_iterator(CurDAG->getRoot().getNode());
783 ++ISelPosition;
784
785 // The AllNodes list is now topological-sorted. Visit the
786 // nodes by starting at the end of the list (the root of the
787 // graph) and preceding back toward the beginning (the entry
788 // node).
789 while (ISelPosition != CurDAG->allnodes_begin()) {
790 SDNode *Node = --ISelPosition;
791 // Skip dead nodes. DAGCombiner is expected to eliminate all dead nodes,
792 // but there are currently some corner cases that it misses. Also, this
793 // makes it theoretically possible to disable the DAGCombiner.
794 if (Node->use_empty())
795 continue;
796
797 SDNode *ResNode = Select(Node);
798
799 // If node should not be replaced, continue with the next one.
800 if (ResNode == Node)
801 continue;
802 // Replace node.
803 if (ResNode)
804 ReplaceUses(Node, ResNode);
805
806 // If after the replacement this node is not used any more,
807 // remove this dead node.
808 if (Node->use_empty()) { // Don't delete EntryToken, etc.
809 ISelUpdater ISU(ISelPosition);
810 CurDAG->RemoveDeadNode(Node, &ISU);
811 }
812 }
813
814 CurDAG->setRoot(Dummy.getValue());
815 }
816 DEBUG(errs() << "===== Instruction selection ends:\n");
817
818 PostprocessISelDAG();
819
820 // FIXME: This shouldn't be needed, remove it.
821 CurDAG->RemoveDeadNodes();
822}
823
824
Dan Gohman79ce2762009-01-15 19:20:50 +0000825void SelectionDAGISel::SelectAllBasicBlocks(Function &Fn,
826 MachineFunction &MF,
Dan Gohmandd5b58a2008-10-14 23:54:11 +0000827 MachineModuleInfo *MMI,
Devang Patel83489bb2009-01-13 00:35:13 +0000828 DwarfWriter *DW,
Dan Gohmandd5b58a2008-10-14 23:54:11 +0000829 const TargetInstrInfo &TII) {
Dan Gohmana43abd12008-09-29 21:55:50 +0000830 // Initialize the Fast-ISel state, if needed.
831 FastISel *FastIS = 0;
832 if (EnableFastISel)
Dan Gohman79ce2762009-01-15 19:20:50 +0000833 FastIS = TLI.createFastISel(MF, MMI, DW,
Dan Gohmana43abd12008-09-29 21:55:50 +0000834 FuncInfo->ValueMap,
835 FuncInfo->MBBMap,
Dan Gohmandd5b58a2008-10-14 23:54:11 +0000836 FuncInfo->StaticAllocaMap
837#ifndef NDEBUG
838 , FuncInfo->CatchInfoLost
839#endif
840 );
Dan Gohmana43abd12008-09-29 21:55:50 +0000841
Chris Lattner08113472009-12-29 09:01:33 +0000842 unsigned MDDbgKind = Fn.getContext().getMDKindID("dbg");
Devang Patel123eaa72009-09-16 20:39:11 +0000843
Dan Gohmana43abd12008-09-29 21:55:50 +0000844 // Iterate over all basic blocks in the function.
Evan Cheng39fd6e82008-08-07 00:43:25 +0000845 for (Function::iterator I = Fn.begin(), E = Fn.end(); I != E; ++I) {
846 BasicBlock *LLVMBB = &*I;
Dan Gohman7c3234c2008-08-27 23:52:12 +0000847 BB = FuncInfo->MBBMap[LLVMBB];
Dan Gohmanf350b272008-08-23 02:25:05 +0000848
Dan Gohman3df24e62008-09-03 23:12:08 +0000849 BasicBlock::iterator const Begin = LLVMBB->begin();
850 BasicBlock::iterator const End = LLVMBB->end();
Evan Cheng9f118502008-09-08 16:01:27 +0000851 BasicBlock::iterator BI = Begin;
Dan Gohman5edd3612008-08-28 20:28:56 +0000852
853 // Lower any arguments needed in this block if this is the entry block.
Dan Gohman33134c42008-09-25 17:05:24 +0000854 bool SuppressFastISel = false;
855 if (LLVMBB == &Fn.getEntryBlock()) {
Dan Gohman5edd3612008-08-28 20:28:56 +0000856 LowerArguments(LLVMBB);
Dan Gohmanf350b272008-08-23 02:25:05 +0000857
Dan Gohman33134c42008-09-25 17:05:24 +0000858 // If any of the arguments has the byval attribute, forgo
859 // fast-isel in the entry block.
Dan Gohmana43abd12008-09-29 21:55:50 +0000860 if (FastIS) {
Dan Gohman33134c42008-09-25 17:05:24 +0000861 unsigned j = 1;
862 for (Function::arg_iterator I = Fn.arg_begin(), E = Fn.arg_end();
863 I != E; ++I, ++j)
Devang Patel05988662008-09-25 21:00:45 +0000864 if (Fn.paramHasAttr(j, Attribute::ByVal)) {
Dan Gohman77ca41e2008-09-25 17:21:42 +0000865 if (EnableFastISelVerbose || EnableFastISelAbort)
David Greene1a053232010-01-05 01:26:11 +0000866 dbgs() << "FastISel skips entry block due to byval argument\n";
Dan Gohman33134c42008-09-25 17:05:24 +0000867 SuppressFastISel = true;
868 break;
869 }
870 }
871 }
872
Dan Gohmandd5b58a2008-10-14 23:54:11 +0000873 if (MMI && BB->isLandingPad()) {
874 // Add a label to mark the beginning of the landing pad. Deletion of the
875 // landing pad can thus be detected via the MachineModuleInfo.
876 unsigned LabelID = MMI->addLandingPad(BB);
877
Chris Lattner518bb532010-02-09 19:54:29 +0000878 const TargetInstrDesc &II = TII.get(TargetOpcode::EH_LABEL);
Dan Gohman2048b852009-11-23 18:04:58 +0000879 BuildMI(BB, SDB->getCurDebugLoc(), II).addImm(LabelID);
Dan Gohmandd5b58a2008-10-14 23:54:11 +0000880
881 // Mark exception register as live in.
882 unsigned Reg = TLI.getExceptionAddressRegister();
883 if (Reg) BB->addLiveIn(Reg);
884
885 // Mark exception selector register as live in.
886 Reg = TLI.getExceptionSelectorRegister();
887 if (Reg) BB->addLiveIn(Reg);
888
889 // FIXME: Hack around an exception handling flaw (PR1508): the personality
890 // function and list of typeids logically belong to the invoke (or, if you
891 // like, the basic block containing the invoke), and need to be associated
892 // with it in the dwarf exception handling tables. Currently however the
893 // information is provided by an intrinsic (eh.selector) that can be moved
894 // to unexpected places by the optimizers: if the unwind edge is critical,
895 // then breaking it can result in the intrinsics being in the successor of
Jim Grosbachf4549b02010-01-15 00:36:15 +0000896 // the landing pad, not the landing pad itself. This results
897 // in exceptions not being caught because no typeids are associated with
898 // the invoke. This may not be the only way things can go wrong, but it
899 // is the only way we try to work around for the moment.
Dan Gohmandd5b58a2008-10-14 23:54:11 +0000900 BranchInst *Br = dyn_cast<BranchInst>(LLVMBB->getTerminator());
901
902 if (Br && Br->isUnconditional()) { // Critical edge?
903 BasicBlock::iterator I, E;
904 for (I = LLVMBB->begin(), E = --LLVMBB->end(); I != E; ++I)
905 if (isa<EHSelectorInst>(I))
906 break;
907
908 if (I == E)
909 // No catch info found - try to extract some from the successor.
Dan Gohman5fca8b12009-11-23 18:12:11 +0000910 CopyCatchInfo(Br->getSuccessor(0), LLVMBB, MMI, *FuncInfo);
Dan Gohmandd5b58a2008-10-14 23:54:11 +0000911 }
912 }
913
Dan Gohmanf350b272008-08-23 02:25:05 +0000914 // Before doing SelectionDAG ISel, see if FastISel has been requested.
Dan Gohmandd5b58a2008-10-14 23:54:11 +0000915 if (FastIS && !SuppressFastISel) {
Dan Gohmana43abd12008-09-29 21:55:50 +0000916 // Emit code for any incoming arguments. This must happen before
917 // beginning FastISel on the entry block.
918 if (LLVMBB == &Fn.getEntryBlock()) {
Dan Gohman2048b852009-11-23 18:04:58 +0000919 CurDAG->setRoot(SDB->getControlRoot());
Dan Gohmana43abd12008-09-29 21:55:50 +0000920 CodeGenAndEmitDAG();
Dan Gohman2048b852009-11-23 18:04:58 +0000921 SDB->clear();
Dan Gohmana43abd12008-09-29 21:55:50 +0000922 }
Dan Gohman241f4642008-10-04 00:56:36 +0000923 FastIS->startNewBlock(BB);
Dan Gohmana43abd12008-09-29 21:55:50 +0000924 // Do FastISel on as many instructions as possible.
925 for (; BI != End; ++BI) {
926 // Just before the terminator instruction, insert instructions to
927 // feed PHI nodes in successor blocks.
928 if (isa<TerminatorInst>(BI))
929 if (!HandlePHINodesInSuccessorBlocksFast(LLVMBB, FastIS)) {
Dan Gohman07f111e2009-12-05 00:27:08 +0000930 ResetDebugLoc(SDB, FastIS);
Dan Gohman4344a5d2008-09-09 23:05:00 +0000931 if (EnableFastISelVerbose || EnableFastISelAbort) {
David Greene1a053232010-01-05 01:26:11 +0000932 dbgs() << "FastISel miss: ";
Dan Gohman293d5f82008-09-09 22:06:46 +0000933 BI->dump();
934 }
Daniel Dunbara279bc32009-09-20 02:20:51 +0000935 assert(!EnableFastISelAbort &&
Torok Edwinf3689232009-07-12 20:07:01 +0000936 "FastISel didn't handle a PHI in a successor");
Dan Gohmana43abd12008-09-29 21:55:50 +0000937 break;
Dan Gohmanf350b272008-08-23 02:25:05 +0000938 }
Dan Gohmana43abd12008-09-29 21:55:50 +0000939
Chris Lattner3990b122009-12-28 23:41:32 +0000940 SetDebugLoc(MDDbgKind, BI, SDB, FastIS, &MF);
Dan Gohman381ca552009-12-05 01:29:04 +0000941
Dan Gohman21c14e32010-01-12 04:32:35 +0000942 // Try to select the instruction with FastISel.
Dan Gohman07f111e2009-12-05 00:27:08 +0000943 if (FastIS->SelectInstruction(BI)) {
944 ResetDebugLoc(SDB, FastIS);
Dan Gohmana43abd12008-09-29 21:55:50 +0000945 continue;
Dan Gohman07f111e2009-12-05 00:27:08 +0000946 }
Dan Gohmana43abd12008-09-29 21:55:50 +0000947
Dan Gohman07f111e2009-12-05 00:27:08 +0000948 // Clear out the debug location so that it doesn't carry over to
949 // unrelated instructions.
950 ResetDebugLoc(SDB, FastIS);
Dan Gohmana43abd12008-09-29 21:55:50 +0000951
952 // Then handle certain instructions as single-LLVM-Instruction blocks.
953 if (isa<CallInst>(BI)) {
954 if (EnableFastISelVerbose || EnableFastISelAbort) {
David Greene1a053232010-01-05 01:26:11 +0000955 dbgs() << "FastISel missed call: ";
Dan Gohmana43abd12008-09-29 21:55:50 +0000956 BI->dump();
957 }
958
Benjamin Kramerf0127052010-01-05 13:12:22 +0000959 if (!BI->getType()->isVoidTy()) {
Dan Gohmana43abd12008-09-29 21:55:50 +0000960 unsigned &R = FuncInfo->ValueMap[BI];
961 if (!R)
962 R = FuncInfo->CreateRegForValue(BI);
963 }
964
Dan Gohmanb4afb132009-11-20 02:51:26 +0000965 bool HadTailCall = false;
Chris Lattner7896c9f2009-12-03 00:50:42 +0000966 SelectBasicBlock(LLVMBB, BI, llvm::next(BI), HadTailCall);
Dan Gohmanb4afb132009-11-20 02:51:26 +0000967
968 // If the call was emitted as a tail call, we're done with the block.
969 if (HadTailCall) {
970 BI = End;
971 break;
972 }
973
Dan Gohman241f4642008-10-04 00:56:36 +0000974 // If the instruction was codegen'd with multiple blocks,
975 // inform the FastISel object where to resume inserting.
976 FastIS->setCurrentBlock(BB);
Dan Gohmana43abd12008-09-29 21:55:50 +0000977 continue;
Dan Gohmanf350b272008-08-23 02:25:05 +0000978 }
Dan Gohmana43abd12008-09-29 21:55:50 +0000979
980 // Otherwise, give up on FastISel for the rest of the block.
981 // For now, be a little lenient about non-branch terminators.
982 if (!isa<TerminatorInst>(BI) || isa<BranchInst>(BI)) {
983 if (EnableFastISelVerbose || EnableFastISelAbort) {
David Greene1a053232010-01-05 01:26:11 +0000984 dbgs() << "FastISel miss: ";
Dan Gohmana43abd12008-09-29 21:55:50 +0000985 BI->dump();
986 }
987 if (EnableFastISelAbort)
988 // The "fast" selector couldn't handle something and bailed.
989 // For the purpose of debugging, just abort.
Torok Edwinc23197a2009-07-14 16:55:14 +0000990 llvm_unreachable("FastISel didn't select the entire block");
Dan Gohmana43abd12008-09-29 21:55:50 +0000991 }
992 break;
Dan Gohmanf350b272008-08-23 02:25:05 +0000993 }
994 }
995
Dan Gohmand2ff6472008-09-02 20:17:56 +0000996 // Run SelectionDAG instruction selection on the remainder of the block
997 // not handled by FastISel. If FastISel is not run, this is the entire
Dan Gohman3df24e62008-09-03 23:12:08 +0000998 // block.
Devang Patel390f3ac2009-04-16 01:33:10 +0000999 if (BI != End) {
Dan Gohmanb4afb132009-11-20 02:51:26 +00001000 bool HadTailCall;
1001 SelectBasicBlock(LLVMBB, BI, End, HadTailCall);
Devang Patel390f3ac2009-04-16 01:33:10 +00001002 }
Dan Gohmanf350b272008-08-23 02:25:05 +00001003
Dan Gohman7c3234c2008-08-27 23:52:12 +00001004 FinishBasicBlock();
Evan Cheng39fd6e82008-08-07 00:43:25 +00001005 }
Dan Gohmana43abd12008-09-29 21:55:50 +00001006
1007 delete FastIS;
Dan Gohman0e5f1302008-07-07 23:02:41 +00001008}
1009
Dan Gohmanfed90b62008-07-28 21:51:04 +00001010void
Dan Gohman7c3234c2008-08-27 23:52:12 +00001011SelectionDAGISel::FinishBasicBlock() {
Dan Gohmanf350b272008-08-23 02:25:05 +00001012
David Greene1a053232010-01-05 01:26:11 +00001013 DEBUG(dbgs() << "Target-post-processed machine code:\n");
Dan Gohmanf350b272008-08-23 02:25:05 +00001014 DEBUG(BB->dump());
Nate Begemanf15485a2006-03-27 01:32:24 +00001015
David Greene1a053232010-01-05 01:26:11 +00001016 DEBUG(dbgs() << "Total amount of phi nodes to update: "
Dan Gohman2048b852009-11-23 18:04:58 +00001017 << SDB->PHINodesToUpdate.size() << "\n");
1018 DEBUG(for (unsigned i = 0, e = SDB->PHINodesToUpdate.size(); i != e; ++i)
David Greene1a053232010-01-05 01:26:11 +00001019 dbgs() << "Node " << i << " : ("
Dan Gohman2048b852009-11-23 18:04:58 +00001020 << SDB->PHINodesToUpdate[i].first
1021 << ", " << SDB->PHINodesToUpdate[i].second << ")\n");
Daniel Dunbara279bc32009-09-20 02:20:51 +00001022
Chris Lattnera33ef482005-03-30 01:10:47 +00001023 // Next, now that we know what the last MBB the LLVM BB expanded is, update
Chris Lattner1c08c712005-01-07 07:47:53 +00001024 // PHI nodes in successors.
Dan Gohman2048b852009-11-23 18:04:58 +00001025 if (SDB->SwitchCases.empty() &&
1026 SDB->JTCases.empty() &&
1027 SDB->BitTestCases.empty()) {
1028 for (unsigned i = 0, e = SDB->PHINodesToUpdate.size(); i != e; ++i) {
1029 MachineInstr *PHI = SDB->PHINodesToUpdate[i].first;
Chris Lattner518bb532010-02-09 19:54:29 +00001030 assert(PHI->isPHI() &&
Nate Begemanf15485a2006-03-27 01:32:24 +00001031 "This is not a machine PHI node that we are updating!");
Dan Gohman2048b852009-11-23 18:04:58 +00001032 PHI->addOperand(MachineOperand::CreateReg(SDB->PHINodesToUpdate[i].second,
Chris Lattner9ce2e9d2007-12-30 00:57:42 +00001033 false));
1034 PHI->addOperand(MachineOperand::CreateMBB(BB));
Nate Begemanf15485a2006-03-27 01:32:24 +00001035 }
Dan Gohman2048b852009-11-23 18:04:58 +00001036 SDB->PHINodesToUpdate.clear();
Nate Begemanf15485a2006-03-27 01:32:24 +00001037 return;
Chris Lattner1c08c712005-01-07 07:47:53 +00001038 }
Anton Korobeynikov4198c582007-04-09 12:31:58 +00001039
Dan Gohman2048b852009-11-23 18:04:58 +00001040 for (unsigned i = 0, e = SDB->BitTestCases.size(); i != e; ++i) {
Anton Korobeynikov4198c582007-04-09 12:31:58 +00001041 // Lower header first, if it wasn't already lowered
Dan Gohman2048b852009-11-23 18:04:58 +00001042 if (!SDB->BitTestCases[i].Emitted) {
Anton Korobeynikov4198c582007-04-09 12:31:58 +00001043 // Set the current basic block to the mbb we wish to insert the code into
Dan Gohman2048b852009-11-23 18:04:58 +00001044 BB = SDB->BitTestCases[i].Parent;
1045 SDB->setCurrentBasicBlock(BB);
Anton Korobeynikov4198c582007-04-09 12:31:58 +00001046 // Emit the code
Dan Gohman2048b852009-11-23 18:04:58 +00001047 SDB->visitBitTestHeader(SDB->BitTestCases[i]);
1048 CurDAG->setRoot(SDB->getRoot());
Dan Gohmanf350b272008-08-23 02:25:05 +00001049 CodeGenAndEmitDAG();
Dan Gohman2048b852009-11-23 18:04:58 +00001050 SDB->clear();
Daniel Dunbara279bc32009-09-20 02:20:51 +00001051 }
Anton Korobeynikov4198c582007-04-09 12:31:58 +00001052
Dan Gohman2048b852009-11-23 18:04:58 +00001053 for (unsigned j = 0, ej = SDB->BitTestCases[i].Cases.size(); j != ej; ++j) {
Anton Korobeynikov4198c582007-04-09 12:31:58 +00001054 // Set the current basic block to the mbb we wish to insert the code into
Dan Gohman2048b852009-11-23 18:04:58 +00001055 BB = SDB->BitTestCases[i].Cases[j].ThisBB;
1056 SDB->setCurrentBasicBlock(BB);
Anton Korobeynikov4198c582007-04-09 12:31:58 +00001057 // Emit the code
1058 if (j+1 != ej)
Dan Gohman2048b852009-11-23 18:04:58 +00001059 SDB->visitBitTestCase(SDB->BitTestCases[i].Cases[j+1].ThisBB,
1060 SDB->BitTestCases[i].Reg,
1061 SDB->BitTestCases[i].Cases[j]);
Anton Korobeynikov4198c582007-04-09 12:31:58 +00001062 else
Dan Gohman2048b852009-11-23 18:04:58 +00001063 SDB->visitBitTestCase(SDB->BitTestCases[i].Default,
1064 SDB->BitTestCases[i].Reg,
1065 SDB->BitTestCases[i].Cases[j]);
Daniel Dunbara279bc32009-09-20 02:20:51 +00001066
1067
Dan Gohman2048b852009-11-23 18:04:58 +00001068 CurDAG->setRoot(SDB->getRoot());
Dan Gohmanf350b272008-08-23 02:25:05 +00001069 CodeGenAndEmitDAG();
Dan Gohman2048b852009-11-23 18:04:58 +00001070 SDB->clear();
Anton Korobeynikov4198c582007-04-09 12:31:58 +00001071 }
1072
1073 // Update PHI Nodes
Dan Gohman2048b852009-11-23 18:04:58 +00001074 for (unsigned pi = 0, pe = SDB->PHINodesToUpdate.size(); pi != pe; ++pi) {
1075 MachineInstr *PHI = SDB->PHINodesToUpdate[pi].first;
Anton Korobeynikov4198c582007-04-09 12:31:58 +00001076 MachineBasicBlock *PHIBB = PHI->getParent();
Chris Lattner518bb532010-02-09 19:54:29 +00001077 assert(PHI->isPHI() &&
Anton Korobeynikov4198c582007-04-09 12:31:58 +00001078 "This is not a machine PHI node that we are updating!");
1079 // This is "default" BB. We have two jumps to it. From "header" BB and
1080 // from last "case" BB.
Dan Gohman2048b852009-11-23 18:04:58 +00001081 if (PHIBB == SDB->BitTestCases[i].Default) {
Jim Grosbachf4549b02010-01-15 00:36:15 +00001082 PHI->addOperand(MachineOperand::
1083 CreateReg(SDB->PHINodesToUpdate[pi].second, false));
Dan Gohman2048b852009-11-23 18:04:58 +00001084 PHI->addOperand(MachineOperand::CreateMBB(SDB->BitTestCases[i].Parent));
Jim Grosbachf4549b02010-01-15 00:36:15 +00001085 PHI->addOperand(MachineOperand::
1086 CreateReg(SDB->PHINodesToUpdate[pi].second, false));
Dan Gohman2048b852009-11-23 18:04:58 +00001087 PHI->addOperand(MachineOperand::CreateMBB(SDB->BitTestCases[i].Cases.
Chris Lattner9ce2e9d2007-12-30 00:57:42 +00001088 back().ThisBB));
Anton Korobeynikov4198c582007-04-09 12:31:58 +00001089 }
1090 // One of "cases" BB.
Dan Gohman2048b852009-11-23 18:04:58 +00001091 for (unsigned j = 0, ej = SDB->BitTestCases[i].Cases.size();
Dan Gohman7c3234c2008-08-27 23:52:12 +00001092 j != ej; ++j) {
Dan Gohman2048b852009-11-23 18:04:58 +00001093 MachineBasicBlock* cBB = SDB->BitTestCases[i].Cases[j].ThisBB;
Jakob Stoklund Olesendd437ba2010-01-11 21:02:33 +00001094 if (cBB->isSuccessor(PHIBB)) {
Jim Grosbachf4549b02010-01-15 00:36:15 +00001095 PHI->addOperand(MachineOperand::
1096 CreateReg(SDB->PHINodesToUpdate[pi].second, false));
Chris Lattner9ce2e9d2007-12-30 00:57:42 +00001097 PHI->addOperand(MachineOperand::CreateMBB(cBB));
Anton Korobeynikov4198c582007-04-09 12:31:58 +00001098 }
1099 }
1100 }
1101 }
Dan Gohman2048b852009-11-23 18:04:58 +00001102 SDB->BitTestCases.clear();
Anton Korobeynikov4198c582007-04-09 12:31:58 +00001103
Nate Begeman9453eea2006-04-23 06:26:20 +00001104 // If the JumpTable record is filled in, then we need to emit a jump table.
1105 // Updating the PHI nodes is tricky in this case, since we need to determine
1106 // whether the PHI is a successor of the range check MBB or the jump table MBB
Dan Gohman2048b852009-11-23 18:04:58 +00001107 for (unsigned i = 0, e = SDB->JTCases.size(); i != e; ++i) {
Anton Korobeynikov3a84b9b2007-03-25 15:07:15 +00001108 // Lower header first, if it wasn't already lowered
Dan Gohman2048b852009-11-23 18:04:58 +00001109 if (!SDB->JTCases[i].first.Emitted) {
Anton Korobeynikov3a84b9b2007-03-25 15:07:15 +00001110 // Set the current basic block to the mbb we wish to insert the code into
Dan Gohman2048b852009-11-23 18:04:58 +00001111 BB = SDB->JTCases[i].first.HeaderBB;
1112 SDB->setCurrentBasicBlock(BB);
Anton Korobeynikov3a84b9b2007-03-25 15:07:15 +00001113 // Emit the code
Dan Gohman2048b852009-11-23 18:04:58 +00001114 SDB->visitJumpTableHeader(SDB->JTCases[i].second, SDB->JTCases[i].first);
1115 CurDAG->setRoot(SDB->getRoot());
Dan Gohmanf350b272008-08-23 02:25:05 +00001116 CodeGenAndEmitDAG();
Dan Gohman2048b852009-11-23 18:04:58 +00001117 SDB->clear();
Anton Korobeynikov4198c582007-04-09 12:31:58 +00001118 }
Daniel Dunbara279bc32009-09-20 02:20:51 +00001119
Nate Begeman37efe672006-04-22 18:53:45 +00001120 // Set the current basic block to the mbb we wish to insert the code into
Dan Gohman2048b852009-11-23 18:04:58 +00001121 BB = SDB->JTCases[i].second.MBB;
1122 SDB->setCurrentBasicBlock(BB);
Nate Begeman37efe672006-04-22 18:53:45 +00001123 // Emit the code
Dan Gohman2048b852009-11-23 18:04:58 +00001124 SDB->visitJumpTable(SDB->JTCases[i].second);
1125 CurDAG->setRoot(SDB->getRoot());
Dan Gohmanf350b272008-08-23 02:25:05 +00001126 CodeGenAndEmitDAG();
Dan Gohman2048b852009-11-23 18:04:58 +00001127 SDB->clear();
Daniel Dunbara279bc32009-09-20 02:20:51 +00001128
Nate Begeman37efe672006-04-22 18:53:45 +00001129 // Update PHI Nodes
Dan Gohman2048b852009-11-23 18:04:58 +00001130 for (unsigned pi = 0, pe = SDB->PHINodesToUpdate.size(); pi != pe; ++pi) {
1131 MachineInstr *PHI = SDB->PHINodesToUpdate[pi].first;
Nate Begeman37efe672006-04-22 18:53:45 +00001132 MachineBasicBlock *PHIBB = PHI->getParent();
Chris Lattner518bb532010-02-09 19:54:29 +00001133 assert(PHI->isPHI() &&
Nate Begeman37efe672006-04-22 18:53:45 +00001134 "This is not a machine PHI node that we are updating!");
Anton Korobeynikov4198c582007-04-09 12:31:58 +00001135 // "default" BB. We can go there only from header BB.
Dan Gohman2048b852009-11-23 18:04:58 +00001136 if (PHIBB == SDB->JTCases[i].second.Default) {
Evan Chengce319102009-09-19 09:51:03 +00001137 PHI->addOperand
Dan Gohman2048b852009-11-23 18:04:58 +00001138 (MachineOperand::CreateReg(SDB->PHINodesToUpdate[pi].second, false));
Evan Chengce319102009-09-19 09:51:03 +00001139 PHI->addOperand
Dan Gohman2048b852009-11-23 18:04:58 +00001140 (MachineOperand::CreateMBB(SDB->JTCases[i].first.HeaderBB));
Nate Begemanf4360a42006-05-03 03:48:02 +00001141 }
Anton Korobeynikov4198c582007-04-09 12:31:58 +00001142 // JT BB. Just iterate over successors here
Jakob Stoklund Olesendd437ba2010-01-11 21:02:33 +00001143 if (BB->isSuccessor(PHIBB)) {
Evan Chengce319102009-09-19 09:51:03 +00001144 PHI->addOperand
Dan Gohman2048b852009-11-23 18:04:58 +00001145 (MachineOperand::CreateReg(SDB->PHINodesToUpdate[pi].second, false));
Chris Lattner9ce2e9d2007-12-30 00:57:42 +00001146 PHI->addOperand(MachineOperand::CreateMBB(BB));
Nate Begeman37efe672006-04-22 18:53:45 +00001147 }
1148 }
Nate Begeman37efe672006-04-22 18:53:45 +00001149 }
Dan Gohman2048b852009-11-23 18:04:58 +00001150 SDB->JTCases.clear();
Daniel Dunbara279bc32009-09-20 02:20:51 +00001151
Chris Lattnerb2e806e2006-10-22 23:00:53 +00001152 // If the switch block involved a branch to one of the actual successors, we
1153 // need to update PHI nodes in that block.
Dan Gohman2048b852009-11-23 18:04:58 +00001154 for (unsigned i = 0, e = SDB->PHINodesToUpdate.size(); i != e; ++i) {
1155 MachineInstr *PHI = SDB->PHINodesToUpdate[i].first;
Chris Lattner518bb532010-02-09 19:54:29 +00001156 assert(PHI->isPHI() &&
Chris Lattnerb2e806e2006-10-22 23:00:53 +00001157 "This is not a machine PHI node that we are updating!");
1158 if (BB->isSuccessor(PHI->getParent())) {
Dan Gohman2048b852009-11-23 18:04:58 +00001159 PHI->addOperand(MachineOperand::CreateReg(SDB->PHINodesToUpdate[i].second,
Chris Lattner9ce2e9d2007-12-30 00:57:42 +00001160 false));
1161 PHI->addOperand(MachineOperand::CreateMBB(BB));
Chris Lattnerb2e806e2006-10-22 23:00:53 +00001162 }
1163 }
Daniel Dunbara279bc32009-09-20 02:20:51 +00001164
Nate Begemanf15485a2006-03-27 01:32:24 +00001165 // If we generated any switch lowering information, build and codegen any
1166 // additional DAGs necessary.
Dan Gohman2048b852009-11-23 18:04:58 +00001167 for (unsigned i = 0, e = SDB->SwitchCases.size(); i != e; ++i) {
Nate Begemanf15485a2006-03-27 01:32:24 +00001168 // Set the current basic block to the mbb we wish to insert the code into
Dan Gohman2048b852009-11-23 18:04:58 +00001169 MachineBasicBlock *ThisBB = BB = SDB->SwitchCases[i].ThisBB;
1170 SDB->setCurrentBasicBlock(BB);
Daniel Dunbara279bc32009-09-20 02:20:51 +00001171
Nate Begemanf15485a2006-03-27 01:32:24 +00001172 // Emit the code
Dan Gohman2048b852009-11-23 18:04:58 +00001173 SDB->visitSwitchCase(SDB->SwitchCases[i]);
1174 CurDAG->setRoot(SDB->getRoot());
Dan Gohmanf350b272008-08-23 02:25:05 +00001175 CodeGenAndEmitDAG();
Daniel Dunbara279bc32009-09-20 02:20:51 +00001176
Chris Lattnerd5e93c02006-09-07 01:59:34 +00001177 // Handle any PHI nodes in successors of this chunk, as if we were coming
1178 // from the original BB before switch expansion. Note that PHI nodes can
1179 // occur multiple times in PHINodesToUpdate. We have to be very careful to
1180 // handle them the right number of times.
Dan Gohman2048b852009-11-23 18:04:58 +00001181 while ((BB = SDB->SwitchCases[i].TrueBB)) { // Handle LHS and RHS.
Evan Chengfb2e7522009-09-18 21:02:19 +00001182 // If new BB's are created during scheduling, the edges may have been
Evan Chengce319102009-09-19 09:51:03 +00001183 // updated. That is, the edge from ThisBB to BB may have been split and
1184 // BB's predecessor is now another block.
Evan Chengfb2e7522009-09-18 21:02:19 +00001185 DenseMap<MachineBasicBlock*, MachineBasicBlock*>::iterator EI =
Dan Gohman2048b852009-11-23 18:04:58 +00001186 SDB->EdgeMapping.find(BB);
1187 if (EI != SDB->EdgeMapping.end())
Evan Chengfb2e7522009-09-18 21:02:19 +00001188 ThisBB = EI->second;
Jakob Stoklund Olesendd437ba2010-01-11 21:02:33 +00001189
1190 // BB may have been removed from the CFG if a branch was constant folded.
1191 if (ThisBB->isSuccessor(BB)) {
1192 for (MachineBasicBlock::iterator Phi = BB->begin();
Chris Lattner518bb532010-02-09 19:54:29 +00001193 Phi != BB->end() && Phi->isPHI();
Jakob Stoklund Olesendd437ba2010-01-11 21:02:33 +00001194 ++Phi) {
1195 // This value for this PHI node is recorded in PHINodesToUpdate.
1196 for (unsigned pn = 0; ; ++pn) {
1197 assert(pn != SDB->PHINodesToUpdate.size() &&
1198 "Didn't find PHI entry!");
1199 if (SDB->PHINodesToUpdate[pn].first == Phi) {
1200 Phi->addOperand(MachineOperand::
1201 CreateReg(SDB->PHINodesToUpdate[pn].second,
1202 false));
1203 Phi->addOperand(MachineOperand::CreateMBB(ThisBB));
1204 break;
1205 }
Evan Cheng8be58a12009-09-18 08:26:06 +00001206 }
Chris Lattnerd5e93c02006-09-07 01:59:34 +00001207 }
Nate Begemanf15485a2006-03-27 01:32:24 +00001208 }
Daniel Dunbara279bc32009-09-20 02:20:51 +00001209
Chris Lattnerd5e93c02006-09-07 01:59:34 +00001210 // Don't process RHS if same block as LHS.
Dan Gohman2048b852009-11-23 18:04:58 +00001211 if (BB == SDB->SwitchCases[i].FalseBB)
1212 SDB->SwitchCases[i].FalseBB = 0;
Daniel Dunbara279bc32009-09-20 02:20:51 +00001213
Chris Lattnerd5e93c02006-09-07 01:59:34 +00001214 // If we haven't handled the RHS, do so now. Otherwise, we're done.
Dan Gohman2048b852009-11-23 18:04:58 +00001215 SDB->SwitchCases[i].TrueBB = SDB->SwitchCases[i].FalseBB;
1216 SDB->SwitchCases[i].FalseBB = 0;
Nate Begemanf15485a2006-03-27 01:32:24 +00001217 }
Dan Gohman2048b852009-11-23 18:04:58 +00001218 assert(SDB->SwitchCases[i].TrueBB == 0 && SDB->SwitchCases[i].FalseBB == 0);
1219 SDB->clear();
Chris Lattnera33ef482005-03-30 01:10:47 +00001220 }
Dan Gohman2048b852009-11-23 18:04:58 +00001221 SDB->SwitchCases.clear();
Dan Gohman7c3234c2008-08-27 23:52:12 +00001222
Dan Gohman2048b852009-11-23 18:04:58 +00001223 SDB->PHINodesToUpdate.clear();
Chris Lattner1c08c712005-01-07 07:47:53 +00001224}
Evan Chenga9c20912006-01-21 02:32:06 +00001225
Jim Laskey13ec7022006-08-01 14:21:23 +00001226
Dan Gohman0a3776d2009-02-06 18:26:51 +00001227/// Create the scheduler. If a specific scheduler was specified
1228/// via the SchedulerRegistry, use it, otherwise select the
1229/// one preferred by the target.
Dan Gohman5e843682008-07-14 18:19:29 +00001230///
Dan Gohman47ac0f02009-02-11 04:27:20 +00001231ScheduleDAGSDNodes *SelectionDAGISel::CreateScheduler() {
Jim Laskeyeb577ba2006-08-02 12:30:23 +00001232 RegisterScheduler::FunctionPassCtor Ctor = RegisterScheduler::getDefault();
Daniel Dunbara279bc32009-09-20 02:20:51 +00001233
Jim Laskey13ec7022006-08-01 14:21:23 +00001234 if (!Ctor) {
Jim Laskeyeb577ba2006-08-02 12:30:23 +00001235 Ctor = ISHeuristic;
Jim Laskey9373beb2006-08-01 19:14:14 +00001236 RegisterScheduler::setDefault(Ctor);
Evan Cheng4ef10862006-01-23 07:01:07 +00001237 }
Daniel Dunbara279bc32009-09-20 02:20:51 +00001238
Bill Wendlingbe8cc2a2009-04-29 00:15:41 +00001239 return Ctor(this, OptLevel);
Evan Chenga9c20912006-01-21 02:32:06 +00001240}
Chris Lattner0e43f2b2006-02-24 02:13:54 +00001241
Dan Gohmanfc54c552009-01-15 22:18:12 +00001242ScheduleHazardRecognizer *SelectionDAGISel::CreateTargetHazardRecognizer() {
1243 return new ScheduleHazardRecognizer();
Jim Laskey9ff542f2006-08-01 18:29:48 +00001244}
1245
Chris Lattner75548062006-10-11 03:58:02 +00001246//===----------------------------------------------------------------------===//
1247// Helper functions used by the generated instruction selector.
1248//===----------------------------------------------------------------------===//
1249// Calls to these methods are generated by tblgen.
1250
1251/// CheckAndMask - The isel is trying to match something like (and X, 255). If
1252/// the dag combiner simplified the 255, we still want to match. RHS is the
1253/// actual value in the DAG on the RHS of an AND, and DesiredMaskS is the value
1254/// specified in the .td file (e.g. 255).
Daniel Dunbara279bc32009-09-20 02:20:51 +00001255bool SelectionDAGISel::CheckAndMask(SDValue LHS, ConstantSDNode *RHS,
Dan Gohmandc9b3d02007-07-24 23:00:27 +00001256 int64_t DesiredMaskS) const {
Dan Gohman2e68b6f2008-02-25 21:11:39 +00001257 const APInt &ActualMask = RHS->getAPIntValue();
1258 const APInt &DesiredMask = APInt(LHS.getValueSizeInBits(), DesiredMaskS);
Daniel Dunbara279bc32009-09-20 02:20:51 +00001259
Chris Lattner75548062006-10-11 03:58:02 +00001260 // If the actual mask exactly matches, success!
1261 if (ActualMask == DesiredMask)
1262 return true;
Daniel Dunbara279bc32009-09-20 02:20:51 +00001263
Chris Lattner75548062006-10-11 03:58:02 +00001264 // If the actual AND mask is allowing unallowed bits, this doesn't match.
Dan Gohman2e68b6f2008-02-25 21:11:39 +00001265 if (ActualMask.intersects(~DesiredMask))
Chris Lattner75548062006-10-11 03:58:02 +00001266 return false;
Daniel Dunbara279bc32009-09-20 02:20:51 +00001267
Chris Lattner75548062006-10-11 03:58:02 +00001268 // Otherwise, the DAG Combiner may have proven that the value coming in is
1269 // either already zero or is not demanded. Check for known zero input bits.
Dan Gohman2e68b6f2008-02-25 21:11:39 +00001270 APInt NeededMask = DesiredMask & ~ActualMask;
Dan Gohmanea859be2007-06-22 14:59:07 +00001271 if (CurDAG->MaskedValueIsZero(LHS, NeededMask))
Chris Lattner75548062006-10-11 03:58:02 +00001272 return true;
Daniel Dunbara279bc32009-09-20 02:20:51 +00001273
Chris Lattner75548062006-10-11 03:58:02 +00001274 // TODO: check to see if missing bits are just not demanded.
1275
1276 // Otherwise, this pattern doesn't match.
1277 return false;
1278}
1279
1280/// CheckOrMask - The isel is trying to match something like (or X, 255). If
1281/// the dag combiner simplified the 255, we still want to match. RHS is the
1282/// actual value in the DAG on the RHS of an OR, and DesiredMaskS is the value
1283/// specified in the .td file (e.g. 255).
Daniel Dunbara279bc32009-09-20 02:20:51 +00001284bool SelectionDAGISel::CheckOrMask(SDValue LHS, ConstantSDNode *RHS,
Dan Gohman2e68b6f2008-02-25 21:11:39 +00001285 int64_t DesiredMaskS) const {
1286 const APInt &ActualMask = RHS->getAPIntValue();
1287 const APInt &DesiredMask = APInt(LHS.getValueSizeInBits(), DesiredMaskS);
Daniel Dunbara279bc32009-09-20 02:20:51 +00001288
Chris Lattner75548062006-10-11 03:58:02 +00001289 // If the actual mask exactly matches, success!
1290 if (ActualMask == DesiredMask)
1291 return true;
Daniel Dunbara279bc32009-09-20 02:20:51 +00001292
Chris Lattner75548062006-10-11 03:58:02 +00001293 // If the actual AND mask is allowing unallowed bits, this doesn't match.
Dan Gohman2e68b6f2008-02-25 21:11:39 +00001294 if (ActualMask.intersects(~DesiredMask))
Chris Lattner75548062006-10-11 03:58:02 +00001295 return false;
Daniel Dunbara279bc32009-09-20 02:20:51 +00001296
Chris Lattner75548062006-10-11 03:58:02 +00001297 // Otherwise, the DAG Combiner may have proven that the value coming in is
1298 // either already zero or is not demanded. Check for known zero input bits.
Dan Gohman2e68b6f2008-02-25 21:11:39 +00001299 APInt NeededMask = DesiredMask & ~ActualMask;
Daniel Dunbara279bc32009-09-20 02:20:51 +00001300
Dan Gohman2e68b6f2008-02-25 21:11:39 +00001301 APInt KnownZero, KnownOne;
Dan Gohmanea859be2007-06-22 14:59:07 +00001302 CurDAG->ComputeMaskedBits(LHS, NeededMask, KnownZero, KnownOne);
Daniel Dunbara279bc32009-09-20 02:20:51 +00001303
Chris Lattner75548062006-10-11 03:58:02 +00001304 // If all the missing bits in the or are already known to be set, match!
1305 if ((NeededMask & KnownOne) == NeededMask)
1306 return true;
Daniel Dunbara279bc32009-09-20 02:20:51 +00001307
Chris Lattner75548062006-10-11 03:58:02 +00001308 // TODO: check to see if missing bits are just not demanded.
Daniel Dunbara279bc32009-09-20 02:20:51 +00001309
Chris Lattner75548062006-10-11 03:58:02 +00001310 // Otherwise, this pattern doesn't match.
1311 return false;
1312}
1313
Jim Laskey9ff542f2006-08-01 18:29:48 +00001314
Chris Lattner0e43f2b2006-02-24 02:13:54 +00001315/// SelectInlineAsmMemoryOperands - Calls to this are automatically generated
1316/// by tblgen. Others should not call it.
1317void SelectionDAGISel::
Dan Gohmanf350b272008-08-23 02:25:05 +00001318SelectInlineAsmMemoryOperands(std::vector<SDValue> &Ops) {
Dan Gohman475871a2008-07-27 21:46:04 +00001319 std::vector<SDValue> InOps;
Chris Lattner0e43f2b2006-02-24 02:13:54 +00001320 std::swap(InOps, Ops);
1321
1322 Ops.push_back(InOps[0]); // input chain.
1323 Ops.push_back(InOps[1]); // input asm string.
1324
Chris Lattner0e43f2b2006-02-24 02:13:54 +00001325 unsigned i = 2, e = InOps.size();
Owen Anderson825b72b2009-08-11 20:47:22 +00001326 if (InOps[e-1].getValueType() == MVT::Flag)
Chris Lattner0e43f2b2006-02-24 02:13:54 +00001327 --e; // Don't process a flag operand if it is here.
Daniel Dunbara279bc32009-09-20 02:20:51 +00001328
Chris Lattner0e43f2b2006-02-24 02:13:54 +00001329 while (i != e) {
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001330 unsigned Flags = cast<ConstantSDNode>(InOps[i])->getZExtValue();
Dale Johannesen86b49f82008-09-24 01:07:17 +00001331 if ((Flags & 7) != 4 /*MEM*/) {
Chris Lattner0e43f2b2006-02-24 02:13:54 +00001332 // Just skip over this operand, copying the operands verbatim.
Evan Cheng697cbbf2009-03-20 18:03:34 +00001333 Ops.insert(Ops.end(), InOps.begin()+i,
1334 InOps.begin()+i+InlineAsm::getNumOperandRegisters(Flags) + 1);
1335 i += InlineAsm::getNumOperandRegisters(Flags) + 1;
Chris Lattner0e43f2b2006-02-24 02:13:54 +00001336 } else {
Evan Cheng697cbbf2009-03-20 18:03:34 +00001337 assert(InlineAsm::getNumOperandRegisters(Flags) == 1 &&
1338 "Memory operand with multiple values?");
Chris Lattner0e43f2b2006-02-24 02:13:54 +00001339 // Otherwise, this is a memory operand. Ask the target to select it.
Dan Gohman475871a2008-07-27 21:46:04 +00001340 std::vector<SDValue> SelOps;
Dan Gohmanf350b272008-08-23 02:25:05 +00001341 if (SelectInlineAsmMemoryOperand(InOps[i+1], 'm', SelOps)) {
Torok Edwin7d696d82009-07-11 13:10:19 +00001342 llvm_report_error("Could not match memory address. Inline asm"
1343 " failure!");
Chris Lattner0e43f2b2006-02-24 02:13:54 +00001344 }
Daniel Dunbara279bc32009-09-20 02:20:51 +00001345
Chris Lattner0e43f2b2006-02-24 02:13:54 +00001346 // Add this to the output node.
Dale Johannesen86b49f82008-09-24 01:07:17 +00001347 Ops.push_back(CurDAG->getTargetConstant(4/*MEM*/ | (SelOps.size()<< 3),
Dale Johannesen99499332009-12-23 07:32:51 +00001348 MVT::i32));
Chris Lattner0e43f2b2006-02-24 02:13:54 +00001349 Ops.insert(Ops.end(), SelOps.begin(), SelOps.end());
1350 i += 2;
1351 }
1352 }
Daniel Dunbara279bc32009-09-20 02:20:51 +00001353
Chris Lattner0e43f2b2006-02-24 02:13:54 +00001354 // Add the flag input back if present.
1355 if (e != InOps.size())
1356 Ops.push_back(InOps.back());
1357}
Devang Patel794fd752007-05-01 21:15:47 +00001358
Owen Andersone50ed302009-08-10 22:56:29 +00001359/// findFlagUse - Return use of EVT::Flag value produced by the specified
Anton Korobeynikovc1c6ef82009-05-08 18:51:58 +00001360/// SDNode.
1361///
1362static SDNode *findFlagUse(SDNode *N) {
1363 unsigned FlagResNo = N->getNumValues()-1;
1364 for (SDNode::use_iterator I = N->use_begin(), E = N->use_end(); I != E; ++I) {
1365 SDUse &Use = I.getUse();
1366 if (Use.getResNo() == FlagResNo)
1367 return Use.getUser();
1368 }
1369 return NULL;
1370}
1371
1372/// findNonImmUse - Return true if "Use" is a non-immediate use of "Def".
1373/// This function recursively traverses up the operand chain, ignoring
1374/// certain nodes.
1375static bool findNonImmUse(SDNode *Use, SDNode* Def, SDNode *ImmedUse,
1376 SDNode *Root,
1377 SmallPtrSet<SDNode*, 16> &Visited) {
Chris Lattnerda244a02010-02-23 19:32:27 +00001378 // The NodeID's are given uniques ID's where a node ID is guaranteed to be
1379 // greater than all of its (recursive) operands. If we scan to a point where
1380 // 'use' is smaller than the node we're scanning for, then we know we will
1381 // never find it.
1382 //
1383 // The Use may be -1 (unassigned) if it is a newly allocated node. This can
1384 // happen because we scan down to newly selected nodes in the case of flag
1385 // uses.
1386 if ((Use->getNodeId() < Def->getNodeId() && Use->getNodeId() != -1))
1387 return false;
1388
1389 // Don't revisit nodes if we already scanned it and didn't fail, we know we
1390 // won't fail if we scan it again.
1391 if (!Visited.insert(Use))
Anton Korobeynikovc1c6ef82009-05-08 18:51:58 +00001392 return false;
1393
1394 for (unsigned i = 0, e = Use->getNumOperands(); i != e; ++i) {
1395 SDNode *N = Use->getOperand(i).getNode();
1396 if (N == Def) {
1397 if (Use == ImmedUse || Use == Root)
1398 continue; // We are not looking for immediate use.
1399 assert(N != Root);
1400 return true;
1401 }
1402
1403 // Traverse up the operand chain.
1404 if (findNonImmUse(N, Def, ImmedUse, Root, Visited))
1405 return true;
1406 }
1407 return false;
1408}
1409
1410/// isNonImmUse - Start searching from Root up the DAG to check is Def can
1411/// be reached. Return true if that's the case. However, ignore direct uses
1412/// by ImmedUse (which would be U in the example illustrated in
Evan Cheng014bf212010-02-15 19:41:07 +00001413/// IsLegalToFold) and by Root (which can happen in the store case).
Anton Korobeynikovc1c6ef82009-05-08 18:51:58 +00001414/// FIXME: to be really generic, we should allow direct use by any node
1415/// that is being folded. But realisticly since we only fold loads which
1416/// have one non-chain use, we only need to watch out for load/op/store
1417/// and load/op/cmp case where the root (store / cmp) may reach the load via
1418/// its chain operand.
1419static inline bool isNonImmUse(SDNode *Root, SDNode *Def, SDNode *ImmedUse) {
1420 SmallPtrSet<SDNode*, 16> Visited;
1421 return findNonImmUse(Root, Def, ImmedUse, Root, Visited);
1422}
1423
Evan Cheng014bf212010-02-15 19:41:07 +00001424/// IsProfitableToFold - Returns true if it's profitable to fold the specific
1425/// operand node N of U during instruction selection that starts at Root.
1426bool SelectionDAGISel::IsProfitableToFold(SDValue N, SDNode *U,
1427 SDNode *Root) const {
1428 if (OptLevel == CodeGenOpt::None) return false;
1429 return N.hasOneUse();
1430}
1431
1432/// IsLegalToFold - Returns true if the specific operand node N of
1433/// U can be folded during instruction selection that starts at Root.
1434bool SelectionDAGISel::IsLegalToFold(SDValue N, SDNode *U, SDNode *Root) const {
Anton Korobeynikovc1c6ef82009-05-08 18:51:58 +00001435 if (OptLevel == CodeGenOpt::None) return false;
1436
1437 // If Root use can somehow reach N through a path that that doesn't contain
1438 // U then folding N would create a cycle. e.g. In the following
1439 // diagram, Root can reach N through X. If N is folded into into Root, then
1440 // X is both a predecessor and a successor of U.
1441 //
1442 // [N*] //
1443 // ^ ^ //
1444 // / \ //
1445 // [U*] [X]? //
1446 // ^ ^ //
1447 // \ / //
1448 // \ / //
1449 // [Root*] //
1450 //
1451 // * indicates nodes to be folded together.
1452 //
1453 // If Root produces a flag, then it gets (even more) interesting. Since it
1454 // will be "glued" together with its flag use in the scheduler, we need to
1455 // check if it might reach N.
1456 //
1457 // [N*] //
1458 // ^ ^ //
1459 // / \ //
1460 // [U*] [X]? //
1461 // ^ ^ //
1462 // \ \ //
1463 // \ | //
1464 // [Root*] | //
1465 // ^ | //
1466 // f | //
1467 // | / //
1468 // [Y] / //
1469 // ^ / //
1470 // f / //
1471 // | / //
1472 // [FU] //
1473 //
1474 // If FU (flag use) indirectly reaches N (the load), and Root folds N
1475 // (call it Fold), then X is a predecessor of FU and a successor of
1476 // Fold. But since Fold and FU are flagged together, this will create
1477 // a cycle in the scheduling graph.
1478
Owen Andersone50ed302009-08-10 22:56:29 +00001479 EVT VT = Root->getValueType(Root->getNumValues()-1);
Owen Anderson825b72b2009-08-11 20:47:22 +00001480 while (VT == MVT::Flag) {
Anton Korobeynikovc1c6ef82009-05-08 18:51:58 +00001481 SDNode *FU = findFlagUse(Root);
1482 if (FU == NULL)
1483 break;
1484 Root = FU;
1485 VT = Root->getValueType(Root->getNumValues()-1);
1486 }
1487
Evan Cheng014bf212010-02-15 19:41:07 +00001488 return !isNonImmUse(Root, N.getNode(), U);
Anton Korobeynikovc1c6ef82009-05-08 18:51:58 +00001489}
1490
Dan Gohmaneeb3a002010-01-05 01:24:18 +00001491SDNode *SelectionDAGISel::Select_INLINEASM(SDNode *N) {
1492 std::vector<SDValue> Ops(N->op_begin(), N->op_end());
Dan Gohmane1f188f2009-10-29 22:30:23 +00001493 SelectInlineAsmMemoryOperands(Ops);
1494
1495 std::vector<EVT> VTs;
1496 VTs.push_back(MVT::Other);
1497 VTs.push_back(MVT::Flag);
Dan Gohmaneeb3a002010-01-05 01:24:18 +00001498 SDValue New = CurDAG->getNode(ISD::INLINEASM, N->getDebugLoc(),
Dan Gohmane1f188f2009-10-29 22:30:23 +00001499 VTs, &Ops[0], Ops.size());
1500 return New.getNode();
1501}
1502
Dan Gohmaneeb3a002010-01-05 01:24:18 +00001503SDNode *SelectionDAGISel::Select_UNDEF(SDNode *N) {
Chris Lattner518bb532010-02-09 19:54:29 +00001504 return CurDAG->SelectNodeTo(N, TargetOpcode::IMPLICIT_DEF,N->getValueType(0));
Dan Gohmane1f188f2009-10-29 22:30:23 +00001505}
1506
Dan Gohmaneeb3a002010-01-05 01:24:18 +00001507SDNode *SelectionDAGISel::Select_EH_LABEL(SDNode *N) {
1508 SDValue Chain = N->getOperand(0);
Dan Gohmane1f188f2009-10-29 22:30:23 +00001509 unsigned C = cast<LabelSDNode>(N)->getLabelID();
1510 SDValue Tmp = CurDAG->getTargetConstant(C, MVT::i32);
Chris Lattner518bb532010-02-09 19:54:29 +00001511 return CurDAG->SelectNodeTo(N, TargetOpcode::EH_LABEL,
Dan Gohmane1f188f2009-10-29 22:30:23 +00001512 MVT::Other, Tmp, Chain);
1513}
1514
Chris Lattner2a49d572010-02-28 22:37:22 +00001515/// GetVBR - decode a vbr encoding whose top bit is set.
1516ALWAYS_INLINE static uint64_t
1517GetVBR(uint64_t Val, const unsigned char *MatcherTable, unsigned &Idx) {
1518 assert(Val >= 128 && "Not a VBR");
1519 Val &= 127; // Remove first vbr bit.
1520
1521 unsigned Shift = 7;
1522 uint64_t NextBits;
1523 do {
Chris Lattner14df8dc2010-02-28 22:38:43 +00001524 NextBits = MatcherTable[Idx++];
Chris Lattner2a49d572010-02-28 22:37:22 +00001525 Val |= (NextBits&127) << Shift;
1526 Shift += 7;
1527 } while (NextBits & 128);
1528
1529 return Val;
1530}
1531
Chris Lattner2a49d572010-02-28 22:37:22 +00001532
1533/// UpdateChainsAndFlags - When a match is complete, this method updates uses of
1534/// interior flag and chain results to use the new flag and chain results.
1535static void UpdateChainsAndFlags(SDNode *NodeToMatch, SDValue InputChain,
1536 const SmallVectorImpl<SDNode*> &ChainNodesMatched,
1537 SDValue InputFlag,
1538 const SmallVectorImpl<SDNode*> &FlagResultNodesMatched,
1539 bool isMorphNodeTo, SelectionDAG *CurDAG) {
1540 // Now that all the normal results are replaced, we replace the chain and
1541 // flag results if present.
1542 if (!ChainNodesMatched.empty()) {
1543 assert(InputChain.getNode() != 0 &&
1544 "Matched input chains but didn't produce a chain");
1545 // Loop over all of the nodes we matched that produced a chain result.
1546 // Replace all the chain results with the final chain we ended up with.
1547 for (unsigned i = 0, e = ChainNodesMatched.size(); i != e; ++i) {
1548 SDNode *ChainNode = ChainNodesMatched[i];
1549
1550 // Don't replace the results of the root node if we're doing a
1551 // MorphNodeTo.
1552 if (ChainNode == NodeToMatch && isMorphNodeTo)
1553 continue;
1554
1555 SDValue ChainVal = SDValue(ChainNode, ChainNode->getNumValues()-1);
1556 if (ChainVal.getValueType() == MVT::Flag)
1557 ChainVal = ChainVal.getValue(ChainVal->getNumValues()-2);
1558 assert(ChainVal.getValueType() == MVT::Other && "Not a chain?");
1559 CurDAG->ReplaceAllUsesOfValueWith(ChainVal, InputChain);
1560 }
1561 }
1562
1563 // If the result produces a flag, update any flag results in the matched
1564 // pattern with the flag result.
1565 if (InputFlag.getNode() != 0) {
1566 // Handle any interior nodes explicitly marked.
1567 for (unsigned i = 0, e = FlagResultNodesMatched.size(); i != e; ++i) {
1568 SDNode *FRN = FlagResultNodesMatched[i];
1569 assert(FRN->getValueType(FRN->getNumValues()-1) == MVT::Flag &&
1570 "Doesn't have a flag result");
1571 CurDAG->ReplaceAllUsesOfValueWith(SDValue(FRN, FRN->getNumValues()-1),
1572 InputFlag);
1573 }
1574 }
1575
1576 DEBUG(errs() << "ISEL: Match complete!\n");
1577}
1578
Chris Lattnerc6d7ad32010-03-02 02:22:10 +00001579enum ChainResult {
1580 CR_Simple,
1581 CR_InducesCycle,
1582 CR_LeadsToInteriorNode
1583};
1584
1585/// WalkChainUsers - Walk down the users of the specified chained node that is
1586/// part of the pattern we're matching, looking at all of the users we find.
1587/// This determines whether something is an interior node, whether we have a
1588/// non-pattern node in between two pattern nodes (which prevent folding because
1589/// it would induce a cycle) and whether we have a TokenFactor node sandwiched
1590/// between pattern nodes (in which case the TF becomes part of the pattern).
1591///
1592/// The walk we do here is guaranteed to be small because we quickly get down to
1593/// already selected nodes "below" us.
1594static ChainResult
1595WalkChainUsers(SDNode *ChainedNode,
1596 SmallVectorImpl<SDNode*> &ChainedNodesInPattern,
1597 SmallVectorImpl<SDNode*> &InteriorChainedNodes) {
1598 ChainResult Result = CR_Simple;
1599
1600 for (SDNode::use_iterator UI = ChainedNode->use_begin(),
1601 E = ChainedNode->use_end(); UI != E; ++UI) {
1602 // Make sure the use is of the chain, not some other value we produce.
1603 if (UI.getUse().getValueType() != MVT::Other) continue;
1604
1605 SDNode *User = *UI;
1606
1607 // If we see an already-selected machine node, then we've gone beyond the
1608 // pattern that we're selecting down into the already selected chunk of the
1609 // DAG.
1610 if (User->isMachineOpcode() ||
1611 User->getOpcode() == ISD::CopyToReg ||
1612 User->getOpcode() == ISD::CopyFromReg ||
1613 User->getOpcode() == ISD::INLINEASM ||
1614 User->getOpcode() == ISD::HANDLENODE) // Root of the graph.
1615 continue;
1616
1617 // If we have a TokenFactor, we handle it specially.
1618 if (User->getOpcode() != ISD::TokenFactor) {
1619 // If the node isn't a token factor and isn't part of our pattern, then it
1620 // must be a random chained node in between two nodes we're selecting.
1621 // This happens when we have something like:
1622 // x = load ptr
1623 // call
1624 // y = x+4
1625 // store y -> ptr
1626 // Because we structurally match the load/store as a read/modify/write,
1627 // but the call is chained between them. We cannot fold in this case
1628 // because it would induce a cycle in the graph.
1629 if (!std::count(ChainedNodesInPattern.begin(),
1630 ChainedNodesInPattern.end(), User))
1631 return CR_InducesCycle;
1632
1633 // Otherwise we found a node that is part of our pattern. For example in:
1634 // x = load ptr
1635 // y = x+4
1636 // store y -> ptr
1637 // This would happen when we're scanning down from the load and see the
1638 // store as a user. Record that there is a use of ChainedNode that is
1639 // part of the pattern and keep scanning uses.
1640 Result = CR_LeadsToInteriorNode;
1641 InteriorChainedNodes.push_back(User);
1642 continue;
1643 }
1644
1645 // If we found a TokenFactor, there are two cases to consider: first if the
1646 // TokenFactor is just hanging "below" the pattern we're matching (i.e. no
1647 // uses of the TF are in our pattern) we just want to ignore it. Second,
1648 // the TokenFactor can be sandwiched in between two chained nodes, like so:
1649 // [Load chain]
1650 // ^
1651 // |
1652 // [Load]
1653 // ^ ^
1654 // | \ DAG's like cheese
1655 // / \ do you?
1656 // / |
1657 // [TokenFactor] [Op]
1658 // ^ ^
1659 // | |
1660 // \ /
1661 // \ /
1662 // [Store]
1663 //
1664 // In this case, the TokenFactor becomes part of our match and we rewrite it
1665 // as a new TokenFactor.
1666 //
1667 // To distinguish these two cases, do a recursive walk down the uses.
1668 switch (WalkChainUsers(User, ChainedNodesInPattern, InteriorChainedNodes)) {
1669 case CR_Simple:
1670 // If the uses of the TokenFactor are just already-selected nodes, ignore
1671 // it, it is "below" our pattern.
1672 continue;
1673 case CR_InducesCycle:
1674 // If the uses of the TokenFactor lead to nodes that are not part of our
1675 // pattern that are not selected, folding would turn this into a cycle,
1676 // bail out now.
1677 return CR_InducesCycle;
1678 case CR_LeadsToInteriorNode:
1679 break; // Otherwise, keep processing.
1680 }
1681
1682 // Okay, we know we're in the interesting interior case. The TokenFactor
1683 // is now going to be considered part of the pattern so that we rewrite its
1684 // uses (it may have uses that are not part of the pattern) with the
1685 // ultimate chain result of the generated code. We will also add its chain
1686 // inputs as inputs to the ultimate TokenFactor we create.
1687 Result = CR_LeadsToInteriorNode;
1688 ChainedNodesInPattern.push_back(User);
1689 InteriorChainedNodes.push_back(User);
1690 continue;
1691 }
1692
1693 return Result;
1694}
1695
Chris Lattner6b307922010-03-02 00:00:03 +00001696/// HandleMergeInputChains - This implements the OPC_EmitMergeInputChains
Chris Lattnerc6d7ad32010-03-02 02:22:10 +00001697/// operation for when the pattern matched multiple nodes with chains. The
1698/// input vector contains a list of all of the chained nodes that we match. We
1699/// must determine if this is a valid thing to cover (i.e. matching it won't
1700/// induce cycles in the DAG) and if so, creating a TokenFactor node. that will
1701/// be used as the input node chain for the generated nodes.
Chris Lattner6b307922010-03-02 00:00:03 +00001702static SDValue
Chris Lattnerc6d7ad32010-03-02 02:22:10 +00001703HandleMergeInputChains(SmallVectorImpl<SDNode*> &ChainNodesMatched,
Chris Lattner6b307922010-03-02 00:00:03 +00001704 SelectionDAG *CurDAG) {
1705 assert(ChainNodesMatched.size() > 1 &&
1706 "Should only happen for multi chain node case");
Chris Lattnerc6d7ad32010-03-02 02:22:10 +00001707
1708 // Walk all of the chained nodes we've matched, recursively scanning down the
1709 // users of the chain result. This adds any TokenFactor nodes that are caught
1710 // in between chained nodes to the chained and interior nodes list.
1711 SmallVector<SDNode*, 3> InteriorChainedNodes;
1712 for (unsigned i = 0, e = ChainNodesMatched.size(); i != e; ++i) {
1713 if (WalkChainUsers(ChainNodesMatched[i], ChainNodesMatched,
1714 InteriorChainedNodes) == CR_InducesCycle)
1715 return SDValue(); // Would induce a cycle.
1716 }
Chris Lattner6b307922010-03-02 00:00:03 +00001717
Chris Lattnerc6d7ad32010-03-02 02:22:10 +00001718 // Okay, we have walked all the matched nodes and collected TokenFactor nodes
1719 // that we are interested in. Form our input TokenFactor node.
Chris Lattner6b307922010-03-02 00:00:03 +00001720 SmallVector<SDValue, 3> InputChains;
1721 for (unsigned i = 0, e = ChainNodesMatched.size(); i != e; ++i) {
Chris Lattnerc6d7ad32010-03-02 02:22:10 +00001722 // Add the input chain of this node to the InputChains list (which will be
1723 // the operands of the generated TokenFactor) if it's not an interior node.
1724 SDNode *N = ChainNodesMatched[i];
1725 if (N->getOpcode() != ISD::TokenFactor) {
1726 if (std::count(InteriorChainedNodes.begin(),InteriorChainedNodes.end(),N))
1727 continue;
1728
1729 // Otherwise, add the input chain.
1730 SDValue InChain = ChainNodesMatched[i]->getOperand(0);
1731 assert(InChain.getValueType() == MVT::Other && "Not a chain");
Chris Lattner6b307922010-03-02 00:00:03 +00001732 InputChains.push_back(InChain);
Chris Lattnerc6d7ad32010-03-02 02:22:10 +00001733 continue;
1734 }
1735
1736 // If we have a token factor, we want to add all inputs of the token factor
1737 // that are not part of the pattern we're matching.
1738 for (unsigned op = 0, e = N->getNumOperands(); op != e; ++op) {
1739 if (!std::count(ChainNodesMatched.begin(), ChainNodesMatched.end(),
Chris Lattner6183fbd2010-03-02 02:37:23 +00001740 N->getOperand(op).getNode()))
1741 InputChains.push_back(N->getOperand(op));
Chris Lattnerc6d7ad32010-03-02 02:22:10 +00001742 }
Chris Lattner6b307922010-03-02 00:00:03 +00001743 }
1744
1745 SDValue Res;
1746 if (InputChains.size() == 1)
1747 return InputChains[0];
1748 return CurDAG->getNode(ISD::TokenFactor, ChainNodesMatched[0]->getDebugLoc(),
1749 MVT::Other, &InputChains[0], InputChains.size());
1750}
Chris Lattner2a49d572010-02-28 22:37:22 +00001751
Chris Lattner3ff1e4d2010-03-02 06:55:04 +00001752/// MorphNode - Handle morphing a node in place for the selector.
1753SDNode *SelectionDAGISel::
1754MorphNode(SDNode *Node, unsigned TargetOpc, SDVTList VTList,
1755 const SDValue *Ops, unsigned NumOps, unsigned EmitNodeInfo) {
1756 // It is possible we're using MorphNodeTo to replace a node with no
1757 // normal results with one that has a normal result (or we could be
1758 // adding a chain) and the input could have flags and chains as well.
1759 // In this case we need to shifting the operands down.
1760 // FIXME: This is a horrible hack and broken in obscure cases, no worse
1761 // than the old isel though. We should sink this into MorphNodeTo.
1762 int OldFlagResultNo = -1, OldChainResultNo = -1;
1763
1764 unsigned NTMNumResults = Node->getNumValues();
1765 if (Node->getValueType(NTMNumResults-1) == MVT::Flag) {
1766 OldFlagResultNo = NTMNumResults-1;
1767 if (NTMNumResults != 1 &&
1768 Node->getValueType(NTMNumResults-2) == MVT::Other)
1769 OldChainResultNo = NTMNumResults-2;
1770 } else if (Node->getValueType(NTMNumResults-1) == MVT::Other)
1771 OldChainResultNo = NTMNumResults-1;
1772
Chris Lattner61c97f62010-03-02 07:14:49 +00001773 // Call the underlying SelectionDAG routine to do the transmogrification. Note
1774 // that this deletes operands of the old node that become dead.
Chris Lattner3ff1e4d2010-03-02 06:55:04 +00001775 SDNode *Res = CurDAG->MorphNodeTo(Node, ~TargetOpc, VTList, Ops, NumOps);
1776
1777 // MorphNodeTo can operate in two ways: if an existing node with the
1778 // specified operands exists, it can just return it. Otherwise, it
1779 // updates the node in place to have the requested operands.
1780 if (Res == Node) {
1781 // If we updated the node in place, reset the node ID. To the isel,
1782 // this should be just like a newly allocated machine node.
1783 Res->setNodeId(-1);
1784 }
1785
1786 unsigned ResNumResults = Res->getNumValues();
1787 // Move the flag if needed.
1788 if ((EmitNodeInfo & OPFL_FlagOutput) && OldFlagResultNo != -1 &&
1789 (unsigned)OldFlagResultNo != ResNumResults-1)
1790 CurDAG->ReplaceAllUsesOfValueWith(SDValue(Node, OldFlagResultNo),
1791 SDValue(Res, ResNumResults-1));
1792
1793 if ((EmitNodeInfo & OPFL_FlagOutput) != 0)
1794 --ResNumResults;
1795
1796 // Move the chain reference if needed.
1797 if ((EmitNodeInfo & OPFL_Chain) && OldChainResultNo != -1 &&
1798 (unsigned)OldChainResultNo != ResNumResults-1)
1799 CurDAG->ReplaceAllUsesOfValueWith(SDValue(Node, OldChainResultNo),
1800 SDValue(Res, ResNumResults-1));
1801
1802 // Otherwise, no replacement happened because the node already exists. Replace
1803 // Uses of the old node with the new one.
1804 if (Res != Node)
1805 CurDAG->ReplaceAllUsesWith(Node, Res);
1806
1807 return Res;
1808}
1809
1810
Chris Lattner2a49d572010-02-28 22:37:22 +00001811struct MatchScope {
1812 /// FailIndex - If this match fails, this is the index to continue with.
1813 unsigned FailIndex;
1814
1815 /// NodeStack - The node stack when the scope was formed.
1816 SmallVector<SDValue, 4> NodeStack;
1817
1818 /// NumRecordedNodes - The number of recorded nodes when the scope was formed.
1819 unsigned NumRecordedNodes;
1820
1821 /// NumMatchedMemRefs - The number of matched memref entries.
1822 unsigned NumMatchedMemRefs;
1823
1824 /// InputChain/InputFlag - The current chain/flag
1825 SDValue InputChain, InputFlag;
1826
1827 /// HasChainNodesMatched - True if the ChainNodesMatched list is non-empty.
1828 bool HasChainNodesMatched, HasFlagResultNodesMatched;
1829};
1830
1831SDNode *SelectionDAGISel::
1832SelectCodeCommon(SDNode *NodeToMatch, const unsigned char *MatcherTable,
1833 unsigned TableSize) {
1834 // FIXME: Should these even be selected? Handle these cases in the caller?
1835 switch (NodeToMatch->getOpcode()) {
1836 default:
1837 break;
1838 case ISD::EntryToken: // These nodes remain the same.
1839 case ISD::BasicBlock:
1840 case ISD::Register:
1841 case ISD::HANDLENODE:
1842 case ISD::TargetConstant:
1843 case ISD::TargetConstantFP:
1844 case ISD::TargetConstantPool:
1845 case ISD::TargetFrameIndex:
1846 case ISD::TargetExternalSymbol:
1847 case ISD::TargetBlockAddress:
1848 case ISD::TargetJumpTable:
1849 case ISD::TargetGlobalTLSAddress:
1850 case ISD::TargetGlobalAddress:
1851 case ISD::TokenFactor:
1852 case ISD::CopyFromReg:
1853 case ISD::CopyToReg:
1854 return 0;
1855 case ISD::AssertSext:
1856 case ISD::AssertZext:
1857 CurDAG->ReplaceAllUsesOfValueWith(SDValue(NodeToMatch, 0),
1858 NodeToMatch->getOperand(0));
1859 return 0;
1860 case ISD::INLINEASM: return Select_INLINEASM(NodeToMatch);
1861 case ISD::EH_LABEL: return Select_EH_LABEL(NodeToMatch);
1862 case ISD::UNDEF: return Select_UNDEF(NodeToMatch);
1863 }
1864
1865 assert(!NodeToMatch->isMachineOpcode() && "Node already selected!");
1866
1867 // Set up the node stack with NodeToMatch as the only node on the stack.
1868 SmallVector<SDValue, 8> NodeStack;
1869 SDValue N = SDValue(NodeToMatch, 0);
1870 NodeStack.push_back(N);
1871
1872 // MatchScopes - Scopes used when matching, if a match failure happens, this
1873 // indicates where to continue checking.
1874 SmallVector<MatchScope, 8> MatchScopes;
1875
1876 // RecordedNodes - This is the set of nodes that have been recorded by the
1877 // state machine.
1878 SmallVector<SDValue, 8> RecordedNodes;
1879
1880 // MatchedMemRefs - This is the set of MemRef's we've seen in the input
1881 // pattern.
1882 SmallVector<MachineMemOperand*, 2> MatchedMemRefs;
1883
1884 // These are the current input chain and flag for use when generating nodes.
1885 // Various Emit operations change these. For example, emitting a copytoreg
1886 // uses and updates these.
1887 SDValue InputChain, InputFlag;
1888
1889 // ChainNodesMatched - If a pattern matches nodes that have input/output
1890 // chains, the OPC_EmitMergeInputChains operation is emitted which indicates
1891 // which ones they are. The result is captured into this list so that we can
1892 // update the chain results when the pattern is complete.
1893 SmallVector<SDNode*, 3> ChainNodesMatched;
1894 SmallVector<SDNode*, 3> FlagResultNodesMatched;
1895
1896 DEBUG(errs() << "ISEL: Starting pattern match on root node: ";
1897 NodeToMatch->dump(CurDAG);
1898 errs() << '\n');
1899
Chris Lattner7390eeb2010-03-01 18:47:11 +00001900 // Determine where to start the interpreter. Normally we start at opcode #0,
1901 // but if the state machine starts with an OPC_SwitchOpcode, then we
1902 // accelerate the first lookup (which is guaranteed to be hot) with the
1903 // OpcodeOffset table.
Chris Lattner2a49d572010-02-28 22:37:22 +00001904 unsigned MatcherIndex = 0;
Chris Lattner7390eeb2010-03-01 18:47:11 +00001905
1906 if (!OpcodeOffset.empty()) {
1907 // Already computed the OpcodeOffset table, just index into it.
1908 if (N.getOpcode() < OpcodeOffset.size())
1909 MatcherIndex = OpcodeOffset[N.getOpcode()];
1910 DEBUG(errs() << " Initial Opcode index to " << MatcherIndex << "\n");
1911
1912 } else if (MatcherTable[0] == OPC_SwitchOpcode) {
1913 // Otherwise, the table isn't computed, but the state machine does start
1914 // with an OPC_SwitchOpcode instruction. Populate the table now, since this
1915 // is the first time we're selecting an instruction.
1916 unsigned Idx = 1;
1917 while (1) {
1918 // Get the size of this case.
1919 unsigned CaseSize = MatcherTable[Idx++];
1920 if (CaseSize & 128)
1921 CaseSize = GetVBR(CaseSize, MatcherTable, Idx);
1922 if (CaseSize == 0) break;
1923
1924 // Get the opcode, add the index to the table.
1925 unsigned Opc = MatcherTable[Idx++];
1926 if (Opc >= OpcodeOffset.size())
1927 OpcodeOffset.resize((Opc+1)*2);
1928 OpcodeOffset[Opc] = Idx;
1929 Idx += CaseSize;
1930 }
1931
1932 // Okay, do the lookup for the first opcode.
1933 if (N.getOpcode() < OpcodeOffset.size())
1934 MatcherIndex = OpcodeOffset[N.getOpcode()];
1935 }
1936
Chris Lattner2a49d572010-02-28 22:37:22 +00001937 while (1) {
1938 assert(MatcherIndex < TableSize && "Invalid index");
1939 BuiltinOpcodes Opcode = (BuiltinOpcodes)MatcherTable[MatcherIndex++];
1940 switch (Opcode) {
1941 case OPC_Scope: {
1942 unsigned NumToSkip = MatcherTable[MatcherIndex++];
1943 if (NumToSkip & 128)
1944 NumToSkip = GetVBR(NumToSkip, MatcherTable, MatcherIndex);
1945 assert(NumToSkip != 0 &&
1946 "First entry of OPC_Scope shouldn't be 0, scope has no children?");
1947
1948 // Push a MatchScope which indicates where to go if the first child fails
1949 // to match.
1950 MatchScope NewEntry;
1951 NewEntry.FailIndex = MatcherIndex+NumToSkip;
1952 NewEntry.NodeStack.append(NodeStack.begin(), NodeStack.end());
1953 NewEntry.NumRecordedNodes = RecordedNodes.size();
1954 NewEntry.NumMatchedMemRefs = MatchedMemRefs.size();
1955 NewEntry.InputChain = InputChain;
1956 NewEntry.InputFlag = InputFlag;
1957 NewEntry.HasChainNodesMatched = !ChainNodesMatched.empty();
1958 NewEntry.HasFlagResultNodesMatched = !FlagResultNodesMatched.empty();
1959 MatchScopes.push_back(NewEntry);
1960 continue;
1961 }
1962 case OPC_RecordNode:
1963 // Remember this node, it may end up being an operand in the pattern.
1964 RecordedNodes.push_back(N);
1965 continue;
1966
1967 case OPC_RecordChild0: case OPC_RecordChild1:
1968 case OPC_RecordChild2: case OPC_RecordChild3:
1969 case OPC_RecordChild4: case OPC_RecordChild5:
1970 case OPC_RecordChild6: case OPC_RecordChild7: {
1971 unsigned ChildNo = Opcode-OPC_RecordChild0;
1972 if (ChildNo >= N.getNumOperands())
1973 break; // Match fails if out of range child #.
1974
1975 RecordedNodes.push_back(N->getOperand(ChildNo));
1976 continue;
1977 }
1978 case OPC_RecordMemRef:
1979 MatchedMemRefs.push_back(cast<MemSDNode>(N)->getMemOperand());
1980 continue;
1981
1982 case OPC_CaptureFlagInput:
1983 // If the current node has an input flag, capture it in InputFlag.
1984 if (N->getNumOperands() != 0 &&
1985 N->getOperand(N->getNumOperands()-1).getValueType() == MVT::Flag)
1986 InputFlag = N->getOperand(N->getNumOperands()-1);
1987 continue;
1988
1989 case OPC_MoveChild: {
1990 unsigned ChildNo = MatcherTable[MatcherIndex++];
1991 if (ChildNo >= N.getNumOperands())
1992 break; // Match fails if out of range child #.
1993 N = N.getOperand(ChildNo);
1994 NodeStack.push_back(N);
1995 continue;
1996 }
1997
1998 case OPC_MoveParent:
1999 // Pop the current node off the NodeStack.
2000 NodeStack.pop_back();
2001 assert(!NodeStack.empty() && "Node stack imbalance!");
2002 N = NodeStack.back();
2003 continue;
2004
2005 case OPC_CheckSame: {
2006 // Accept if it is exactly the same as a previously recorded node.
2007 unsigned RecNo = MatcherTable[MatcherIndex++];
2008 assert(RecNo < RecordedNodes.size() && "Invalid CheckSame");
2009 if (N != RecordedNodes[RecNo]) break;
2010 continue;
2011 }
2012 case OPC_CheckPatternPredicate:
2013 if (!CheckPatternPredicate(MatcherTable[MatcherIndex++])) break;
2014 continue;
2015 case OPC_CheckPredicate:
2016 if (!CheckNodePredicate(N.getNode(), MatcherTable[MatcherIndex++])) break;
2017 continue;
2018 case OPC_CheckComplexPat:
2019 if (!CheckComplexPattern(NodeToMatch, N,
2020 MatcherTable[MatcherIndex++], RecordedNodes))
2021 break;
2022 continue;
2023 case OPC_CheckOpcode:
2024 if (N->getOpcode() != MatcherTable[MatcherIndex++]) break;
2025 continue;
2026
Chris Lattnereb669212010-03-01 06:59:22 +00002027 case OPC_SwitchOpcode: {
2028 unsigned CurNodeOpcode = N.getOpcode();
2029
Chris Lattner7d892d62010-03-01 07:43:08 +00002030 unsigned SwitchStart = MatcherIndex-1; (void)SwitchStart;
Chris Lattnereb669212010-03-01 06:59:22 +00002031
2032 unsigned CaseSize;
2033 while (1) {
2034 // Get the size of this case.
2035 CaseSize = MatcherTable[MatcherIndex++];
2036 if (CaseSize & 128)
2037 CaseSize = GetVBR(CaseSize, MatcherTable, MatcherIndex);
2038 if (CaseSize == 0) break;
2039
2040 // If the opcode matches, then we will execute this case.
2041 if (CurNodeOpcode == MatcherTable[MatcherIndex++])
2042 break;
2043
2044 // Otherwise, skip over this case.
2045 MatcherIndex += CaseSize;
2046 }
2047
2048 // If we failed to match, bail out.
2049 if (CaseSize == 0) break;
2050
2051 // Otherwise, execute the case we found.
2052 DEBUG(errs() << " OpcodeSwitch from " << SwitchStart
2053 << " to " << MatcherIndex << "\n");
2054 continue;
2055 }
2056
Chris Lattner2a49d572010-02-28 22:37:22 +00002057 case OPC_CheckType: {
2058 MVT::SimpleValueType VT =
2059 (MVT::SimpleValueType)MatcherTable[MatcherIndex++];
2060 if (N.getValueType() != VT) {
2061 // Handle the case when VT is iPTR.
2062 if (VT != MVT::iPTR || N.getValueType() != TLI.getPointerTy())
2063 break;
2064 }
2065 continue;
2066 }
2067 case OPC_CheckChild0Type: case OPC_CheckChild1Type:
2068 case OPC_CheckChild2Type: case OPC_CheckChild3Type:
2069 case OPC_CheckChild4Type: case OPC_CheckChild5Type:
2070 case OPC_CheckChild6Type: case OPC_CheckChild7Type: {
2071 unsigned ChildNo = Opcode-OPC_CheckChild0Type;
2072 if (ChildNo >= N.getNumOperands())
2073 break; // Match fails if out of range child #.
2074
2075 MVT::SimpleValueType VT =
2076 (MVT::SimpleValueType)MatcherTable[MatcherIndex++];
2077 EVT ChildVT = N.getOperand(ChildNo).getValueType();
2078 if (ChildVT != VT) {
2079 // Handle the case when VT is iPTR.
2080 if (VT != MVT::iPTR || ChildVT != TLI.getPointerTy())
2081 break;
2082 }
2083 continue;
2084 }
2085 case OPC_CheckCondCode:
2086 if (cast<CondCodeSDNode>(N)->get() !=
2087 (ISD::CondCode)MatcherTable[MatcherIndex++]) break;
2088 continue;
2089 case OPC_CheckValueType: {
2090 MVT::SimpleValueType VT =
2091 (MVT::SimpleValueType)MatcherTable[MatcherIndex++];
2092 if (cast<VTSDNode>(N)->getVT() != VT) {
2093 // Handle the case when VT is iPTR.
2094 if (VT != MVT::iPTR || cast<VTSDNode>(N)->getVT() != TLI.getPointerTy())
2095 break;
2096 }
2097 continue;
2098 }
2099 case OPC_CheckInteger: {
2100 int64_t Val = MatcherTable[MatcherIndex++];
2101 if (Val & 128)
2102 Val = GetVBR(Val, MatcherTable, MatcherIndex);
2103
2104 ConstantSDNode *C = dyn_cast<ConstantSDNode>(N);
2105 if (C == 0 || C->getSExtValue() != Val)
2106 break;
2107 continue;
2108 }
2109 case OPC_CheckAndImm: {
2110 int64_t Val = MatcherTable[MatcherIndex++];
2111 if (Val & 128)
2112 Val = GetVBR(Val, MatcherTable, MatcherIndex);
2113
2114 if (N->getOpcode() != ISD::AND) break;
2115 ConstantSDNode *C = dyn_cast<ConstantSDNode>(N->getOperand(1));
2116 if (C == 0 || !CheckAndMask(N.getOperand(0), C, Val))
2117 break;
2118 continue;
2119 }
2120 case OPC_CheckOrImm: {
2121 int64_t Val = MatcherTable[MatcherIndex++];
2122 if (Val & 128)
2123 Val = GetVBR(Val, MatcherTable, MatcherIndex);
2124
2125 if (N->getOpcode() != ISD::OR) break;
2126
2127 ConstantSDNode *C = dyn_cast<ConstantSDNode>(N->getOperand(1));
2128 if (C == 0 || !CheckOrMask(N.getOperand(0), C, Val))
2129 break;
2130 continue;
2131 }
2132
2133 case OPC_CheckFoldableChainNode: {
2134 assert(NodeStack.size() != 1 && "No parent node");
2135 // Verify that all intermediate nodes between the root and this one have
2136 // a single use.
2137 bool HasMultipleUses = false;
2138 for (unsigned i = 1, e = NodeStack.size()-1; i != e; ++i)
2139 if (!NodeStack[i].hasOneUse()) {
2140 HasMultipleUses = true;
2141 break;
2142 }
2143 if (HasMultipleUses) break;
2144
2145 // Check to see that the target thinks this is profitable to fold and that
2146 // we can fold it without inducing cycles in the graph.
2147 if (!IsProfitableToFold(N, NodeStack[NodeStack.size()-2].getNode(),
2148 NodeToMatch) ||
2149 !IsLegalToFold(N, NodeStack[NodeStack.size()-2].getNode(),
2150 NodeToMatch))
2151 break;
2152
2153 continue;
2154 }
Chris Lattner2a49d572010-02-28 22:37:22 +00002155 case OPC_EmitInteger: {
2156 MVT::SimpleValueType VT =
2157 (MVT::SimpleValueType)MatcherTable[MatcherIndex++];
2158 int64_t Val = MatcherTable[MatcherIndex++];
2159 if (Val & 128)
2160 Val = GetVBR(Val, MatcherTable, MatcherIndex);
2161 RecordedNodes.push_back(CurDAG->getTargetConstant(Val, VT));
2162 continue;
2163 }
2164 case OPC_EmitRegister: {
2165 MVT::SimpleValueType VT =
2166 (MVT::SimpleValueType)MatcherTable[MatcherIndex++];
2167 unsigned RegNo = MatcherTable[MatcherIndex++];
2168 RecordedNodes.push_back(CurDAG->getRegister(RegNo, VT));
2169 continue;
2170 }
2171
2172 case OPC_EmitConvertToTarget: {
2173 // Convert from IMM/FPIMM to target version.
2174 unsigned RecNo = MatcherTable[MatcherIndex++];
2175 assert(RecNo < RecordedNodes.size() && "Invalid CheckSame");
2176 SDValue Imm = RecordedNodes[RecNo];
2177
2178 if (Imm->getOpcode() == ISD::Constant) {
2179 int64_t Val = cast<ConstantSDNode>(Imm)->getZExtValue();
2180 Imm = CurDAG->getTargetConstant(Val, Imm.getValueType());
2181 } else if (Imm->getOpcode() == ISD::ConstantFP) {
2182 const ConstantFP *Val=cast<ConstantFPSDNode>(Imm)->getConstantFPValue();
2183 Imm = CurDAG->getTargetConstantFP(*Val, Imm.getValueType());
2184 }
2185
2186 RecordedNodes.push_back(Imm);
2187 continue;
2188 }
2189
2190 case OPC_EmitMergeInputChains: {
2191 assert(InputChain.getNode() == 0 &&
2192 "EmitMergeInputChains should be the first chain producing node");
2193 // This node gets a list of nodes we matched in the input that have
2194 // chains. We want to token factor all of the input chains to these nodes
2195 // together. However, if any of the input chains is actually one of the
2196 // nodes matched in this pattern, then we have an intra-match reference.
2197 // Ignore these because the newly token factored chain should not refer to
2198 // the old nodes.
2199 unsigned NumChains = MatcherTable[MatcherIndex++];
2200 assert(NumChains != 0 && "Can't TF zero chains");
2201
2202 assert(ChainNodesMatched.empty() &&
2203 "Should only have one EmitMergeInputChains per match");
2204
2205 // Handle the first chain.
2206 unsigned RecNo = MatcherTable[MatcherIndex++];
2207 assert(RecNo < RecordedNodes.size() && "Invalid CheckSame");
2208 ChainNodesMatched.push_back(RecordedNodes[RecNo].getNode());
2209
2210 // If the chained node is not the root, we can't fold it if it has
2211 // multiple uses.
2212 // FIXME: What if other value results of the node have uses not matched by
2213 // this pattern?
2214 if (ChainNodesMatched.back() != NodeToMatch &&
2215 !RecordedNodes[RecNo].hasOneUse()) {
2216 ChainNodesMatched.clear();
2217 break;
2218 }
2219
2220 // The common case here is that we have exactly one chain, which is really
2221 // cheap to handle, just do it.
2222 if (NumChains == 1) {
2223 InputChain = RecordedNodes[RecNo].getOperand(0);
2224 assert(InputChain.getValueType() == MVT::Other && "Not a chain");
2225 continue;
2226 }
2227
2228 // Read all of the chained nodes.
2229 for (unsigned i = 1; i != NumChains; ++i) {
2230 RecNo = MatcherTable[MatcherIndex++];
2231 assert(RecNo < RecordedNodes.size() && "Invalid CheckSame");
2232 ChainNodesMatched.push_back(RecordedNodes[RecNo].getNode());
2233
2234 // FIXME: What if other value results of the node have uses not matched
2235 // by this pattern?
2236 if (ChainNodesMatched.back() != NodeToMatch &&
2237 !RecordedNodes[RecNo].hasOneUse()) {
2238 ChainNodesMatched.clear();
2239 break;
2240 }
2241 }
Chris Lattner6b307922010-03-02 00:00:03 +00002242
2243 // If the inner loop broke out, the match fails.
2244 if (ChainNodesMatched.empty())
2245 break;
Chris Lattner2a49d572010-02-28 22:37:22 +00002246
Chris Lattner6b307922010-03-02 00:00:03 +00002247 // Merge the input chains if they are not intra-pattern references.
2248 InputChain = HandleMergeInputChains(ChainNodesMatched, CurDAG);
2249
2250 if (InputChain.getNode() == 0)
2251 break; // Failed to merge.
Chris Lattner2a49d572010-02-28 22:37:22 +00002252
Chris Lattner2a49d572010-02-28 22:37:22 +00002253 continue;
2254 }
2255
2256 case OPC_EmitCopyToReg: {
2257 unsigned RecNo = MatcherTable[MatcherIndex++];
2258 assert(RecNo < RecordedNodes.size() && "Invalid CheckSame");
2259 unsigned DestPhysReg = MatcherTable[MatcherIndex++];
2260
2261 if (InputChain.getNode() == 0)
2262 InputChain = CurDAG->getEntryNode();
2263
2264 InputChain = CurDAG->getCopyToReg(InputChain, NodeToMatch->getDebugLoc(),
2265 DestPhysReg, RecordedNodes[RecNo],
2266 InputFlag);
2267
2268 InputFlag = InputChain.getValue(1);
2269 continue;
2270 }
2271
2272 case OPC_EmitNodeXForm: {
2273 unsigned XFormNo = MatcherTable[MatcherIndex++];
2274 unsigned RecNo = MatcherTable[MatcherIndex++];
2275 assert(RecNo < RecordedNodes.size() && "Invalid CheckSame");
2276 RecordedNodes.push_back(RunSDNodeXForm(RecordedNodes[RecNo], XFormNo));
2277 continue;
2278 }
2279
2280 case OPC_EmitNode:
2281 case OPC_MorphNodeTo: {
Chris Lattner14df8dc2010-02-28 22:38:43 +00002282 uint16_t TargetOpc = MatcherTable[MatcherIndex++];
2283 TargetOpc |= (unsigned short)MatcherTable[MatcherIndex++] << 8;
Chris Lattner2a49d572010-02-28 22:37:22 +00002284 unsigned EmitNodeInfo = MatcherTable[MatcherIndex++];
2285 // Get the result VT list.
2286 unsigned NumVTs = MatcherTable[MatcherIndex++];
2287 SmallVector<EVT, 4> VTs;
2288 for (unsigned i = 0; i != NumVTs; ++i) {
2289 MVT::SimpleValueType VT =
2290 (MVT::SimpleValueType)MatcherTable[MatcherIndex++];
2291 if (VT == MVT::iPTR) VT = TLI.getPointerTy().SimpleTy;
2292 VTs.push_back(VT);
2293 }
2294
2295 if (EmitNodeInfo & OPFL_Chain)
2296 VTs.push_back(MVT::Other);
2297 if (EmitNodeInfo & OPFL_FlagOutput)
2298 VTs.push_back(MVT::Flag);
2299
Chris Lattner7d892d62010-03-01 07:43:08 +00002300 // This is hot code, so optimize the two most common cases of 1 and 2
2301 // results.
2302 SDVTList VTList;
2303 if (VTs.size() == 1)
2304 VTList = CurDAG->getVTList(VTs[0]);
2305 else if (VTs.size() == 2)
2306 VTList = CurDAG->getVTList(VTs[0], VTs[1]);
2307 else
2308 VTList = CurDAG->getVTList(VTs.data(), VTs.size());
Chris Lattner2a49d572010-02-28 22:37:22 +00002309
2310 // Get the operand list.
2311 unsigned NumOps = MatcherTable[MatcherIndex++];
2312 SmallVector<SDValue, 8> Ops;
2313 for (unsigned i = 0; i != NumOps; ++i) {
2314 unsigned RecNo = MatcherTable[MatcherIndex++];
2315 if (RecNo & 128)
2316 RecNo = GetVBR(RecNo, MatcherTable, MatcherIndex);
2317
2318 assert(RecNo < RecordedNodes.size() && "Invalid EmitNode");
2319 Ops.push_back(RecordedNodes[RecNo]);
2320 }
2321
2322 // If there are variadic operands to add, handle them now.
2323 if (EmitNodeInfo & OPFL_VariadicInfo) {
2324 // Determine the start index to copy from.
2325 unsigned FirstOpToCopy = getNumFixedFromVariadicInfo(EmitNodeInfo);
2326 FirstOpToCopy += (EmitNodeInfo & OPFL_Chain) ? 1 : 0;
2327 assert(NodeToMatch->getNumOperands() >= FirstOpToCopy &&
2328 "Invalid variadic node");
2329 // Copy all of the variadic operands, not including a potential flag
2330 // input.
2331 for (unsigned i = FirstOpToCopy, e = NodeToMatch->getNumOperands();
2332 i != e; ++i) {
2333 SDValue V = NodeToMatch->getOperand(i);
2334 if (V.getValueType() == MVT::Flag) break;
2335 Ops.push_back(V);
2336 }
2337 }
2338
2339 // If this has chain/flag inputs, add them.
2340 if (EmitNodeInfo & OPFL_Chain)
2341 Ops.push_back(InputChain);
2342 if ((EmitNodeInfo & OPFL_FlagInput) && InputFlag.getNode() != 0)
2343 Ops.push_back(InputFlag);
2344
2345 // Create the node.
2346 SDNode *Res = 0;
2347 if (Opcode != OPC_MorphNodeTo) {
2348 // If this is a normal EmitNode command, just create the new node and
2349 // add the results to the RecordedNodes list.
2350 Res = CurDAG->getMachineNode(TargetOpc, NodeToMatch->getDebugLoc(),
2351 VTList, Ops.data(), Ops.size());
2352
2353 // Add all the non-flag/non-chain results to the RecordedNodes list.
2354 for (unsigned i = 0, e = VTs.size(); i != e; ++i) {
2355 if (VTs[i] == MVT::Other || VTs[i] == MVT::Flag) break;
2356 RecordedNodes.push_back(SDValue(Res, i));
2357 }
2358
2359 } else {
Chris Lattner3ff1e4d2010-03-02 06:55:04 +00002360 Res = MorphNode(NodeToMatch, TargetOpc, VTList, Ops.data(), Ops.size(),
2361 EmitNodeInfo);
Chris Lattner2a49d572010-02-28 22:37:22 +00002362 }
2363
2364 // If the node had chain/flag results, update our notion of the current
2365 // chain and flag.
2366 if (VTs.back() == MVT::Flag) {
2367 InputFlag = SDValue(Res, VTs.size()-1);
2368 if (EmitNodeInfo & OPFL_Chain)
2369 InputChain = SDValue(Res, VTs.size()-2);
2370 } else if (EmitNodeInfo & OPFL_Chain)
2371 InputChain = SDValue(Res, VTs.size()-1);
2372
2373 // If the OPFL_MemRefs flag is set on this node, slap all of the
2374 // accumulated memrefs onto it.
2375 //
2376 // FIXME: This is vastly incorrect for patterns with multiple outputs
2377 // instructions that access memory and for ComplexPatterns that match
2378 // loads.
2379 if (EmitNodeInfo & OPFL_MemRefs) {
2380 MachineSDNode::mmo_iterator MemRefs =
2381 MF->allocateMemRefsArray(MatchedMemRefs.size());
2382 std::copy(MatchedMemRefs.begin(), MatchedMemRefs.end(), MemRefs);
2383 cast<MachineSDNode>(Res)
2384 ->setMemRefs(MemRefs, MemRefs + MatchedMemRefs.size());
2385 }
2386
2387 DEBUG(errs() << " "
2388 << (Opcode == OPC_MorphNodeTo ? "Morphed" : "Created")
2389 << " node: "; Res->dump(CurDAG); errs() << "\n");
2390
2391 // If this was a MorphNodeTo then we're completely done!
2392 if (Opcode == OPC_MorphNodeTo) {
2393 // Update chain and flag uses.
2394 UpdateChainsAndFlags(NodeToMatch, InputChain, ChainNodesMatched,
2395 InputFlag, FlagResultNodesMatched, true, CurDAG);
2396 return 0;
2397 }
2398
2399 continue;
2400 }
2401
2402 case OPC_MarkFlagResults: {
2403 unsigned NumNodes = MatcherTable[MatcherIndex++];
2404
2405 // Read and remember all the flag-result nodes.
2406 for (unsigned i = 0; i != NumNodes; ++i) {
2407 unsigned RecNo = MatcherTable[MatcherIndex++];
2408 if (RecNo & 128)
2409 RecNo = GetVBR(RecNo, MatcherTable, MatcherIndex);
2410
2411 assert(RecNo < RecordedNodes.size() && "Invalid CheckSame");
2412 FlagResultNodesMatched.push_back(RecordedNodes[RecNo].getNode());
2413 }
2414 continue;
2415 }
2416
2417 case OPC_CompleteMatch: {
2418 // The match has been completed, and any new nodes (if any) have been
2419 // created. Patch up references to the matched dag to use the newly
2420 // created nodes.
2421 unsigned NumResults = MatcherTable[MatcherIndex++];
2422
2423 for (unsigned i = 0; i != NumResults; ++i) {
2424 unsigned ResSlot = MatcherTable[MatcherIndex++];
2425 if (ResSlot & 128)
2426 ResSlot = GetVBR(ResSlot, MatcherTable, MatcherIndex);
2427
2428 assert(ResSlot < RecordedNodes.size() && "Invalid CheckSame");
2429 SDValue Res = RecordedNodes[ResSlot];
2430
2431 // FIXME2: Eliminate this horrible hack by fixing the 'Gen' program
2432 // after (parallel) on input patterns are removed. This would also
2433 // allow us to stop encoding #results in OPC_CompleteMatch's table
2434 // entry.
2435 if (NodeToMatch->getNumValues() <= i ||
2436 NodeToMatch->getValueType(i) == MVT::Other ||
2437 NodeToMatch->getValueType(i) == MVT::Flag)
2438 break;
2439 assert((NodeToMatch->getValueType(i) == Res.getValueType() ||
2440 NodeToMatch->getValueType(i) == MVT::iPTR ||
2441 Res.getValueType() == MVT::iPTR ||
2442 NodeToMatch->getValueType(i).getSizeInBits() ==
2443 Res.getValueType().getSizeInBits()) &&
2444 "invalid replacement");
2445 CurDAG->ReplaceAllUsesOfValueWith(SDValue(NodeToMatch, i), Res);
2446 }
2447
2448 // If the root node defines a flag, add it to the flag nodes to update
2449 // list.
2450 if (NodeToMatch->getValueType(NodeToMatch->getNumValues()-1) == MVT::Flag)
2451 FlagResultNodesMatched.push_back(NodeToMatch);
2452
2453 // Update chain and flag uses.
2454 UpdateChainsAndFlags(NodeToMatch, InputChain, ChainNodesMatched,
2455 InputFlag, FlagResultNodesMatched, false, CurDAG);
2456
2457 assert(NodeToMatch->use_empty() &&
2458 "Didn't replace all uses of the node?");
2459
2460 // FIXME: We just return here, which interacts correctly with SelectRoot
2461 // above. We should fix this to not return an SDNode* anymore.
2462 return 0;
2463 }
2464 }
2465
2466 // If the code reached this point, then the match failed. See if there is
2467 // another child to try in the current 'Scope', otherwise pop it until we
2468 // find a case to check.
2469 while (1) {
2470 if (MatchScopes.empty()) {
2471 CannotYetSelect(NodeToMatch);
2472 return 0;
2473 }
2474
2475 // Restore the interpreter state back to the point where the scope was
2476 // formed.
2477 MatchScope &LastScope = MatchScopes.back();
2478 RecordedNodes.resize(LastScope.NumRecordedNodes);
2479 NodeStack.clear();
2480 NodeStack.append(LastScope.NodeStack.begin(), LastScope.NodeStack.end());
2481 N = NodeStack.back();
2482
2483 DEBUG(errs() << " Match failed at index " << MatcherIndex
2484 << " continuing at " << LastScope.FailIndex << "\n");
2485
2486 if (LastScope.NumMatchedMemRefs != MatchedMemRefs.size())
2487 MatchedMemRefs.resize(LastScope.NumMatchedMemRefs);
2488 MatcherIndex = LastScope.FailIndex;
2489
2490 InputChain = LastScope.InputChain;
2491 InputFlag = LastScope.InputFlag;
2492 if (!LastScope.HasChainNodesMatched)
2493 ChainNodesMatched.clear();
2494 if (!LastScope.HasFlagResultNodesMatched)
2495 FlagResultNodesMatched.clear();
2496
2497 // Check to see what the offset is at the new MatcherIndex. If it is zero
2498 // we have reached the end of this scope, otherwise we have another child
2499 // in the current scope to try.
2500 unsigned NumToSkip = MatcherTable[MatcherIndex++];
2501 if (NumToSkip & 128)
2502 NumToSkip = GetVBR(NumToSkip, MatcherTable, MatcherIndex);
2503
2504 // If we have another child in this scope to match, update FailIndex and
2505 // try it.
2506 if (NumToSkip != 0) {
2507 LastScope.FailIndex = MatcherIndex+NumToSkip;
2508 break;
2509 }
2510
2511 // End of this scope, pop it and try the next child in the containing
2512 // scope.
2513 MatchScopes.pop_back();
2514 }
2515 }
2516}
2517
2518
2519
Dan Gohmaneeb3a002010-01-05 01:24:18 +00002520void SelectionDAGISel::CannotYetSelect(SDNode *N) {
Chris Lattner409ac582010-02-17 06:28:22 +00002521 if (N->getOpcode() == ISD::INTRINSIC_W_CHAIN ||
2522 N->getOpcode() == ISD::INTRINSIC_WO_CHAIN ||
2523 N->getOpcode() == ISD::INTRINSIC_VOID)
2524 return CannotYetSelectIntrinsic(N);
2525
Dan Gohmane1f188f2009-10-29 22:30:23 +00002526 std::string msg;
2527 raw_string_ostream Msg(msg);
2528 Msg << "Cannot yet select: ";
David Greenece6715f2010-01-19 20:37:34 +00002529 N->printrFull(Msg, CurDAG);
Dan Gohmane1f188f2009-10-29 22:30:23 +00002530 llvm_report_error(Msg.str());
2531}
2532
Dan Gohmaneeb3a002010-01-05 01:24:18 +00002533void SelectionDAGISel::CannotYetSelectIntrinsic(SDNode *N) {
David Greene1a053232010-01-05 01:26:11 +00002534 dbgs() << "Cannot yet select: ";
Dan Gohmane1f188f2009-10-29 22:30:23 +00002535 unsigned iid =
Jim Grosbachf4549b02010-01-15 00:36:15 +00002536 cast<ConstantSDNode>(N->getOperand(N->getOperand(0).getValueType() ==
2537 MVT::Other))->getZExtValue();
Dan Gohmane1f188f2009-10-29 22:30:23 +00002538 if (iid < Intrinsic::num_intrinsics)
Jim Grosbachf4549b02010-01-15 00:36:15 +00002539 llvm_report_error("Cannot yet select: intrinsic %" +
2540 Intrinsic::getName((Intrinsic::ID)iid));
Dan Gohmane1f188f2009-10-29 22:30:23 +00002541 else if (const TargetIntrinsicInfo *tii = TM.getIntrinsicInfo())
2542 llvm_report_error(Twine("Cannot yet select: target intrinsic %") +
2543 tii->getName(iid));
2544}
Anton Korobeynikovc1c6ef82009-05-08 18:51:58 +00002545
Devang Patel19974732007-05-03 01:11:54 +00002546char SelectionDAGISel::ID = 0;