blob: cbbd619f0b84ece970765e1962666307a9e38472 [file] [log] [blame]
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001//===-- IA64ISelPattern.cpp - A pattern matching inst selector for IA64 ---===//
Misha Brukman4633f1c2005-04-21 23:13:11 +00002//
Duraid Madina9b9d45f2005-03-17 18:17:03 +00003// The LLVM Compiler Infrastructure
4//
5// This file was developed by Duraid Madina and is distributed under the
6// University of Illinois Open Source License. See LICENSE.TXT for details.
Misha Brukman4633f1c2005-04-21 23:13:11 +00007//
Duraid Madina9b9d45f2005-03-17 18:17:03 +00008//===----------------------------------------------------------------------===//
9//
10// This file defines a pattern matching instruction selector for IA64.
11//
12//===----------------------------------------------------------------------===//
13
14#include "IA64.h"
15#include "IA64InstrBuilder.h"
16#include "IA64RegisterInfo.h"
17#include "IA64MachineFunctionInfo.h"
18#include "llvm/Constants.h" // FIXME: REMOVE
19#include "llvm/Function.h"
20#include "llvm/CodeGen/MachineConstantPool.h" // FIXME: REMOVE
21#include "llvm/CodeGen/MachineFunction.h"
22#include "llvm/CodeGen/MachineFrameInfo.h"
23#include "llvm/CodeGen/SelectionDAG.h"
24#include "llvm/CodeGen/SelectionDAGISel.h"
25#include "llvm/CodeGen/SSARegMap.h"
26#include "llvm/Target/TargetData.h"
27#include "llvm/Target/TargetLowering.h"
28#include "llvm/Support/MathExtras.h"
29#include "llvm/ADT/Statistic.h"
30#include <set>
Duraid Madinab2322562005-04-26 07:23:02 +000031#include <map>
Duraid Madina9b9d45f2005-03-17 18:17:03 +000032#include <algorithm>
33using namespace llvm;
34
35//===----------------------------------------------------------------------===//
36// IA64TargetLowering - IA64 Implementation of the TargetLowering interface
37namespace {
38 class IA64TargetLowering : public TargetLowering {
39 int VarArgsFrameIndex; // FrameIndex for start of varargs area.
Misha Brukman4633f1c2005-04-21 23:13:11 +000040
Duraid Madina9b9d45f2005-03-17 18:17:03 +000041 //int ReturnAddrIndex; // FrameIndex for return slot.
42 unsigned GP, SP, RP; // FIXME - clean this mess up
43 public:
44
45 unsigned VirtGPR; // this is public so it can be accessed in the selector
46 // for ISD::RET down below. add an accessor instead? FIXME
47
48 IA64TargetLowering(TargetMachine &TM) : TargetLowering(TM) {
Misha Brukman4633f1c2005-04-21 23:13:11 +000049
Duraid Madina9b9d45f2005-03-17 18:17:03 +000050 // register class for general registers
51 addRegisterClass(MVT::i64, IA64::GRRegisterClass);
52
53 // register class for FP registers
54 addRegisterClass(MVT::f64, IA64::FPRegisterClass);
Misha Brukman4633f1c2005-04-21 23:13:11 +000055
56 // register class for predicate registers
Duraid Madina9b9d45f2005-03-17 18:17:03 +000057 addRegisterClass(MVT::i1, IA64::PRRegisterClass);
Misha Brukman4633f1c2005-04-21 23:13:11 +000058
Chris Lattnerda4d4692005-04-09 03:22:37 +000059 setOperationAction(ISD::BRCONDTWOWAY , MVT::Other, Expand);
Duraid Madina9b9d45f2005-03-17 18:17:03 +000060 setOperationAction(ISD::FP_ROUND_INREG , MVT::f32 , Expand);
61
Misha Brukman4633f1c2005-04-21 23:13:11 +000062 setSetCCResultType(MVT::i1);
Duraid Madina9b9d45f2005-03-17 18:17:03 +000063 setShiftAmountType(MVT::i64);
64
65 setOperationAction(ISD::EXTLOAD , MVT::i1 , Promote);
Duraid Madina9b9d45f2005-03-17 18:17:03 +000066
67 setOperationAction(ISD::ZEXTLOAD , MVT::i1 , Expand);
Duraid Madina9b9d45f2005-03-17 18:17:03 +000068
69 setOperationAction(ISD::SEXTLOAD , MVT::i1 , Expand);
70 setOperationAction(ISD::SEXTLOAD , MVT::i8 , Expand);
71 setOperationAction(ISD::SEXTLOAD , MVT::i16 , Expand);
Duraid Madinac4ccc2d2005-04-14 08:37:32 +000072 setOperationAction(ISD::SEXTLOAD , MVT::i32 , Expand);
Duraid Madina9b9d45f2005-03-17 18:17:03 +000073
74 setOperationAction(ISD::SREM , MVT::f32 , Expand);
75 setOperationAction(ISD::SREM , MVT::f64 , Expand);
76
77 setOperationAction(ISD::UREM , MVT::f32 , Expand);
78 setOperationAction(ISD::UREM , MVT::f64 , Expand);
Misha Brukman4633f1c2005-04-21 23:13:11 +000079
Duraid Madina9b9d45f2005-03-17 18:17:03 +000080 setOperationAction(ISD::MEMMOVE , MVT::Other, Expand);
81 setOperationAction(ISD::MEMSET , MVT::Other, Expand);
82 setOperationAction(ISD::MEMCPY , MVT::Other, Expand);
83
Chris Lattner17234b72005-04-30 04:26:06 +000084 // We don't support sin/cos/sqrt
85 setOperationAction(ISD::FSIN , MVT::f64, Expand);
86 setOperationAction(ISD::FCOS , MVT::f64, Expand);
87 setOperationAction(ISD::FSQRT, MVT::f64, Expand);
88 setOperationAction(ISD::FSIN , MVT::f32, Expand);
89 setOperationAction(ISD::FCOS , MVT::f32, Expand);
90 setOperationAction(ISD::FSQRT, MVT::f32, Expand);
91
Andrew Lenharthb5884d32005-05-04 19:25:37 +000092 //IA64 has these, but they are not implemented
Chris Lattner1f38e5c2005-05-11 05:03:56 +000093 setOperationAction(ISD::CTTZ , MVT::i64 , Expand);
94 setOperationAction(ISD::CTLZ , MVT::i64 , Expand);
Andrew Lenharthb5884d32005-05-04 19:25:37 +000095
Duraid Madina9b9d45f2005-03-17 18:17:03 +000096 computeRegisterProperties();
97
98 addLegalFPImmediate(+0.0);
99 addLegalFPImmediate(+1.0);
100 addLegalFPImmediate(-0.0);
101 addLegalFPImmediate(-1.0);
102 }
103
104 /// LowerArguments - This hook must be implemented to indicate how we should
105 /// lower the arguments for the specified function, into the specified DAG.
106 virtual std::vector<SDOperand>
107 LowerArguments(Function &F, SelectionDAG &DAG);
108
109 /// LowerCallTo - This hook lowers an abstract call to a function into an
110 /// actual call.
111 virtual std::pair<SDOperand, SDOperand>
Chris Lattnerc57f6822005-05-12 19:56:45 +0000112 LowerCallTo(SDOperand Chain, const Type *RetTy, bool isVarArg, unsigned CC,
Nate Begeman8e21e712005-03-26 01:29:23 +0000113 SDOperand Callee, ArgListTy &Args, SelectionDAG &DAG);
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000114
115 virtual std::pair<SDOperand, SDOperand>
116 LowerVAStart(SDOperand Chain, SelectionDAG &DAG);
117
118 virtual std::pair<SDOperand,SDOperand>
119 LowerVAArgNext(bool isVANext, SDOperand Chain, SDOperand VAList,
120 const Type *ArgTy, SelectionDAG &DAG);
121
122 virtual std::pair<SDOperand, SDOperand>
123 LowerFrameReturnAddress(bool isFrameAddr, SDOperand Chain, unsigned Depth,
124 SelectionDAG &DAG);
125
126 void restoreGP_SP_RP(MachineBasicBlock* BB)
127 {
128 BuildMI(BB, IA64::MOV, 1, IA64::r1).addReg(GP);
129 BuildMI(BB, IA64::MOV, 1, IA64::r12).addReg(SP);
130 BuildMI(BB, IA64::MOV, 1, IA64::rp).addReg(RP);
131 }
132
Duraid Madinabeeaab22005-03-31 12:31:11 +0000133 void restoreSP_RP(MachineBasicBlock* BB)
134 {
135 BuildMI(BB, IA64::MOV, 1, IA64::r12).addReg(SP);
136 BuildMI(BB, IA64::MOV, 1, IA64::rp).addReg(RP);
137 }
138
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000139 void restoreRP(MachineBasicBlock* BB)
140 {
141 BuildMI(BB, IA64::MOV, 1, IA64::rp).addReg(RP);
142 }
143
144 void restoreGP(MachineBasicBlock* BB)
145 {
146 BuildMI(BB, IA64::MOV, 1, IA64::r1).addReg(GP);
147 }
148
149 };
150}
151
152
153std::vector<SDOperand>
154IA64TargetLowering::LowerArguments(Function &F, SelectionDAG &DAG) {
155 std::vector<SDOperand> ArgValues;
156
157 //
158 // add beautiful description of IA64 stack frame format
159 // here (from intel 24535803.pdf most likely)
160 //
161 MachineFunction &MF = DAG.getMachineFunction();
162 MachineFrameInfo *MFI = MF.getFrameInfo();
163
164 GP = MF.getSSARegMap()->createVirtualRegister(getRegClassFor(MVT::i64));
165 SP = MF.getSSARegMap()->createVirtualRegister(getRegClassFor(MVT::i64));
166 RP = MF.getSSARegMap()->createVirtualRegister(getRegClassFor(MVT::i64));
167
168 MachineBasicBlock& BB = MF.front();
169
Misha Brukman4633f1c2005-04-21 23:13:11 +0000170 unsigned args_int[] = {IA64::r32, IA64::r33, IA64::r34, IA64::r35,
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000171 IA64::r36, IA64::r37, IA64::r38, IA64::r39};
Misha Brukman4633f1c2005-04-21 23:13:11 +0000172
173 unsigned args_FP[] = {IA64::F8, IA64::F9, IA64::F10, IA64::F11,
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000174 IA64::F12,IA64::F13,IA64::F14, IA64::F15};
Misha Brukman4633f1c2005-04-21 23:13:11 +0000175
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000176 unsigned argVreg[8];
177 unsigned argPreg[8];
178 unsigned argOpc[8];
179
Duraid Madinabeeaab22005-03-31 12:31:11 +0000180 unsigned used_FPArgs = 0; // how many FP args have been used so far?
Misha Brukman4633f1c2005-04-21 23:13:11 +0000181
Duraid Madinabeeaab22005-03-31 12:31:11 +0000182 unsigned ArgOffset = 0;
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000183 int count = 0;
Misha Brukman4633f1c2005-04-21 23:13:11 +0000184
Alkis Evlogimenos12cf3852005-03-19 09:22:17 +0000185 for (Function::arg_iterator I = F.arg_begin(), E = F.arg_end(); I != E; ++I)
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000186 {
187 SDOperand newroot, argt;
188 if(count < 8) { // need to fix this logic? maybe.
Misha Brukman7847fca2005-04-22 17:54:37 +0000189
190 switch (getValueType(I->getType())) {
191 default:
192 std::cerr << "ERROR in LowerArgs: unknown type "
193 << getValueType(I->getType()) << "\n";
194 abort();
195 case MVT::f32:
196 // fixme? (well, will need to for weird FP structy stuff,
197 // see intel ABI docs)
198 case MVT::f64:
199//XXX BuildMI(&BB, IA64::IDEF, 0, args_FP[used_FPArgs]);
200 MF.addLiveIn(args_FP[used_FPArgs]); // mark this reg as liveIn
201 // floating point args go into f8..f15 as-needed, the increment
202 argVreg[count] = // is below..:
203 MF.getSSARegMap()->createVirtualRegister(getRegClassFor(MVT::f64));
204 // FP args go into f8..f15 as needed: (hence the ++)
205 argPreg[count] = args_FP[used_FPArgs++];
206 argOpc[count] = IA64::FMOV;
207 argt = newroot = DAG.getCopyFromReg(argVreg[count],
208 getValueType(I->getType()), DAG.getRoot());
209 break;
210 case MVT::i1: // NOTE: as far as C abi stuff goes,
211 // bools are just boring old ints
212 case MVT::i8:
213 case MVT::i16:
214 case MVT::i32:
215 case MVT::i64:
216//XXX BuildMI(&BB, IA64::IDEF, 0, args_int[count]);
217 MF.addLiveIn(args_int[count]); // mark this register as liveIn
218 argVreg[count] =
219 MF.getSSARegMap()->createVirtualRegister(getRegClassFor(MVT::i64));
220 argPreg[count] = args_int[count];
221 argOpc[count] = IA64::MOV;
222 argt = newroot =
223 DAG.getCopyFromReg(argVreg[count], MVT::i64, DAG.getRoot());
224 if ( getValueType(I->getType()) != MVT::i64)
225 argt = DAG.getNode(ISD::TRUNCATE, getValueType(I->getType()),
226 newroot);
227 break;
228 }
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000229 } else { // more than 8 args go into the frame
Misha Brukman7847fca2005-04-22 17:54:37 +0000230 // Create the frame index object for this incoming parameter...
231 ArgOffset = 16 + 8 * (count - 8);
232 int FI = MFI->CreateFixedObject(8, ArgOffset);
233
234 // Create the SelectionDAG nodes corresponding to a load
235 //from this parameter
236 SDOperand FIN = DAG.getFrameIndex(FI, MVT::i64);
237 argt = newroot = DAG.getLoad(getValueType(I->getType()),
Andrew Lenharth2d86ea22005-04-27 20:10:01 +0000238 DAG.getEntryNode(), FIN, DAG.getSrcValue(NULL));
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000239 }
240 ++count;
241 DAG.setRoot(newroot.getValue(1));
242 ArgValues.push_back(argt);
Misha Brukman4633f1c2005-04-21 23:13:11 +0000243 }
Duraid Madinabeeaab22005-03-31 12:31:11 +0000244
Misha Brukman4633f1c2005-04-21 23:13:11 +0000245
Duraid Madinabeeaab22005-03-31 12:31:11 +0000246 // Create a vreg to hold the output of (what will become)
247 // the "alloc" instruction
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000248 VirtGPR = MF.getSSARegMap()->createVirtualRegister(getRegClassFor(MVT::i64));
249 BuildMI(&BB, IA64::PSEUDO_ALLOC, 0, VirtGPR);
250 // we create a PSEUDO_ALLOC (pseudo)instruction for now
251
252 BuildMI(&BB, IA64::IDEF, 0, IA64::r1);
253
254 // hmm:
255 BuildMI(&BB, IA64::IDEF, 0, IA64::r12);
256 BuildMI(&BB, IA64::IDEF, 0, IA64::rp);
257 // ..hmm.
258
259 BuildMI(&BB, IA64::MOV, 1, GP).addReg(IA64::r1);
260
261 // hmm:
262 BuildMI(&BB, IA64::MOV, 1, SP).addReg(IA64::r12);
263 BuildMI(&BB, IA64::MOV, 1, RP).addReg(IA64::rp);
264 // ..hmm.
265
Duraid Madinabeeaab22005-03-31 12:31:11 +0000266 unsigned tempOffset=0;
Misha Brukman4633f1c2005-04-21 23:13:11 +0000267
Duraid Madinabeeaab22005-03-31 12:31:11 +0000268 // if this is a varargs function, we simply lower llvm.va_start by
269 // pointing to the first entry
270 if(F.isVarArg()) {
271 tempOffset=0;
272 VarArgsFrameIndex = MFI->CreateFixedObject(8, tempOffset);
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000273 }
Misha Brukman4633f1c2005-04-21 23:13:11 +0000274
Duraid Madinabeeaab22005-03-31 12:31:11 +0000275 // here we actually do the moving of args, and store them to the stack
276 // too if this is a varargs function:
277 for (int i = 0; i < count && i < 8; ++i) {
278 BuildMI(&BB, argOpc[i], 1, argVreg[i]).addReg(argPreg[i]);
279 if(F.isVarArg()) {
280 // if this is a varargs function, we copy the input registers to the stack
281 int FI = MFI->CreateFixedObject(8, tempOffset);
282 tempOffset+=8; //XXX: is it safe to use r22 like this?
283 BuildMI(&BB, IA64::MOV, 1, IA64::r22).addFrameIndex(FI);
284 // FIXME: we should use st8.spill here, one day
285 BuildMI(&BB, IA64::ST8, 1, IA64::r22).addReg(argPreg[i]);
286 }
287 }
288
Duraid Madinaca494fd2005-04-12 14:54:44 +0000289 // Finally, inform the code generator which regs we return values in.
290 // (see the ISD::RET: case down below)
291 switch (getValueType(F.getReturnType())) {
292 default: assert(0 && "i have no idea where to return this type!");
293 case MVT::isVoid: break;
294 case MVT::i1:
295 case MVT::i8:
296 case MVT::i16:
297 case MVT::i32:
298 case MVT::i64:
299 MF.addLiveOut(IA64::r8);
300 break;
301 case MVT::f32:
302 case MVT::f64:
303 MF.addLiveOut(IA64::F8);
304 break;
305 }
Misha Brukman4633f1c2005-04-21 23:13:11 +0000306
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000307 return ArgValues;
308}
Misha Brukman4633f1c2005-04-21 23:13:11 +0000309
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000310std::pair<SDOperand, SDOperand>
311IA64TargetLowering::LowerCallTo(SDOperand Chain,
Misha Brukman7847fca2005-04-22 17:54:37 +0000312 const Type *RetTy, bool isVarArg,
Chris Lattnerc57f6822005-05-12 19:56:45 +0000313 unsigned CallingConv,
Misha Brukman7847fca2005-04-22 17:54:37 +0000314 SDOperand Callee, ArgListTy &Args,
315 SelectionDAG &DAG) {
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000316
317 MachineFunction &MF = DAG.getMachineFunction();
318
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000319 unsigned NumBytes = 16;
Duraid Madinabeeaab22005-03-31 12:31:11 +0000320 unsigned outRegsUsed = 0;
321
322 if (Args.size() > 8) {
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000323 NumBytes += (Args.size() - 8) * 8;
Duraid Madinabeeaab22005-03-31 12:31:11 +0000324 outRegsUsed = 8;
325 } else {
326 outRegsUsed = Args.size();
327 }
Misha Brukman4633f1c2005-04-21 23:13:11 +0000328
Duraid Madinabeeaab22005-03-31 12:31:11 +0000329 // FIXME? this WILL fail if we ever try to pass around an arg that
330 // consumes more than a single output slot (a 'real' double, int128
331 // some sort of aggregate etc.), as we'll underestimate how many 'outX'
332 // registers we use. Hopefully, the assembler will notice.
333 MF.getInfo<IA64FunctionInfo>()->outRegsUsed=
334 std::max(outRegsUsed, MF.getInfo<IA64FunctionInfo>()->outRegsUsed);
Misha Brukman4633f1c2005-04-21 23:13:11 +0000335
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000336 Chain = DAG.getNode(ISD::ADJCALLSTACKDOWN, MVT::Other, Chain,
337 DAG.getConstant(NumBytes, getPointerTy()));
Misha Brukman4633f1c2005-04-21 23:13:11 +0000338
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000339 std::vector<SDOperand> args_to_use;
340 for (unsigned i = 0, e = Args.size(); i != e; ++i)
341 {
342 switch (getValueType(Args[i].second)) {
343 default: assert(0 && "unexpected argument type!");
344 case MVT::i1:
345 case MVT::i8:
346 case MVT::i16:
347 case MVT::i32:
Misha Brukman7847fca2005-04-22 17:54:37 +0000348 //promote to 64-bits, sign/zero extending based on type
349 //of the argument
350 if(Args[i].second->isSigned())
351 Args[i].first = DAG.getNode(ISD::SIGN_EXTEND, MVT::i64,
352 Args[i].first);
353 else
354 Args[i].first = DAG.getNode(ISD::ZERO_EXTEND, MVT::i64,
355 Args[i].first);
356 break;
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000357 case MVT::f32:
Misha Brukman7847fca2005-04-22 17:54:37 +0000358 //promote to 64-bits
359 Args[i].first = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Args[i].first);
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000360 case MVT::f64:
361 case MVT::i64:
362 break;
363 }
364 args_to_use.push_back(Args[i].first);
365 }
366
367 std::vector<MVT::ValueType> RetVals;
368 MVT::ValueType RetTyVT = getValueType(RetTy);
369 if (RetTyVT != MVT::isVoid)
370 RetVals.push_back(RetTyVT);
371 RetVals.push_back(MVT::Other);
372
373 SDOperand TheCall = SDOperand(DAG.getCall(RetVals, Chain,
Misha Brukman7847fca2005-04-22 17:54:37 +0000374 Callee, args_to_use), 0);
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000375 Chain = TheCall.getValue(RetTyVT != MVT::isVoid);
376 Chain = DAG.getNode(ISD::ADJCALLSTACKUP, MVT::Other, Chain,
377 DAG.getConstant(NumBytes, getPointerTy()));
378 return std::make_pair(TheCall, Chain);
379}
380
381std::pair<SDOperand, SDOperand>
382IA64TargetLowering::LowerVAStart(SDOperand Chain, SelectionDAG &DAG) {
383 // vastart just returns the address of the VarArgsFrameIndex slot.
384 return std::make_pair(DAG.getFrameIndex(VarArgsFrameIndex, MVT::i64), Chain);
385}
386
387std::pair<SDOperand,SDOperand> IA64TargetLowering::
388LowerVAArgNext(bool isVANext, SDOperand Chain, SDOperand VAList,
389 const Type *ArgTy, SelectionDAG &DAG) {
Duraid Madinabeeaab22005-03-31 12:31:11 +0000390
391 MVT::ValueType ArgVT = getValueType(ArgTy);
392 SDOperand Result;
393 if (!isVANext) {
Andrew Lenharth2d86ea22005-04-27 20:10:01 +0000394 Result = DAG.getLoad(ArgVT, DAG.getEntryNode(), VAList, DAG.getSrcValue(NULL));
Duraid Madinabeeaab22005-03-31 12:31:11 +0000395 } else {
396 unsigned Amt;
397 if (ArgVT == MVT::i32 || ArgVT == MVT::f32)
398 Amt = 8;
399 else {
400 assert((ArgVT == MVT::i64 || ArgVT == MVT::f64) &&
401 "Other types should have been promoted for varargs!");
402 Amt = 8;
403 }
404 Result = DAG.getNode(ISD::ADD, VAList.getValueType(), VAList,
405 DAG.getConstant(Amt, VAList.getValueType()));
406 }
407 return std::make_pair(Result, Chain);
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000408}
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000409
410std::pair<SDOperand, SDOperand> IA64TargetLowering::
411LowerFrameReturnAddress(bool isFrameAddress, SDOperand Chain, unsigned Depth,
412 SelectionDAG &DAG) {
413
414 assert(0 && "LowerFrameReturnAddress not done yet\n");
Duraid Madina817aed42005-03-17 19:00:40 +0000415 abort();
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000416}
417
418
419namespace {
420
421 //===--------------------------------------------------------------------===//
422 /// ISel - IA64 specific code to select IA64 machine instructions for
423 /// SelectionDAG operations.
424 ///
425 class ISel : public SelectionDAGISel {
426 /// IA64Lowering - This object fully describes how to lower LLVM code to an
427 /// IA64-specific SelectionDAG.
428 IA64TargetLowering IA64Lowering;
Duraid Madinab2322562005-04-26 07:23:02 +0000429 SelectionDAG *ISelDAG; // Hack to support us having a dag->dag transform
430 // for sdiv and udiv until it is put into the future
431 // dag combiner
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000432
433 /// ExprMap - As shared expressions are codegen'd, we keep track of which
434 /// vreg the value is produced in, so we only emit one copy of each compiled
435 /// tree.
436 std::map<SDOperand, unsigned> ExprMap;
437 std::set<SDOperand> LoweredTokens;
438
439 public:
Duraid Madinab2322562005-04-26 07:23:02 +0000440 ISel(TargetMachine &TM) : SelectionDAGISel(IA64Lowering), IA64Lowering(TM),
441 ISelDAG(0) { }
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000442
443 /// InstructionSelectBasicBlock - This callback is invoked by
444 /// SelectionDAGISel when it has created a SelectionDAG for us to codegen.
445 virtual void InstructionSelectBasicBlock(SelectionDAG &DAG);
446
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000447 unsigned SelectExpr(SDOperand N);
448 void Select(SDOperand N);
Duraid Madinab2322562005-04-26 07:23:02 +0000449 // a dag->dag to transform mul-by-constant-int to shifts+adds/subs
450 SDOperand BuildConstmulSequence(SDOperand N);
451
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000452 };
453}
454
455/// InstructionSelectBasicBlock - This callback is invoked by SelectionDAGISel
456/// when it has created a SelectionDAG for us to codegen.
457void ISel::InstructionSelectBasicBlock(SelectionDAG &DAG) {
458
459 // Codegen the basic block.
Duraid Madinab2322562005-04-26 07:23:02 +0000460 ISelDAG = &DAG;
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000461 Select(DAG.getRoot());
462
463 // Clear state used for selection.
464 ExprMap.clear();
465 LoweredTokens.clear();
Duraid Madinab2322562005-04-26 07:23:02 +0000466 ISelDAG = 0;
467}
468
Duraid Madinab2322562005-04-26 07:23:02 +0000469// strip leading '0' characters from a string
470void munchLeadingZeros(std::string& inString) {
471 while(inString.c_str()[0]=='0') {
472 inString.erase(0, 1);
473 }
474}
475
476// strip trailing '0' characters from a string
477void munchTrailingZeros(std::string& inString) {
478 int curPos=inString.length()-1;
479
480 while(inString.c_str()[curPos]=='0') {
481 inString.erase(curPos, 1);
482 curPos--;
483 }
484}
485
486// return how many consecutive '0' characters are at the end of a string
487unsigned int countTrailingZeros(std::string& inString) {
488 int curPos=inString.length()-1;
489 unsigned int zeroCount=0;
490 // assert goes here
491 while(inString.c_str()[curPos--]=='0') {
492 zeroCount++;
493 }
494 return zeroCount;
495}
496
497// booth encode a string of '1' and '0' characters (returns string of 'P' (+1)
498// '0' and 'N' (-1) characters)
499void boothEncode(std::string inString, std::string& boothEncodedString) {
500
501 int curpos=0;
502 int replacements=0;
503 int lim=inString.size();
504
505 while(curpos<lim) {
506 if(inString[curpos]=='1') { // if we see a '1', look for a run of them
507 int runlength=0;
508 std::string replaceString="N";
509
510 // find the run length
511 for(;inString[curpos+runlength]=='1';runlength++) ;
512
513 for(int i=0; i<runlength-1; i++)
514 replaceString+="0";
515 replaceString+="1";
516
517 if(runlength>1) {
518 inString.replace(curpos, runlength+1, replaceString);
519 curpos+=runlength-1;
520 } else
521 curpos++;
522 } else { // a zero, we just keep chugging along
523 curpos++;
524 }
525 }
526
527 // clean up (trim the string, reverse it and turn '1's into 'P's)
528 munchTrailingZeros(inString);
529 boothEncodedString="";
530
531 for(int i=inString.size()-1;i>=0;i--)
532 if(inString[i]=='1')
533 boothEncodedString+="P";
534 else
535 boothEncodedString+=inString[i];
536
537}
538
539struct shiftaddblob { // this encodes stuff like (x=) "A << B [+-] C << D"
540 unsigned firstVal; // A
541 unsigned firstShift; // B
542 unsigned secondVal; // C
543 unsigned secondShift; // D
544 bool isSub;
545};
546
547/* this implements Lefevre's "pattern-based" constant multiplication,
548 * see "Multiplication by an Integer Constant", INRIA report 1999-06
549 *
550 * TODO: implement a method to try rewriting P0N<->0PP / N0P<->0NN
551 * to get better booth encodings - this does help in practice
552 * TODO: weight shifts appropriately (most architectures can't
553 * fuse a shift and an add for arbitrary shift amounts) */
554unsigned lefevre(const std::string inString,
555 std::vector<struct shiftaddblob> &ops) {
556 std::string retstring;
557 std::string s = inString;
558 munchTrailingZeros(s);
559
560 int length=s.length()-1;
561
562 if(length==0) {
563 return(0);
564 }
565
566 std::vector<int> p,n;
567
568 for(int i=0; i<=length; i++) {
569 if (s.c_str()[length-i]=='P') {
570 p.push_back(i);
571 } else if (s.c_str()[length-i]=='N') {
572 n.push_back(i);
573 }
574 }
575
576 std::string t, u;
Duraid Madina4706c032005-04-26 09:42:50 +0000577 int c;
578 bool f;
Duraid Madinab2322562005-04-26 07:23:02 +0000579 std::map<const int, int> w;
580
Duraid Madina85d5f602005-04-27 11:57:39 +0000581 for(unsigned i=0; i<p.size(); i++) {
582 for(unsigned j=0; j<i; j++) {
Duraid Madinab2322562005-04-26 07:23:02 +0000583 w[p[i]-p[j]]++;
584 }
585 }
586
Duraid Madina85d5f602005-04-27 11:57:39 +0000587 for(unsigned i=1; i<n.size(); i++) {
588 for(unsigned j=0; j<i; j++) {
Duraid Madinab2322562005-04-26 07:23:02 +0000589 w[n[i]-n[j]]++;
590 }
591 }
592
Duraid Madina85d5f602005-04-27 11:57:39 +0000593 for(unsigned i=0; i<p.size(); i++) {
594 for(unsigned j=0; j<n.size(); j++) {
Duraid Madinab2322562005-04-26 07:23:02 +0000595 w[-abs(p[i]-n[j])]++;
596 }
597 }
598
599 std::map<const int, int>::const_iterator ii;
600 std::vector<int> d;
601 std::multimap<int, int> sorted_by_value;
602
603 for(ii = w.begin(); ii!=w.end(); ii++)
604 sorted_by_value.insert(std::pair<int, int>((*ii).second,(*ii).first));
605
606 for (std::multimap<int, int>::iterator it = sorted_by_value.begin();
607 it != sorted_by_value.end(); ++it) {
608 d.push_back((*it).second);
609 }
610
611 int int_W=0;
612 int int_d;
613
614 while(d.size()>0 && (w[int_d=d.back()] > int_W)) {
615 d.pop_back();
616 retstring=s; // hmmm
617 int x=0;
618 int z=abs(int_d)-1;
619
620 if(int_d>0) {
621
Duraid Madina85d5f602005-04-27 11:57:39 +0000622 for(unsigned base=0; base<retstring.size(); base++) {
Duraid Madinab2322562005-04-26 07:23:02 +0000623 if( ((base+z+1) < retstring.size()) &&
624 retstring.c_str()[base]=='P' &&
625 retstring.c_str()[base+z+1]=='P')
626 {
627 // match
628 x++;
629 retstring.replace(base, 1, "0");
630 retstring.replace(base+z+1, 1, "p");
631 }
632 }
633
Duraid Madina85d5f602005-04-27 11:57:39 +0000634 for(unsigned base=0; base<retstring.size(); base++) {
Duraid Madinab2322562005-04-26 07:23:02 +0000635 if( ((base+z+1) < retstring.size()) &&
636 retstring.c_str()[base]=='N' &&
637 retstring.c_str()[base+z+1]=='N')
638 {
639 // match
640 x++;
641 retstring.replace(base, 1, "0");
642 retstring.replace(base+z+1, 1, "n");
643 }
644 }
645
646 } else {
Duraid Madina85d5f602005-04-27 11:57:39 +0000647 for(unsigned base=0; base<retstring.size(); base++) {
Duraid Madinab2322562005-04-26 07:23:02 +0000648 if( ((base+z+1) < retstring.size()) &&
649 ((retstring.c_str()[base]=='P' &&
650 retstring.c_str()[base+z+1]=='N') ||
651 (retstring.c_str()[base]=='N' &&
652 retstring.c_str()[base+z+1]=='P')) ) {
653 // match
654 x++;
655
656 if(retstring.c_str()[base]=='P') {
657 retstring.replace(base, 1, "0");
658 retstring.replace(base+z+1, 1, "p");
659 } else { // retstring[base]=='N'
660 retstring.replace(base, 1, "0");
661 retstring.replace(base+z+1, 1, "n");
662 }
663 }
664 }
665 }
666
667 if(x>int_W) {
668 int_W = x;
669 t = retstring;
670 c = int_d; // tofix
671 }
672
673 } d.pop_back(); // hmm
674
675 u = t;
676
Duraid Madina85d5f602005-04-27 11:57:39 +0000677 for(unsigned i=0; i<t.length(); i++) {
Duraid Madinab2322562005-04-26 07:23:02 +0000678 if(t.c_str()[i]=='p' || t.c_str()[i]=='n')
679 t.replace(i, 1, "0");
680 }
681
Duraid Madina85d5f602005-04-27 11:57:39 +0000682 for(unsigned i=0; i<u.length(); i++) {
Duraid Madina8a3042c2005-05-09 13:18:34 +0000683 if(u[i]=='P' || u[i]=='N')
Duraid Madinab2322562005-04-26 07:23:02 +0000684 u.replace(i, 1, "0");
Duraid Madina8a3042c2005-05-09 13:18:34 +0000685 if(u[i]=='p')
Duraid Madinab2322562005-04-26 07:23:02 +0000686 u.replace(i, 1, "P");
Duraid Madina8a3042c2005-05-09 13:18:34 +0000687 if(u[i]=='n')
Duraid Madinab2322562005-04-26 07:23:02 +0000688 u.replace(i, 1, "N");
689 }
690
691 if( c<0 ) {
Duraid Madina4706c032005-04-26 09:42:50 +0000692 f=true;
Duraid Madinab2322562005-04-26 07:23:02 +0000693 c=-c;
694 } else
Duraid Madina4706c032005-04-26 09:42:50 +0000695 f=false;
Duraid Madinab2322562005-04-26 07:23:02 +0000696
Duraid Madina8a3042c2005-05-09 13:18:34 +0000697 int pos=0;
698 while(u[pos]=='0')
699 pos++;
700
701 bool hit=(u[pos]=='N');
Duraid Madinab2322562005-04-26 07:23:02 +0000702
703 int g=0;
704 if(hit) {
705 g=1;
Duraid Madina85d5f602005-04-27 11:57:39 +0000706 for(unsigned p=0; p<u.length(); p++) {
Duraid Madina8a3042c2005-05-09 13:18:34 +0000707 bool isP=(u[p]=='P');
708 bool isN=(u[p]=='N');
Duraid Madinab2322562005-04-26 07:23:02 +0000709
710 if(isP)
711 u.replace(p, 1, "N");
712 if(isN)
713 u.replace(p, 1, "P");
714 }
715 }
716
717 munchLeadingZeros(u);
718
719 int i = lefevre(u, ops);
720
721 shiftaddblob blob;
722
723 blob.firstVal=i; blob.firstShift=c;
724 blob.isSub=f;
725 blob.secondVal=i; blob.secondShift=0;
726
727 ops.push_back(blob);
728
729 i = ops.size();
730
731 munchLeadingZeros(t);
732
733 if(t.length()==0)
734 return i;
735
736 if(t.c_str()[0]!='P') {
737 g=2;
Duraid Madina85d5f602005-04-27 11:57:39 +0000738 for(unsigned p=0; p<t.length(); p++) {
Duraid Madinab2322562005-04-26 07:23:02 +0000739 bool isP=(t.c_str()[p]=='P');
740 bool isN=(t.c_str()[p]=='N');
741
742 if(isP)
743 t.replace(p, 1, "N");
744 if(isN)
745 t.replace(p, 1, "P");
746 }
747 }
748
749 int j = lefevre(t, ops);
750
751 int trail=countTrailingZeros(u);
752 blob.secondVal=i; blob.secondShift=trail;
753
754 trail=countTrailingZeros(t);
755 blob.firstVal=j; blob.firstShift=trail;
756
757 switch(g) {
758 case 0:
759 blob.isSub=false; // first + second
760 break;
761 case 1:
762 blob.isSub=true; // first - second
763 break;
764 case 2:
765 blob.isSub=true; // second - first
766 int tmpval, tmpshift;
767 tmpval=blob.firstVal;
768 tmpshift=blob.firstShift;
769 blob.firstVal=blob.secondVal;
770 blob.firstShift=blob.secondShift;
771 blob.secondVal=tmpval;
772 blob.secondShift=tmpshift;
773 break;
774 //assert
775 }
776
777 ops.push_back(blob);
778 return ops.size();
779}
780
781SDOperand ISel::BuildConstmulSequence(SDOperand N) {
782 //FIXME: we should shortcut this stuff for multiplies by 2^n+1
783 // in particular, *3 is nicer as *2+1, not *4-1
784 int64_t constant=cast<ConstantSDNode>(N.getOperand(1))->getValue();
785
786 bool flippedSign;
787 unsigned preliminaryShift=0;
788
Duraid Madina40c9e6b2005-05-02 07:27:14 +0000789 assert(constant != 0 && "erk, you're trying to multiply by constant zero\n");
Duraid Madinab2322562005-04-26 07:23:02 +0000790
791 // first, we make the constant to multiply by positive
792 if(constant<0) {
793 constant=-constant;
794 flippedSign=true;
795 } else {
796 flippedSign=false;
797 }
798
799 // next, we make it odd.
800 for(; (constant%2==0); preliminaryShift++)
801 constant>>=1;
802
803 //OK, we have a positive, odd number of 64 bits or less. Convert it
804 //to a binary string, constantString[0] is the LSB
805 char constantString[65];
806 for(int i=0; i<64; i++)
807 constantString[i]='0'+((constant>>i)&0x1);
808 constantString[64]=0;
809
810 // now, Booth encode it
811 std::string boothEncodedString;
812 boothEncode(constantString, boothEncodedString);
813
814 std::vector<struct shiftaddblob> ops;
815 // do the transformation, filling out 'ops'
816 lefevre(boothEncodedString, ops);
817
818 SDOperand results[ops.size()]; // temporary results (of adds/subs of shifts)
819
820 // now turn 'ops' into DAG bits
Duraid Madina85d5f602005-04-27 11:57:39 +0000821 for(unsigned i=0; i<ops.size(); i++) {
Duraid Madinab2322562005-04-26 07:23:02 +0000822 SDOperand amt = ISelDAG->getConstant(ops[i].firstShift, MVT::i64);
823 SDOperand val = (ops[i].firstVal == 0) ? N.getOperand(0) :
824 results[ops[i].firstVal-1];
825 SDOperand left = ISelDAG->getNode(ISD::SHL, MVT::i64, val, amt);
826 amt = ISelDAG->getConstant(ops[i].secondShift, MVT::i64);
827 val = (ops[i].secondVal == 0) ? N.getOperand(0) :
828 results[ops[i].secondVal-1];
829 SDOperand right = ISelDAG->getNode(ISD::SHL, MVT::i64, val, amt);
830 if(ops[i].isSub)
831 results[i] = ISelDAG->getNode(ISD::SUB, MVT::i64, left, right);
832 else
833 results[i] = ISelDAG->getNode(ISD::ADD, MVT::i64, left, right);
834 }
835
836 // don't forget flippedSign and preliminaryShift!
Duraid Madina40c9e6b2005-05-02 07:27:14 +0000837 SDOperand shiftedresult;
Duraid Madinab2322562005-04-26 07:23:02 +0000838 if(preliminaryShift) {
839 SDOperand finalshift = ISelDAG->getConstant(preliminaryShift, MVT::i64);
Duraid Madina40c9e6b2005-05-02 07:27:14 +0000840 shiftedresult = ISelDAG->getNode(ISD::SHL, MVT::i64,
Duraid Madinab2322562005-04-26 07:23:02 +0000841 results[ops.size()-1], finalshift);
842 } else { // there was no preliminary divide-by-power-of-2 required
Duraid Madina40c9e6b2005-05-02 07:27:14 +0000843 shiftedresult = results[ops.size()-1];
Duraid Madinab2322562005-04-26 07:23:02 +0000844 }
845
Duraid Madina40c9e6b2005-05-02 07:27:14 +0000846 SDOperand finalresult;
847 if(flippedSign) { // if we were multiplying by a negative constant:
848 SDOperand zero = ISelDAG->getConstant(0, MVT::i64);
849 // subtract the result from 0 to flip its sign
850 finalresult = ISelDAG->getNode(ISD::SUB, MVT::i64, zero, shiftedresult);
851 } else { // there was no preliminary multiply by -1 required
852 finalresult = shiftedresult;
853 }
854
Duraid Madinab2322562005-04-26 07:23:02 +0000855 return finalresult;
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000856}
857
Duraid Madina4826a072005-04-06 09:55:17 +0000858/// ExactLog2 - This function solves for (Val == 1 << (N-1)) and returns N. It
859/// returns zero when the input is not exactly a power of two.
Duraid Madinac02780e2005-04-13 04:50:54 +0000860static unsigned ExactLog2(uint64_t Val) {
Duraid Madina4826a072005-04-06 09:55:17 +0000861 if (Val == 0 || (Val & (Val-1))) return 0;
862 unsigned Count = 0;
863 while (Val != 1) {
864 Val >>= 1;
865 ++Count;
866 }
867 return Count;
868}
869
Duraid Madinac02780e2005-04-13 04:50:54 +0000870/// ExactLog2sub1 - This function solves for (Val == (1 << (N-1))-1)
871/// and returns N. It returns 666 if Val is not 2^n -1 for some n.
872static unsigned ExactLog2sub1(uint64_t Val) {
873 unsigned int n;
874 for(n=0; n<64; n++) {
Duraid Madina3eb71502005-04-14 10:06:35 +0000875 if(Val==(uint64_t)((1LL<<n)-1))
Duraid Madinac02780e2005-04-13 04:50:54 +0000876 return n;
877 }
878 return 666;
879}
880
Duraid Madina4826a072005-04-06 09:55:17 +0000881/// ponderIntegerDivisionBy - When handling integer divides, if the divide
882/// is by a constant such that we can efficiently codegen it, this
883/// function says what to do. Currently, it returns 0 if the division must
884/// become a genuine divide, and 1 if the division can be turned into a
885/// right shift.
886static unsigned ponderIntegerDivisionBy(SDOperand N, bool isSigned,
887 unsigned& Imm) {
888 if (N.getOpcode() != ISD::Constant) return 0; // if not a divide by
889 // a constant, give up.
890
891 int64_t v = (int64_t)cast<ConstantSDNode>(N)->getSignExtended();
892
Misha Brukman4633f1c2005-04-21 23:13:11 +0000893 if ((Imm = ExactLog2(v))) { // if a division by a power of two, say so
Duraid Madina4826a072005-04-06 09:55:17 +0000894 return 1;
Misha Brukman4633f1c2005-04-21 23:13:11 +0000895 }
896
Duraid Madina4826a072005-04-06 09:55:17 +0000897 return 0; // fallthrough
898}
899
Duraid Madinac02780e2005-04-13 04:50:54 +0000900static unsigned ponderIntegerAndWith(SDOperand N, unsigned& Imm) {
901 if (N.getOpcode() != ISD::Constant) return 0; // if not ANDing with
902 // a constant, give up.
903
904 int64_t v = (int64_t)cast<ConstantSDNode>(N)->getSignExtended();
905
906 if ((Imm = ExactLog2sub1(v))!=666) { // if ANDing with ((2^n)-1) for some n
907 return 1; // say so
Misha Brukman4633f1c2005-04-21 23:13:11 +0000908 }
909
Duraid Madinac02780e2005-04-13 04:50:54 +0000910 return 0; // fallthrough
911}
912
Duraid Madinaf55e4032005-04-07 12:33:38 +0000913static unsigned ponderIntegerAdditionWith(SDOperand N, unsigned& Imm) {
914 if (N.getOpcode() != ISD::Constant) return 0; // if not adding a
915 // constant, give up.
916 int64_t v = (int64_t)cast<ConstantSDNode>(N)->getSignExtended();
917
918 if (v <= 8191 && v >= -8192) { // if this constants fits in 14 bits, say so
919 Imm = v & 0x3FFF; // 14 bits
920 return 1;
Misha Brukman4633f1c2005-04-21 23:13:11 +0000921 }
Duraid Madinaf55e4032005-04-07 12:33:38 +0000922 return 0; // fallthrough
923}
924
925static unsigned ponderIntegerSubtractionFrom(SDOperand N, unsigned& Imm) {
926 if (N.getOpcode() != ISD::Constant) return 0; // if not subtracting a
927 // constant, give up.
928 int64_t v = (int64_t)cast<ConstantSDNode>(N)->getSignExtended();
929
930 if (v <= 127 && v >= -128) { // if this constants fits in 8 bits, say so
931 Imm = v & 0xFF; // 8 bits
932 return 1;
Misha Brukman4633f1c2005-04-21 23:13:11 +0000933 }
Duraid Madinaf55e4032005-04-07 12:33:38 +0000934 return 0; // fallthrough
935}
936
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000937unsigned ISel::SelectExpr(SDOperand N) {
938 unsigned Result;
939 unsigned Tmp1, Tmp2, Tmp3;
940 unsigned Opc = 0;
941 MVT::ValueType DestType = N.getValueType();
942
943 unsigned opcode = N.getOpcode();
944
945 SDNode *Node = N.Val;
946 SDOperand Op0, Op1;
947
948 if (Node->getOpcode() == ISD::CopyFromReg)
949 // Just use the specified register as our input.
950 return dyn_cast<RegSDNode>(Node)->getReg();
Misha Brukman4633f1c2005-04-21 23:13:11 +0000951
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000952 unsigned &Reg = ExprMap[N];
953 if (Reg) return Reg;
Misha Brukman4633f1c2005-04-21 23:13:11 +0000954
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000955 if (N.getOpcode() != ISD::CALL)
956 Reg = Result = (N.getValueType() != MVT::Other) ?
957 MakeReg(N.getValueType()) : 1;
958 else {
959 // If this is a call instruction, make sure to prepare ALL of the result
960 // values as well as the chain.
961 if (Node->getNumValues() == 1)
962 Reg = Result = 1; // Void call, just a chain.
963 else {
964 Result = MakeReg(Node->getValueType(0));
965 ExprMap[N.getValue(0)] = Result;
966 for (unsigned i = 1, e = N.Val->getNumValues()-1; i != e; ++i)
967 ExprMap[N.getValue(i)] = MakeReg(Node->getValueType(i));
968 ExprMap[SDOperand(Node, Node->getNumValues()-1)] = 1;
969 }
970 }
Misha Brukman4633f1c2005-04-21 23:13:11 +0000971
Duraid Madina9b9d45f2005-03-17 18:17:03 +0000972 switch (N.getOpcode()) {
973 default:
974 Node->dump();
975 assert(0 && "Node not handled!\n");
976
977 case ISD::FrameIndex: {
978 Tmp1 = cast<FrameIndexSDNode>(N)->getIndex();
979 BuildMI(BB, IA64::MOV, 1, Result).addFrameIndex(Tmp1);
980 return Result;
981 }
982
983 case ISD::ConstantPool: {
984 Tmp1 = cast<ConstantPoolSDNode>(N)->getIndex();
985 IA64Lowering.restoreGP(BB); // FIXME: do i really need this?
986 BuildMI(BB, IA64::ADD, 2, Result).addConstantPoolIndex(Tmp1)
987 .addReg(IA64::r1);
988 return Result;
989 }
990
991 case ISD::ConstantFP: {
992 Tmp1 = Result; // Intermediate Register
993 if (cast<ConstantFPSDNode>(N)->getValue() < 0.0 ||
994 cast<ConstantFPSDNode>(N)->isExactlyValue(-0.0))
995 Tmp1 = MakeReg(MVT::f64);
996
997 if (cast<ConstantFPSDNode>(N)->isExactlyValue(+0.0) ||
998 cast<ConstantFPSDNode>(N)->isExactlyValue(-0.0))
999 BuildMI(BB, IA64::FMOV, 1, Tmp1).addReg(IA64::F0); // load 0.0
1000 else if (cast<ConstantFPSDNode>(N)->isExactlyValue(+1.0) ||
1001 cast<ConstantFPSDNode>(N)->isExactlyValue(-1.0))
1002 BuildMI(BB, IA64::FMOV, 1, Tmp1).addReg(IA64::F1); // load 1.0
1003 else
1004 assert(0 && "Unexpected FP constant!");
1005 if (Tmp1 != Result)
1006 // we multiply by +1.0, negate (this is FNMA), and then add 0.0
1007 BuildMI(BB, IA64::FNMA, 3, Result).addReg(Tmp1).addReg(IA64::F1)
Misha Brukman7847fca2005-04-22 17:54:37 +00001008 .addReg(IA64::F0);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001009 return Result;
1010 }
1011
1012 case ISD::DYNAMIC_STACKALLOC: {
1013 // Generate both result values.
1014 if (Result != 1)
1015 ExprMap[N.getValue(1)] = 1; // Generate the token
1016 else
1017 Result = ExprMap[N.getValue(0)] = MakeReg(N.getValue(0).getValueType());
1018
1019 // FIXME: We are currently ignoring the requested alignment for handling
1020 // greater than the stack alignment. This will need to be revisited at some
1021 // point. Align = N.getOperand(2);
1022
1023 if (!isa<ConstantSDNode>(N.getOperand(2)) ||
1024 cast<ConstantSDNode>(N.getOperand(2))->getValue() != 0) {
1025 std::cerr << "Cannot allocate stack object with greater alignment than"
1026 << " the stack alignment yet!";
1027 abort();
1028 }
Misha Brukman4633f1c2005-04-21 23:13:11 +00001029
1030/*
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001031 Select(N.getOperand(0));
1032 if (ConstantSDNode* CN = dyn_cast<ConstantSDNode>(N.getOperand(1)))
1033 {
1034 if (CN->getValue() < 32000)
1035 {
1036 BuildMI(BB, IA64::ADDIMM22, 2, IA64::r12).addReg(IA64::r12)
Misha Brukman7847fca2005-04-22 17:54:37 +00001037 .addImm(-CN->getValue());
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001038 } else {
1039 Tmp1 = SelectExpr(N.getOperand(1));
1040 // Subtract size from stack pointer, thereby allocating some space.
1041 BuildMI(BB, IA64::SUB, 2, IA64::r12).addReg(IA64::r12).addReg(Tmp1);
1042 }
1043 } else {
1044 Tmp1 = SelectExpr(N.getOperand(1));
1045 // Subtract size from stack pointer, thereby allocating some space.
1046 BuildMI(BB, IA64::SUB, 2, IA64::r12).addReg(IA64::r12).addReg(Tmp1);
1047 }
Duraid Madinabeeaab22005-03-31 12:31:11 +00001048*/
1049 Select(N.getOperand(0));
1050 Tmp1 = SelectExpr(N.getOperand(1));
1051 // Subtract size from stack pointer, thereby allocating some space.
1052 BuildMI(BB, IA64::SUB, 2, IA64::r12).addReg(IA64::r12).addReg(Tmp1);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001053 // Put a pointer to the space into the result register, by copying the
1054 // stack pointer.
1055 BuildMI(BB, IA64::MOV, 1, Result).addReg(IA64::r12);
1056 return Result;
1057 }
Misha Brukman4633f1c2005-04-21 23:13:11 +00001058
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001059 case ISD::SELECT: {
1060 Tmp1 = SelectExpr(N.getOperand(0)); //Cond
1061 Tmp2 = SelectExpr(N.getOperand(1)); //Use if TRUE
1062 Tmp3 = SelectExpr(N.getOperand(2)); //Use if FALSE
1063
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001064 unsigned bogoResult;
Misha Brukman4633f1c2005-04-21 23:13:11 +00001065
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001066 switch (N.getOperand(1).getValueType()) {
Misha Brukman7847fca2005-04-22 17:54:37 +00001067 default: assert(0 &&
Duraid Madina4bd708d2005-05-02 06:41:13 +00001068 "ISD::SELECT: 'select'ing something other than i1, i64 or f64!\n");
1069 // for i1, we load the condition into an integer register, then
1070 // conditionally copy Tmp2 and Tmp3 to Tmp1 in parallel (only one
1071 // of them will go through, since the integer register will hold
1072 // either 0 or 1)
1073 case MVT::i1: {
1074 bogoResult=MakeReg(MVT::i1);
1075
1076 // load the condition into an integer register
1077 unsigned condReg=MakeReg(MVT::i64);
1078 unsigned dummy=MakeReg(MVT::i64);
1079 BuildMI(BB, IA64::MOV, 1, dummy).addReg(IA64::r0);
1080 BuildMI(BB, IA64::TPCADDIMM22, 2, condReg).addReg(dummy)
1081 .addImm(1).addReg(Tmp1);
1082
1083 // initialize Result (bool) to false (hence UNC) and if
1084 // the select condition (condReg) is false (0), copy Tmp3
1085 BuildMI(BB, IA64::PCMPEQUNC, 3, bogoResult)
1086 .addReg(condReg).addReg(IA64::r0).addReg(Tmp3);
1087
1088 // now, if the selection condition is true, write 1 to the
1089 // result if Tmp2 is 1
1090 BuildMI(BB, IA64::TPCMPNE, 3, Result).addReg(bogoResult)
1091 .addReg(condReg).addReg(IA64::r0).addReg(Tmp2);
1092 break;
1093 }
1094 // for i64/f64, we just copy Tmp3 and then conditionally overwrite it
1095 // with Tmp2 if Tmp1 is true
Misha Brukman7847fca2005-04-22 17:54:37 +00001096 case MVT::i64:
1097 bogoResult=MakeReg(MVT::i64);
Duraid Madina4bd708d2005-05-02 06:41:13 +00001098 BuildMI(BB, IA64::MOV, 1, bogoResult).addReg(Tmp3);
1099 BuildMI(BB, IA64::CMOV, 2, Result).addReg(bogoResult).addReg(Tmp2)
1100 .addReg(Tmp1);
Misha Brukman7847fca2005-04-22 17:54:37 +00001101 break;
1102 case MVT::f64:
1103 bogoResult=MakeReg(MVT::f64);
Duraid Madina4bd708d2005-05-02 06:41:13 +00001104 BuildMI(BB, IA64::FMOV, 1, bogoResult).addReg(Tmp3);
1105 BuildMI(BB, IA64::CFMOV, 2, Result).addReg(bogoResult).addReg(Tmp2)
1106 .addReg(Tmp1);
Misha Brukman7847fca2005-04-22 17:54:37 +00001107 break;
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001108 }
Duraid Madina4bd708d2005-05-02 06:41:13 +00001109
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001110 return Result;
1111 }
Misha Brukman4633f1c2005-04-21 23:13:11 +00001112
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001113 case ISD::Constant: {
1114 unsigned depositPos=0;
1115 unsigned depositLen=0;
1116 switch (N.getValueType()) {
1117 default: assert(0 && "Cannot use constants of this type!");
1118 case MVT::i1: { // if a bool, we don't 'load' so much as generate
Misha Brukman7847fca2005-04-22 17:54:37 +00001119 // the constant:
1120 if(cast<ConstantSDNode>(N)->getValue()) // true:
1121 BuildMI(BB, IA64::CMPEQ, 2, Result).addReg(IA64::r0).addReg(IA64::r0);
1122 else // false:
1123 BuildMI(BB, IA64::CMPNE, 2, Result).addReg(IA64::r0).addReg(IA64::r0);
1124 return Result; // early exit
1125 }
Duraid Madina5ef2ec92005-04-11 05:55:56 +00001126 case MVT::i64: break;
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001127 }
Misha Brukman4633f1c2005-04-21 23:13:11 +00001128
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001129 int64_t immediate = cast<ConstantSDNode>(N)->getValue();
Duraid Madina5ef2ec92005-04-11 05:55:56 +00001130
1131 if(immediate==0) { // if the constant is just zero,
1132 BuildMI(BB, IA64::MOV, 1, Result).addReg(IA64::r0); // just copy r0
1133 return Result; // early exit
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001134 }
1135
Duraid Madina5ef2ec92005-04-11 05:55:56 +00001136 if (immediate <= 8191 && immediate >= -8192) {
1137 // if this constants fits in 14 bits, we use a mov the assembler will
1138 // turn into: "adds rDest=imm,r0" (and _not_ "andl"...)
1139 BuildMI(BB, IA64::MOVSIMM14, 1, Result).addSImm(immediate);
1140 return Result; // early exit
Misha Brukman4633f1c2005-04-21 23:13:11 +00001141 }
Duraid Madina5ef2ec92005-04-11 05:55:56 +00001142
1143 if (immediate <= 2097151 && immediate >= -2097152) {
1144 // if this constants fits in 22 bits, we use a mov the assembler will
1145 // turn into: "addl rDest=imm,r0"
1146 BuildMI(BB, IA64::MOVSIMM22, 1, Result).addSImm(immediate);
1147 return Result; // early exit
Misha Brukman4633f1c2005-04-21 23:13:11 +00001148 }
Duraid Madina5ef2ec92005-04-11 05:55:56 +00001149
1150 /* otherwise, our immediate is big, so we use movl */
1151 uint64_t Imm = immediate;
Duraid Madina21478e52005-04-11 07:16:39 +00001152 BuildMI(BB, IA64::MOVLIMM64, 1, Result).addImm64(Imm);
Duraid Madina5ef2ec92005-04-11 05:55:56 +00001153 return Result;
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001154 }
Duraid Madina75c9fcb2005-04-02 10:33:53 +00001155
1156 case ISD::UNDEF: {
1157 BuildMI(BB, IA64::IDEF, 0, Result);
1158 return Result;
1159 }
Misha Brukman4633f1c2005-04-21 23:13:11 +00001160
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001161 case ISD::GlobalAddress: {
1162 GlobalValue *GV = cast<GlobalAddressSDNode>(N)->getGlobal();
1163 unsigned Tmp1 = MakeReg(MVT::i64);
Duraid Madinabeeaab22005-03-31 12:31:11 +00001164
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001165 BuildMI(BB, IA64::ADD, 2, Tmp1).addGlobalAddress(GV).addReg(IA64::r1);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001166 BuildMI(BB, IA64::LD8, 1, Result).addReg(Tmp1);
Duraid Madinabeeaab22005-03-31 12:31:11 +00001167
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001168 return Result;
1169 }
Misha Brukman4633f1c2005-04-21 23:13:11 +00001170
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001171 case ISD::ExternalSymbol: {
1172 const char *Sym = cast<ExternalSymbolSDNode>(N)->getSymbol();
Duraid Madinabeeaab22005-03-31 12:31:11 +00001173// assert(0 && "sorry, but what did you want an ExternalSymbol for again?");
1174 BuildMI(BB, IA64::MOV, 1, Result).addExternalSymbol(Sym); // XXX
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001175 return Result;
1176 }
1177
1178 case ISD::FP_EXTEND: {
1179 Tmp1 = SelectExpr(N.getOperand(0));
1180 BuildMI(BB, IA64::FMOV, 1, Result).addReg(Tmp1);
1181 return Result;
1182 }
1183
1184 case ISD::ZERO_EXTEND: {
1185 Tmp1 = SelectExpr(N.getOperand(0)); // value
Misha Brukman4633f1c2005-04-21 23:13:11 +00001186
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001187 switch (N.getOperand(0).getValueType()) {
1188 default: assert(0 && "Cannot zero-extend this type!");
1189 case MVT::i8: Opc = IA64::ZXT1; break;
1190 case MVT::i16: Opc = IA64::ZXT2; break;
1191 case MVT::i32: Opc = IA64::ZXT4; break;
1192
Misha Brukman4633f1c2005-04-21 23:13:11 +00001193 // we handle bools differently! :
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001194 case MVT::i1: { // if the predicate reg has 1, we want a '1' in our GR.
Misha Brukman7847fca2005-04-22 17:54:37 +00001195 unsigned dummy = MakeReg(MVT::i64);
1196 // first load zero:
1197 BuildMI(BB, IA64::MOV, 1, dummy).addReg(IA64::r0);
1198 // ...then conditionally (PR:Tmp1) add 1:
1199 BuildMI(BB, IA64::TPCADDIMM22, 2, Result).addReg(dummy)
1200 .addImm(1).addReg(Tmp1);
1201 return Result; // XXX early exit!
1202 }
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001203 }
1204
1205 BuildMI(BB, Opc, 1, Result).addReg(Tmp1);
1206 return Result;
1207 }
1208
1209 case ISD::SIGN_EXTEND: { // we should only have to handle i1 -> i64 here!!!
1210
1211assert(0 && "hmm, ISD::SIGN_EXTEND: shouldn't ever be reached. bad luck!\n");
1212
1213 Tmp1 = SelectExpr(N.getOperand(0)); // value
Misha Brukman4633f1c2005-04-21 23:13:11 +00001214
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001215 switch (N.getOperand(0).getValueType()) {
1216 default: assert(0 && "Cannot sign-extend this type!");
1217 case MVT::i1: assert(0 && "trying to sign extend a bool? ow.\n");
Misha Brukman7847fca2005-04-22 17:54:37 +00001218 Opc = IA64::SXT1; break;
1219 // FIXME: for now, we treat bools the same as i8s
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001220 case MVT::i8: Opc = IA64::SXT1; break;
1221 case MVT::i16: Opc = IA64::SXT2; break;
1222 case MVT::i32: Opc = IA64::SXT4; break;
1223 }
1224
1225 BuildMI(BB, Opc, 1, Result).addReg(Tmp1);
1226 return Result;
1227 }
1228
1229 case ISD::TRUNCATE: {
1230 // we use the funky dep.z (deposit (zero)) instruction to deposit bits
1231 // of R0 appropriately.
1232 switch (N.getOperand(0).getValueType()) {
1233 default: assert(0 && "Unknown truncate!");
1234 case MVT::i64: break;
1235 }
1236 Tmp1 = SelectExpr(N.getOperand(0));
1237 unsigned depositPos, depositLen;
1238
1239 switch (N.getValueType()) {
1240 default: assert(0 && "Unknown truncate!");
1241 case MVT::i1: {
1242 // if input (normal reg) is 0, 0!=0 -> false (0), if 1, 1!=0 ->true (1):
Misha Brukman7847fca2005-04-22 17:54:37 +00001243 BuildMI(BB, IA64::CMPNE, 2, Result).addReg(Tmp1)
1244 .addReg(IA64::r0);
1245 return Result; // XXX early exit!
1246 }
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001247 case MVT::i8: depositPos=0; depositLen=8; break;
1248 case MVT::i16: depositPos=0; depositLen=16; break;
1249 case MVT::i32: depositPos=0; depositLen=32; break;
1250 }
1251 BuildMI(BB, IA64::DEPZ, 1, Result).addReg(Tmp1)
1252 .addImm(depositPos).addImm(depositLen);
1253 return Result;
1254 }
1255
Misha Brukman7847fca2005-04-22 17:54:37 +00001256/*
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001257 case ISD::FP_ROUND: {
1258 assert (DestType == MVT::f32 && N.getOperand(0).getValueType() == MVT::f64 &&
Misha Brukman7847fca2005-04-22 17:54:37 +00001259 "error: trying to FP_ROUND something other than f64 -> f32!\n");
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001260 Tmp1 = SelectExpr(N.getOperand(0));
1261 BuildMI(BB, IA64::FADDS, 2, Result).addReg(Tmp1).addReg(IA64::F0);
1262 // we add 0.0 using a single precision add to do rounding
1263 return Result;
1264 }
1265*/
1266
1267// FIXME: the following 4 cases need cleaning
1268 case ISD::SINT_TO_FP: {
1269 Tmp1 = SelectExpr(N.getOperand(0));
1270 Tmp2 = MakeReg(MVT::f64);
1271 unsigned dummy = MakeReg(MVT::f64);
1272 BuildMI(BB, IA64::SETFSIG, 1, Tmp2).addReg(Tmp1);
1273 BuildMI(BB, IA64::FCVTXF, 1, dummy).addReg(Tmp2);
1274 BuildMI(BB, IA64::FNORMD, 1, Result).addReg(dummy);
1275 return Result;
1276 }
1277
1278 case ISD::UINT_TO_FP: {
1279 Tmp1 = SelectExpr(N.getOperand(0));
1280 Tmp2 = MakeReg(MVT::f64);
1281 unsigned dummy = MakeReg(MVT::f64);
1282 BuildMI(BB, IA64::SETFSIG, 1, Tmp2).addReg(Tmp1);
1283 BuildMI(BB, IA64::FCVTXUF, 1, dummy).addReg(Tmp2);
1284 BuildMI(BB, IA64::FNORMD, 1, Result).addReg(dummy);
1285 return Result;
1286 }
1287
1288 case ISD::FP_TO_SINT: {
1289 Tmp1 = SelectExpr(N.getOperand(0));
1290 Tmp2 = MakeReg(MVT::f64);
1291 BuildMI(BB, IA64::FCVTFXTRUNC, 1, Tmp2).addReg(Tmp1);
1292 BuildMI(BB, IA64::GETFSIG, 1, Result).addReg(Tmp2);
1293 return Result;
1294 }
1295
1296 case ISD::FP_TO_UINT: {
1297 Tmp1 = SelectExpr(N.getOperand(0));
1298 Tmp2 = MakeReg(MVT::f64);
1299 BuildMI(BB, IA64::FCVTFXUTRUNC, 1, Tmp2).addReg(Tmp1);
1300 BuildMI(BB, IA64::GETFSIG, 1, Result).addReg(Tmp2);
1301 return Result;
1302 }
1303
1304 case ISD::ADD: {
Duraid Madina4826a072005-04-06 09:55:17 +00001305 if(DestType == MVT::f64 && N.getOperand(0).getOpcode() == ISD::MUL &&
1306 N.getOperand(0).Val->hasOneUse()) { // if we can fold this add
1307 // into an fma, do so:
1308 // ++FusedFP; // Statistic
1309 Tmp1 = SelectExpr(N.getOperand(0).getOperand(0));
1310 Tmp2 = SelectExpr(N.getOperand(0).getOperand(1));
1311 Tmp3 = SelectExpr(N.getOperand(1));
1312 BuildMI(BB, IA64::FMA, 3, Result).addReg(Tmp1).addReg(Tmp2).addReg(Tmp3);
1313 return Result; // early exit
1314 }
Duraid Madinaed095022005-04-13 06:12:04 +00001315
1316 if(DestType != MVT::f64 && N.getOperand(0).getOpcode() == ISD::SHL &&
Misha Brukman7847fca2005-04-22 17:54:37 +00001317 N.getOperand(0).Val->hasOneUse()) { // if we might be able to fold
Duraid Madinaed095022005-04-13 06:12:04 +00001318 // this add into a shladd, try:
1319 ConstantSDNode *CSD = NULL;
1320 if((CSD = dyn_cast<ConstantSDNode>(N.getOperand(0).getOperand(1))) &&
Misha Brukman7847fca2005-04-22 17:54:37 +00001321 (CSD->getValue() >= 1) && (CSD->getValue() <= 4) ) { // we can:
Duraid Madinaed095022005-04-13 06:12:04 +00001322
Misha Brukman7847fca2005-04-22 17:54:37 +00001323 // ++FusedSHLADD; // Statistic
1324 Tmp1 = SelectExpr(N.getOperand(0).getOperand(0));
1325 int shl_amt = CSD->getValue();
1326 Tmp3 = SelectExpr(N.getOperand(1));
1327
1328 BuildMI(BB, IA64::SHLADD, 3, Result)
1329 .addReg(Tmp1).addImm(shl_amt).addReg(Tmp3);
1330 return Result; // early exit
Duraid Madinaed095022005-04-13 06:12:04 +00001331 }
1332 }
1333
1334 //else, fallthrough:
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001335 Tmp1 = SelectExpr(N.getOperand(0));
Duraid Madinaf55e4032005-04-07 12:33:38 +00001336 if(DestType != MVT::f64) { // integer addition:
1337 switch (ponderIntegerAdditionWith(N.getOperand(1), Tmp3)) {
Misha Brukman7847fca2005-04-22 17:54:37 +00001338 case 1: // adding a constant that's 14 bits
1339 BuildMI(BB, IA64::ADDIMM14, 2, Result).addReg(Tmp1).addSImm(Tmp3);
1340 return Result; // early exit
1341 } // fallthrough and emit a reg+reg ADD:
1342 Tmp2 = SelectExpr(N.getOperand(1));
1343 BuildMI(BB, IA64::ADD, 2, Result).addReg(Tmp1).addReg(Tmp2);
Duraid Madinaf55e4032005-04-07 12:33:38 +00001344 } else { // this is a floating point addition
Duraid Madina5ef2ec92005-04-11 05:55:56 +00001345 Tmp2 = SelectExpr(N.getOperand(1));
Duraid Madinaf55e4032005-04-07 12:33:38 +00001346 BuildMI(BB, IA64::FADD, 2, Result).addReg(Tmp1).addReg(Tmp2);
1347 }
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001348 return Result;
1349 }
1350
1351 case ISD::MUL: {
Duraid Madina4826a072005-04-06 09:55:17 +00001352
1353 if(DestType != MVT::f64) { // TODO: speed!
Duraid Madinab2322562005-04-26 07:23:02 +00001354 if(N.getOperand(1).getOpcode() != ISD::Constant) { // if not a const mul
1355 // boring old integer multiply with xma
1356 Tmp1 = SelectExpr(N.getOperand(0));
1357 Tmp2 = SelectExpr(N.getOperand(1));
1358
1359 unsigned TempFR1=MakeReg(MVT::f64);
1360 unsigned TempFR2=MakeReg(MVT::f64);
1361 unsigned TempFR3=MakeReg(MVT::f64);
1362 BuildMI(BB, IA64::SETFSIG, 1, TempFR1).addReg(Tmp1);
1363 BuildMI(BB, IA64::SETFSIG, 1, TempFR2).addReg(Tmp2);
1364 BuildMI(BB, IA64::XMAL, 1, TempFR3).addReg(TempFR1).addReg(TempFR2)
1365 .addReg(IA64::F0);
1366 BuildMI(BB, IA64::GETFSIG, 1, Result).addReg(TempFR3);
1367 return Result; // early exit
1368 } else { // we are multiplying by an integer constant! yay
1369 return Reg = SelectExpr(BuildConstmulSequence(N)); // avert your eyes!
1370 }
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001371 }
Duraid Madinab2322562005-04-26 07:23:02 +00001372 else { // floating point multiply
1373 Tmp1 = SelectExpr(N.getOperand(0));
1374 Tmp2 = SelectExpr(N.getOperand(1));
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001375 BuildMI(BB, IA64::FMPY, 2, Result).addReg(Tmp1).addReg(Tmp2);
Duraid Madinab2322562005-04-26 07:23:02 +00001376 return Result;
1377 }
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001378 }
Misha Brukman4633f1c2005-04-21 23:13:11 +00001379
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001380 case ISD::SUB: {
Duraid Madina4826a072005-04-06 09:55:17 +00001381 if(DestType == MVT::f64 && N.getOperand(0).getOpcode() == ISD::MUL &&
1382 N.getOperand(0).Val->hasOneUse()) { // if we can fold this sub
1383 // into an fms, do so:
1384 // ++FusedFP; // Statistic
1385 Tmp1 = SelectExpr(N.getOperand(0).getOperand(0));
1386 Tmp2 = SelectExpr(N.getOperand(0).getOperand(1));
1387 Tmp3 = SelectExpr(N.getOperand(1));
1388 BuildMI(BB, IA64::FMS, 3, Result).addReg(Tmp1).addReg(Tmp2).addReg(Tmp3);
1389 return Result; // early exit
1390 }
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001391 Tmp2 = SelectExpr(N.getOperand(1));
Duraid Madinaf55e4032005-04-07 12:33:38 +00001392 if(DestType != MVT::f64) { // integer subtraction:
1393 switch (ponderIntegerSubtractionFrom(N.getOperand(0), Tmp3)) {
Misha Brukman7847fca2005-04-22 17:54:37 +00001394 case 1: // subtracting *from* an 8 bit constant:
1395 BuildMI(BB, IA64::SUBIMM8, 2, Result).addSImm(Tmp3).addReg(Tmp2);
1396 return Result; // early exit
1397 } // fallthrough and emit a reg+reg SUB:
1398 Tmp1 = SelectExpr(N.getOperand(0));
1399 BuildMI(BB, IA64::SUB, 2, Result).addReg(Tmp1).addReg(Tmp2);
Duraid Madinaf55e4032005-04-07 12:33:38 +00001400 } else { // this is a floating point subtraction
Duraid Madina5ef2ec92005-04-11 05:55:56 +00001401 Tmp1 = SelectExpr(N.getOperand(0));
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001402 BuildMI(BB, IA64::FSUB, 2, Result).addReg(Tmp1).addReg(Tmp2);
Duraid Madinaf55e4032005-04-07 12:33:38 +00001403 }
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001404 return Result;
1405 }
Duraid Madinaa7ee8b82005-04-02 05:18:38 +00001406
1407 case ISD::FABS: {
1408 Tmp1 = SelectExpr(N.getOperand(0));
1409 assert(DestType == MVT::f64 && "trying to fabs something other than f64?");
1410 BuildMI(BB, IA64::FABS, 1, Result).addReg(Tmp1);
1411 return Result;
1412 }
Misha Brukman4633f1c2005-04-21 23:13:11 +00001413
Duraid Madinaa7ee8b82005-04-02 05:18:38 +00001414 case ISD::FNEG: {
Duraid Madinaa7ee8b82005-04-02 05:18:38 +00001415 assert(DestType == MVT::f64 && "trying to fneg something other than f64?");
Duraid Madina75c9fcb2005-04-02 10:33:53 +00001416
Misha Brukman4633f1c2005-04-21 23:13:11 +00001417 if (ISD::FABS == N.getOperand(0).getOpcode()) { // && hasOneUse()?
Duraid Madina75c9fcb2005-04-02 10:33:53 +00001418 Tmp1 = SelectExpr(N.getOperand(0).getOperand(0));
1419 BuildMI(BB, IA64::FNEGABS, 1, Result).addReg(Tmp1); // fold in abs
1420 } else {
1421 Tmp1 = SelectExpr(N.getOperand(0));
1422 BuildMI(BB, IA64::FNEG, 1, Result).addReg(Tmp1); // plain old fneg
1423 }
1424
Duraid Madinaa7ee8b82005-04-02 05:18:38 +00001425 return Result;
1426 }
Misha Brukman7847fca2005-04-22 17:54:37 +00001427
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001428 case ISD::AND: {
1429 switch (N.getValueType()) {
1430 default: assert(0 && "Cannot AND this type!");
1431 case MVT::i1: { // if a bool, we emit a pseudocode AND
1432 unsigned pA = SelectExpr(N.getOperand(0));
1433 unsigned pB = SelectExpr(N.getOperand(1));
Misha Brukman4633f1c2005-04-21 23:13:11 +00001434
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001435/* our pseudocode for AND is:
1436 *
1437(pA) cmp.eq.unc pC,p0 = r0,r0 // pC = pA
1438 cmp.eq pTemp,p0 = r0,r0 // pTemp = NOT pB
1439 ;;
1440(pB) cmp.ne pTemp,p0 = r0,r0
1441 ;;
1442(pTemp)cmp.ne pC,p0 = r0,r0 // if (NOT pB) pC = 0
1443
1444*/
1445 unsigned pTemp = MakeReg(MVT::i1);
Misha Brukman4633f1c2005-04-21 23:13:11 +00001446
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001447 unsigned bogusTemp1 = MakeReg(MVT::i1);
1448 unsigned bogusTemp2 = MakeReg(MVT::i1);
1449 unsigned bogusTemp3 = MakeReg(MVT::i1);
1450 unsigned bogusTemp4 = MakeReg(MVT::i1);
Misha Brukman4633f1c2005-04-21 23:13:11 +00001451
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001452 BuildMI(BB, IA64::PCMPEQUNC, 3, bogusTemp1)
Misha Brukman7847fca2005-04-22 17:54:37 +00001453 .addReg(IA64::r0).addReg(IA64::r0).addReg(pA);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001454 BuildMI(BB, IA64::CMPEQ, 2, bogusTemp2)
Misha Brukman7847fca2005-04-22 17:54:37 +00001455 .addReg(IA64::r0).addReg(IA64::r0);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001456 BuildMI(BB, IA64::TPCMPNE, 3, pTemp)
Misha Brukman7847fca2005-04-22 17:54:37 +00001457 .addReg(bogusTemp2).addReg(IA64::r0).addReg(IA64::r0).addReg(pB);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001458 BuildMI(BB, IA64::TPCMPNE, 3, Result)
Misha Brukman7847fca2005-04-22 17:54:37 +00001459 .addReg(bogusTemp1).addReg(IA64::r0).addReg(IA64::r0).addReg(pTemp);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001460 break;
1461 }
Misha Brukman4633f1c2005-04-21 23:13:11 +00001462
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001463 // if not a bool, we just AND away:
1464 case MVT::i8:
1465 case MVT::i16:
1466 case MVT::i32:
1467 case MVT::i64: {
1468 Tmp1 = SelectExpr(N.getOperand(0));
Duraid Madinac02780e2005-04-13 04:50:54 +00001469 switch (ponderIntegerAndWith(N.getOperand(1), Tmp3)) {
1470 case 1: // ANDing a constant that is 2^n-1 for some n
Misha Brukman7847fca2005-04-22 17:54:37 +00001471 switch (Tmp3) {
1472 case 8: // if AND 0x00000000000000FF, be quaint and use zxt1
1473 BuildMI(BB, IA64::ZXT1, 1, Result).addReg(Tmp1);
1474 break;
1475 case 16: // if AND 0x000000000000FFFF, be quaint and use zxt2
1476 BuildMI(BB, IA64::ZXT2, 1, Result).addReg(Tmp1);
1477 break;
1478 case 32: // if AND 0x00000000FFFFFFFF, be quaint and use zxt4
1479 BuildMI(BB, IA64::ZXT4, 1, Result).addReg(Tmp1);
1480 break;
1481 default: // otherwise, use dep.z to paste zeros
1482 BuildMI(BB, IA64::DEPZ, 3, Result).addReg(Tmp1)
1483 .addImm(0).addImm(Tmp3);
1484 break;
1485 }
1486 return Result; // early exit
Duraid Madinac02780e2005-04-13 04:50:54 +00001487 } // fallthrough and emit a simple AND:
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001488 Tmp2 = SelectExpr(N.getOperand(1));
1489 BuildMI(BB, IA64::AND, 2, Result).addReg(Tmp1).addReg(Tmp2);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001490 }
1491 }
1492 return Result;
1493 }
Misha Brukman4633f1c2005-04-21 23:13:11 +00001494
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001495 case ISD::OR: {
1496 switch (N.getValueType()) {
1497 default: assert(0 && "Cannot OR this type!");
1498 case MVT::i1: { // if a bool, we emit a pseudocode OR
1499 unsigned pA = SelectExpr(N.getOperand(0));
1500 unsigned pB = SelectExpr(N.getOperand(1));
1501
1502 unsigned pTemp1 = MakeReg(MVT::i1);
Misha Brukman4633f1c2005-04-21 23:13:11 +00001503
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001504/* our pseudocode for OR is:
1505 *
1506
1507pC = pA OR pB
1508-------------
1509
Misha Brukman7847fca2005-04-22 17:54:37 +00001510(pA) cmp.eq.unc pC,p0 = r0,r0 // pC = pA
1511 ;;
1512(pB) cmp.eq pC,p0 = r0,r0 // if (pB) pC = 1
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001513
1514*/
1515 BuildMI(BB, IA64::PCMPEQUNC, 3, pTemp1)
Misha Brukman7847fca2005-04-22 17:54:37 +00001516 .addReg(IA64::r0).addReg(IA64::r0).addReg(pA);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001517 BuildMI(BB, IA64::TPCMPEQ, 3, Result)
Misha Brukman7847fca2005-04-22 17:54:37 +00001518 .addReg(pTemp1).addReg(IA64::r0).addReg(IA64::r0).addReg(pB);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001519 break;
1520 }
1521 // if not a bool, we just OR away:
1522 case MVT::i8:
1523 case MVT::i16:
1524 case MVT::i32:
1525 case MVT::i64: {
1526 Tmp1 = SelectExpr(N.getOperand(0));
1527 Tmp2 = SelectExpr(N.getOperand(1));
1528 BuildMI(BB, IA64::OR, 2, Result).addReg(Tmp1).addReg(Tmp2);
1529 break;
1530 }
1531 }
1532 return Result;
1533 }
Misha Brukman7847fca2005-04-22 17:54:37 +00001534
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001535 case ISD::XOR: {
1536 switch (N.getValueType()) {
1537 default: assert(0 && "Cannot XOR this type!");
1538 case MVT::i1: { // if a bool, we emit a pseudocode XOR
1539 unsigned pY = SelectExpr(N.getOperand(0));
1540 unsigned pZ = SelectExpr(N.getOperand(1));
1541
1542/* one possible routine for XOR is:
1543
1544 // Compute px = py ^ pz
1545 // using sum of products: px = (py & !pz) | (pz & !py)
1546 // Uses 5 instructions in 3 cycles.
1547 // cycle 1
1548(pz) cmp.eq.unc px = r0, r0 // px = pz
1549(py) cmp.eq.unc pt = r0, r0 // pt = py
1550 ;;
1551 // cycle 2
1552(pt) cmp.ne.and px = r0, r0 // px = px & !pt (px = pz & !pt)
1553(pz) cmp.ne.and pt = r0, r0 // pt = pt & !pz
1554 ;;
1555 } { .mmi
1556 // cycle 3
1557(pt) cmp.eq.or px = r0, r0 // px = px | pt
1558
1559*** Another, which we use here, requires one scratch GR. it is:
1560
1561 mov rt = 0 // initialize rt off critical path
1562 ;;
1563
1564 // cycle 1
1565(pz) cmp.eq.unc px = r0, r0 // px = pz
1566(pz) mov rt = 1 // rt = pz
1567 ;;
1568 // cycle 2
1569(py) cmp.ne px = 1, rt // if (py) px = !pz
1570
1571.. these routines kindly provided by Jim Hull
1572*/
1573 unsigned rt = MakeReg(MVT::i64);
1574
1575 // these two temporaries will never actually appear,
1576 // due to the two-address form of some of the instructions below
1577 unsigned bogoPR = MakeReg(MVT::i1); // becomes Result
1578 unsigned bogoGR = MakeReg(MVT::i64); // becomes rt
1579
1580 BuildMI(BB, IA64::MOV, 1, bogoGR).addReg(IA64::r0);
1581 BuildMI(BB, IA64::PCMPEQUNC, 3, bogoPR)
Misha Brukman7847fca2005-04-22 17:54:37 +00001582 .addReg(IA64::r0).addReg(IA64::r0).addReg(pZ);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001583 BuildMI(BB, IA64::TPCADDIMM22, 2, rt)
Misha Brukman7847fca2005-04-22 17:54:37 +00001584 .addReg(bogoGR).addImm(1).addReg(pZ);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001585 BuildMI(BB, IA64::TPCMPIMM8NE, 3, Result)
Misha Brukman7847fca2005-04-22 17:54:37 +00001586 .addReg(bogoPR).addImm(1).addReg(rt).addReg(pY);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001587 break;
1588 }
1589 // if not a bool, we just XOR away:
1590 case MVT::i8:
1591 case MVT::i16:
1592 case MVT::i32:
1593 case MVT::i64: {
1594 Tmp1 = SelectExpr(N.getOperand(0));
1595 Tmp2 = SelectExpr(N.getOperand(1));
1596 BuildMI(BB, IA64::XOR, 2, Result).addReg(Tmp1).addReg(Tmp2);
1597 break;
1598 }
1599 }
1600 return Result;
1601 }
1602
Duraid Madina63bbed52005-05-11 05:16:09 +00001603 case ISD::CTPOP: {
1604 Tmp1 = SelectExpr(N.getOperand(0));
1605 BuildMI(BB, IA64::POPCNT, 1, Result).addReg(Tmp1);
1606 return Result;
1607 }
1608
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001609 case ISD::SHL: {
1610 Tmp1 = SelectExpr(N.getOperand(0));
Duraid Madinaf55e4032005-04-07 12:33:38 +00001611 if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(N.getOperand(1))) {
1612 Tmp2 = CN->getValue();
1613 BuildMI(BB, IA64::SHLI, 2, Result).addReg(Tmp1).addImm(Tmp2);
1614 } else {
1615 Tmp2 = SelectExpr(N.getOperand(1));
1616 BuildMI(BB, IA64::SHL, 2, Result).addReg(Tmp1).addReg(Tmp2);
1617 }
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001618 return Result;
1619 }
Misha Brukman7847fca2005-04-22 17:54:37 +00001620
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001621 case ISD::SRL: {
1622 Tmp1 = SelectExpr(N.getOperand(0));
Duraid Madinaf55e4032005-04-07 12:33:38 +00001623 if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(N.getOperand(1))) {
1624 Tmp2 = CN->getValue();
1625 BuildMI(BB, IA64::SHRUI, 2, Result).addReg(Tmp1).addImm(Tmp2);
1626 } else {
1627 Tmp2 = SelectExpr(N.getOperand(1));
1628 BuildMI(BB, IA64::SHRU, 2, Result).addReg(Tmp1).addReg(Tmp2);
1629 }
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001630 return Result;
1631 }
Misha Brukman7847fca2005-04-22 17:54:37 +00001632
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001633 case ISD::SRA: {
1634 Tmp1 = SelectExpr(N.getOperand(0));
Duraid Madinaf55e4032005-04-07 12:33:38 +00001635 if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(N.getOperand(1))) {
1636 Tmp2 = CN->getValue();
1637 BuildMI(BB, IA64::SHRSI, 2, Result).addReg(Tmp1).addImm(Tmp2);
1638 } else {
1639 Tmp2 = SelectExpr(N.getOperand(1));
1640 BuildMI(BB, IA64::SHRS, 2, Result).addReg(Tmp1).addReg(Tmp2);
1641 }
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001642 return Result;
1643 }
1644
1645 case ISD::SDIV:
1646 case ISD::UDIV:
1647 case ISD::SREM:
1648 case ISD::UREM: {
1649
1650 Tmp1 = SelectExpr(N.getOperand(0));
1651 Tmp2 = SelectExpr(N.getOperand(1));
1652
1653 bool isFP=false;
1654
1655 if(DestType == MVT::f64) // XXX: we're not gonna be fed MVT::f32, are we?
1656 isFP=true;
1657
1658 bool isModulus=false; // is it a division or a modulus?
1659 bool isSigned=false;
1660
1661 switch(N.getOpcode()) {
1662 case ISD::SDIV: isModulus=false; isSigned=true; break;
1663 case ISD::UDIV: isModulus=false; isSigned=false; break;
1664 case ISD::SREM: isModulus=true; isSigned=true; break;
1665 case ISD::UREM: isModulus=true; isSigned=false; break;
1666 }
1667
Duraid Madina4826a072005-04-06 09:55:17 +00001668 if(!isModulus && !isFP) { // if this is an integer divide,
1669 switch (ponderIntegerDivisionBy(N.getOperand(1), isSigned, Tmp3)) {
Misha Brukman7847fca2005-04-22 17:54:37 +00001670 case 1: // division by a constant that's a power of 2
1671 Tmp1 = SelectExpr(N.getOperand(0));
1672 if(isSigned) { // argument could be negative, so emit some code:
1673 unsigned divAmt=Tmp3;
1674 unsigned tempGR1=MakeReg(MVT::i64);
1675 unsigned tempGR2=MakeReg(MVT::i64);
1676 unsigned tempGR3=MakeReg(MVT::i64);
1677 BuildMI(BB, IA64::SHRS, 2, tempGR1)
1678 .addReg(Tmp1).addImm(divAmt-1);
1679 BuildMI(BB, IA64::EXTRU, 3, tempGR2)
1680 .addReg(tempGR1).addImm(64-divAmt).addImm(divAmt);
1681 BuildMI(BB, IA64::ADD, 2, tempGR3)
1682 .addReg(Tmp1).addReg(tempGR2);
1683 BuildMI(BB, IA64::SHRS, 2, Result)
1684 .addReg(tempGR3).addImm(divAmt);
1685 }
1686 else // unsigned div-by-power-of-2 becomes a simple shift right:
1687 BuildMI(BB, IA64::SHRU, 2, Result).addReg(Tmp1).addImm(Tmp3);
1688 return Result; // early exit
Duraid Madina4826a072005-04-06 09:55:17 +00001689 }
1690 }
1691
Misha Brukman4633f1c2005-04-21 23:13:11 +00001692 unsigned TmpPR=MakeReg(MVT::i1); // we need two scratch
Duraid Madinabeeaab22005-03-31 12:31:11 +00001693 unsigned TmpPR2=MakeReg(MVT::i1); // predicate registers,
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001694 unsigned TmpF1=MakeReg(MVT::f64); // and one metric truckload of FP regs.
1695 unsigned TmpF2=MakeReg(MVT::f64); // lucky we have IA64?
1696 unsigned TmpF3=MakeReg(MVT::f64); // well, the real FIXME is to have
1697 unsigned TmpF4=MakeReg(MVT::f64); // isTwoAddress forms of these
1698 unsigned TmpF5=MakeReg(MVT::f64); // FP instructions so we can end up with
1699 unsigned TmpF6=MakeReg(MVT::f64); // stuff like setf.sig f10=f10 etc.
1700 unsigned TmpF7=MakeReg(MVT::f64);
1701 unsigned TmpF8=MakeReg(MVT::f64);
1702 unsigned TmpF9=MakeReg(MVT::f64);
1703 unsigned TmpF10=MakeReg(MVT::f64);
1704 unsigned TmpF11=MakeReg(MVT::f64);
1705 unsigned TmpF12=MakeReg(MVT::f64);
1706 unsigned TmpF13=MakeReg(MVT::f64);
1707 unsigned TmpF14=MakeReg(MVT::f64);
1708 unsigned TmpF15=MakeReg(MVT::f64);
Misha Brukman4633f1c2005-04-21 23:13:11 +00001709
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001710 // OK, emit some code:
1711
1712 if(!isFP) {
1713 // first, load the inputs into FP regs.
1714 BuildMI(BB, IA64::SETFSIG, 1, TmpF1).addReg(Tmp1);
1715 BuildMI(BB, IA64::SETFSIG, 1, TmpF2).addReg(Tmp2);
Misha Brukman4633f1c2005-04-21 23:13:11 +00001716
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001717 // next, convert the inputs to FP
1718 if(isSigned) {
Misha Brukman7847fca2005-04-22 17:54:37 +00001719 BuildMI(BB, IA64::FCVTXF, 1, TmpF3).addReg(TmpF1);
1720 BuildMI(BB, IA64::FCVTXF, 1, TmpF4).addReg(TmpF2);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001721 } else {
Misha Brukman7847fca2005-04-22 17:54:37 +00001722 BuildMI(BB, IA64::FCVTXUFS1, 1, TmpF3).addReg(TmpF1);
1723 BuildMI(BB, IA64::FCVTXUFS1, 1, TmpF4).addReg(TmpF2);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001724 }
Misha Brukman4633f1c2005-04-21 23:13:11 +00001725
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001726 } else { // this is an FP divide/remainder, so we 'leak' some temp
1727 // regs and assign TmpF3=Tmp1, TmpF4=Tmp2
1728 TmpF3=Tmp1;
1729 TmpF4=Tmp2;
1730 }
1731
1732 // we start by computing an approximate reciprocal (good to 9 bits?)
Duraid Madina6dcceb52005-04-08 10:01:48 +00001733 // note, this instruction writes _both_ TmpF5 (answer) and TmpPR (predicate)
1734 BuildMI(BB, IA64::FRCPAS1, 4)
1735 .addReg(TmpF5, MachineOperand::Def)
1736 .addReg(TmpPR, MachineOperand::Def)
1737 .addReg(TmpF3).addReg(TmpF4);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001738
Duraid Madinabeeaab22005-03-31 12:31:11 +00001739 if(!isModulus) { // if this is a divide, we worry about div-by-zero
1740 unsigned bogusPR=MakeReg(MVT::i1); // won't appear, due to twoAddress
1741 // TPCMPNE below
1742 BuildMI(BB, IA64::CMPEQ, 2, bogusPR).addReg(IA64::r0).addReg(IA64::r0);
1743 BuildMI(BB, IA64::TPCMPNE, 3, TmpPR2).addReg(bogusPR)
Misha Brukman7847fca2005-04-22 17:54:37 +00001744 .addReg(IA64::r0).addReg(IA64::r0).addReg(TmpPR);
Duraid Madinabeeaab22005-03-31 12:31:11 +00001745 }
1746
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001747 // now we apply newton's method, thrice! (FIXME: this is ~72 bits of
1748 // precision, don't need this much for f32/i32)
1749 BuildMI(BB, IA64::CFNMAS1, 4, TmpF6)
1750 .addReg(TmpF4).addReg(TmpF5).addReg(IA64::F1).addReg(TmpPR);
1751 BuildMI(BB, IA64::CFMAS1, 4, TmpF7)
1752 .addReg(TmpF3).addReg(TmpF5).addReg(IA64::F0).addReg(TmpPR);
1753 BuildMI(BB, IA64::CFMAS1, 4, TmpF8)
1754 .addReg(TmpF6).addReg(TmpF6).addReg(IA64::F0).addReg(TmpPR);
1755 BuildMI(BB, IA64::CFMAS1, 4, TmpF9)
1756 .addReg(TmpF6).addReg(TmpF7).addReg(TmpF7).addReg(TmpPR);
1757 BuildMI(BB, IA64::CFMAS1, 4,TmpF10)
1758 .addReg(TmpF6).addReg(TmpF5).addReg(TmpF5).addReg(TmpPR);
1759 BuildMI(BB, IA64::CFMAS1, 4,TmpF11)
1760 .addReg(TmpF8).addReg(TmpF9).addReg(TmpF9).addReg(TmpPR);
1761 BuildMI(BB, IA64::CFMAS1, 4,TmpF12)
1762 .addReg(TmpF8).addReg(TmpF10).addReg(TmpF10).addReg(TmpPR);
1763 BuildMI(BB, IA64::CFNMAS1, 4,TmpF13)
1764 .addReg(TmpF4).addReg(TmpF11).addReg(TmpF3).addReg(TmpPR);
Duraid Madina6e02e682005-04-04 05:05:52 +00001765
1766 // FIXME: this is unfortunate :(
1767 // the story is that the dest reg of the fnma above and the fma below
1768 // (and therefore possibly the src of the fcvt.fx[u] as well) cannot
1769 // be the same register, or this code breaks if the first argument is
1770 // zero. (e.g. without this hack, 0%8 yields -64, not 0.)
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001771 BuildMI(BB, IA64::CFMAS1, 4,TmpF14)
1772 .addReg(TmpF13).addReg(TmpF12).addReg(TmpF11).addReg(TmpPR);
1773
Duraid Madina6e02e682005-04-04 05:05:52 +00001774 if(isModulus) { // XXX: fragile! fixes _only_ mod, *breaks* div! !
1775 BuildMI(BB, IA64::IUSE, 1).addReg(TmpF13); // hack :(
1776 }
1777
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001778 if(!isFP) {
1779 // round to an integer
1780 if(isSigned)
Misha Brukman7847fca2005-04-22 17:54:37 +00001781 BuildMI(BB, IA64::FCVTFXTRUNCS1, 1, TmpF15).addReg(TmpF14);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001782 else
Misha Brukman7847fca2005-04-22 17:54:37 +00001783 BuildMI(BB, IA64::FCVTFXUTRUNCS1, 1, TmpF15).addReg(TmpF14);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001784 } else {
1785 BuildMI(BB, IA64::FMOV, 1, TmpF15).addReg(TmpF14);
1786 // EXERCISE: can you see why TmpF15=TmpF14 does not work here, and
1787 // we really do need the above FMOV? ;)
1788 }
1789
1790 if(!isModulus) {
Duraid Madinabeeaab22005-03-31 12:31:11 +00001791 if(isFP) { // extra worrying about div-by-zero
1792 unsigned bogoResult=MakeReg(MVT::f64);
1793
1794 // we do a 'conditional fmov' (of the correct result, depending
1795 // on how the frcpa predicate turned out)
1796 BuildMI(BB, IA64::PFMOV, 2, bogoResult)
Misha Brukman7847fca2005-04-22 17:54:37 +00001797 .addReg(TmpF12).addReg(TmpPR2);
Duraid Madinabeeaab22005-03-31 12:31:11 +00001798 BuildMI(BB, IA64::CFMOV, 2, Result)
Misha Brukman7847fca2005-04-22 17:54:37 +00001799 .addReg(bogoResult).addReg(TmpF15).addReg(TmpPR);
Duraid Madinabeeaab22005-03-31 12:31:11 +00001800 }
Duraid Madina6e02e682005-04-04 05:05:52 +00001801 else {
Misha Brukman7847fca2005-04-22 17:54:37 +00001802 BuildMI(BB, IA64::GETFSIG, 1, Result).addReg(TmpF15);
Duraid Madina6e02e682005-04-04 05:05:52 +00001803 }
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001804 } else { // this is a modulus
1805 if(!isFP) {
Misha Brukman7847fca2005-04-22 17:54:37 +00001806 // answer = q * (-b) + a
1807 unsigned ModulusResult = MakeReg(MVT::f64);
1808 unsigned TmpF = MakeReg(MVT::f64);
1809 unsigned TmpI = MakeReg(MVT::i64);
1810
1811 BuildMI(BB, IA64::SUB, 2, TmpI).addReg(IA64::r0).addReg(Tmp2);
1812 BuildMI(BB, IA64::SETFSIG, 1, TmpF).addReg(TmpI);
1813 BuildMI(BB, IA64::XMAL, 3, ModulusResult)
1814 .addReg(TmpF15).addReg(TmpF).addReg(TmpF1);
1815 BuildMI(BB, IA64::GETFSIG, 1, Result).addReg(ModulusResult);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001816 } else { // FP modulus! The horror... the horror....
Misha Brukman7847fca2005-04-22 17:54:37 +00001817 assert(0 && "sorry, no FP modulus just yet!\n!\n");
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001818 }
1819 }
1820
1821 return Result;
1822 }
1823
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001824 case ISD::SIGN_EXTEND_INREG: {
1825 Tmp1 = SelectExpr(N.getOperand(0));
1826 MVTSDNode* MVN = dyn_cast<MVTSDNode>(Node);
1827 switch(MVN->getExtraValueType())
1828 {
1829 default:
1830 Node->dump();
1831 assert(0 && "don't know how to sign extend this type");
1832 break;
1833 case MVT::i8: Opc = IA64::SXT1; break;
1834 case MVT::i16: Opc = IA64::SXT2; break;
1835 case MVT::i32: Opc = IA64::SXT4; break;
1836 }
1837 BuildMI(BB, Opc, 1, Result).addReg(Tmp1);
1838 return Result;
1839 }
1840
1841 case ISD::SETCC: {
1842 Tmp1 = SelectExpr(N.getOperand(0));
Duraid Madina5ef2ec92005-04-11 05:55:56 +00001843
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001844 if (SetCCSDNode *SetCC = dyn_cast<SetCCSDNode>(Node)) {
1845 if (MVT::isInteger(SetCC->getOperand(0).getValueType())) {
Duraid Madina5ef2ec92005-04-11 05:55:56 +00001846
Misha Brukman7847fca2005-04-22 17:54:37 +00001847 if(ConstantSDNode *CSDN =
1848 dyn_cast<ConstantSDNode>(N.getOperand(1))) {
1849 // if we are comparing against a constant zero
1850 if(CSDN->getValue()==0)
1851 Tmp2 = IA64::r0; // then we can just compare against r0
1852 else
1853 Tmp2 = SelectExpr(N.getOperand(1));
1854 } else // not comparing against a constant
1855 Tmp2 = SelectExpr(N.getOperand(1));
1856
1857 switch (SetCC->getCondition()) {
1858 default: assert(0 && "Unknown integer comparison!");
1859 case ISD::SETEQ:
1860 BuildMI(BB, IA64::CMPEQ, 2, Result).addReg(Tmp1).addReg(Tmp2);
1861 break;
1862 case ISD::SETGT:
1863 BuildMI(BB, IA64::CMPGT, 2, Result).addReg(Tmp1).addReg(Tmp2);
1864 break;
1865 case ISD::SETGE:
1866 BuildMI(BB, IA64::CMPGE, 2, Result).addReg(Tmp1).addReg(Tmp2);
1867 break;
1868 case ISD::SETLT:
1869 BuildMI(BB, IA64::CMPLT, 2, Result).addReg(Tmp1).addReg(Tmp2);
1870 break;
1871 case ISD::SETLE:
1872 BuildMI(BB, IA64::CMPLE, 2, Result).addReg(Tmp1).addReg(Tmp2);
1873 break;
1874 case ISD::SETNE:
1875 BuildMI(BB, IA64::CMPNE, 2, Result).addReg(Tmp1).addReg(Tmp2);
1876 break;
1877 case ISD::SETULT:
1878 BuildMI(BB, IA64::CMPLTU, 2, Result).addReg(Tmp1).addReg(Tmp2);
1879 break;
1880 case ISD::SETUGT:
1881 BuildMI(BB, IA64::CMPGTU, 2, Result).addReg(Tmp1).addReg(Tmp2);
1882 break;
1883 case ISD::SETULE:
1884 BuildMI(BB, IA64::CMPLEU, 2, Result).addReg(Tmp1).addReg(Tmp2);
1885 break;
1886 case ISD::SETUGE:
1887 BuildMI(BB, IA64::CMPGEU, 2, Result).addReg(Tmp1).addReg(Tmp2);
1888 break;
1889 }
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001890 }
1891 else { // if not integer, should be FP. FIXME: what about bools? ;)
Misha Brukman7847fca2005-04-22 17:54:37 +00001892 assert(SetCC->getOperand(0).getValueType() != MVT::f32 &&
1893 "error: SETCC should have had incoming f32 promoted to f64!\n");
Duraid Madina5ef2ec92005-04-11 05:55:56 +00001894
Misha Brukman7847fca2005-04-22 17:54:37 +00001895 if(ConstantFPSDNode *CFPSDN =
1896 dyn_cast<ConstantFPSDNode>(N.getOperand(1))) {
Duraid Madina5ef2ec92005-04-11 05:55:56 +00001897
Misha Brukman7847fca2005-04-22 17:54:37 +00001898 // if we are comparing against a constant +0.0 or +1.0
1899 if(CFPSDN->isExactlyValue(+0.0))
1900 Tmp2 = IA64::F0; // then we can just compare against f0
1901 else if(CFPSDN->isExactlyValue(+1.0))
1902 Tmp2 = IA64::F1; // or f1
1903 else
1904 Tmp2 = SelectExpr(N.getOperand(1));
1905 } else // not comparing against a constant
1906 Tmp2 = SelectExpr(N.getOperand(1));
Duraid Madina5ef2ec92005-04-11 05:55:56 +00001907
Misha Brukman7847fca2005-04-22 17:54:37 +00001908 switch (SetCC->getCondition()) {
1909 default: assert(0 && "Unknown FP comparison!");
1910 case ISD::SETEQ:
1911 BuildMI(BB, IA64::FCMPEQ, 2, Result).addReg(Tmp1).addReg(Tmp2);
1912 break;
1913 case ISD::SETGT:
1914 BuildMI(BB, IA64::FCMPGT, 2, Result).addReg(Tmp1).addReg(Tmp2);
1915 break;
1916 case ISD::SETGE:
1917 BuildMI(BB, IA64::FCMPGE, 2, Result).addReg(Tmp1).addReg(Tmp2);
1918 break;
1919 case ISD::SETLT:
1920 BuildMI(BB, IA64::FCMPLT, 2, Result).addReg(Tmp1).addReg(Tmp2);
1921 break;
1922 case ISD::SETLE:
1923 BuildMI(BB, IA64::FCMPLE, 2, Result).addReg(Tmp1).addReg(Tmp2);
1924 break;
1925 case ISD::SETNE:
1926 BuildMI(BB, IA64::FCMPNE, 2, Result).addReg(Tmp1).addReg(Tmp2);
1927 break;
1928 case ISD::SETULT:
1929 BuildMI(BB, IA64::FCMPLTU, 2, Result).addReg(Tmp1).addReg(Tmp2);
1930 break;
1931 case ISD::SETUGT:
1932 BuildMI(BB, IA64::FCMPGTU, 2, Result).addReg(Tmp1).addReg(Tmp2);
1933 break;
1934 case ISD::SETULE:
1935 BuildMI(BB, IA64::FCMPLEU, 2, Result).addReg(Tmp1).addReg(Tmp2);
1936 break;
1937 case ISD::SETUGE:
1938 BuildMI(BB, IA64::FCMPGEU, 2, Result).addReg(Tmp1).addReg(Tmp2);
1939 break;
1940 }
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001941 }
1942 }
1943 else
1944 assert(0 && "this setcc not implemented yet");
1945
1946 return Result;
1947 }
1948
1949 case ISD::EXTLOAD:
1950 case ISD::ZEXTLOAD:
1951 case ISD::LOAD: {
1952 // Make sure we generate both values.
1953 if (Result != 1)
1954 ExprMap[N.getValue(1)] = 1; // Generate the token
1955 else
1956 Result = ExprMap[N.getValue(0)] = MakeReg(N.getValue(0).getValueType());
1957
1958 bool isBool=false;
Misha Brukman4633f1c2005-04-21 23:13:11 +00001959
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001960 if(opcode == ISD::LOAD) { // this is a LOAD
1961 switch (Node->getValueType(0)) {
Misha Brukman7847fca2005-04-22 17:54:37 +00001962 default: assert(0 && "Cannot load this type!");
1963 case MVT::i1: Opc = IA64::LD1; isBool=true; break;
1964 // FIXME: for now, we treat bool loads the same as i8 loads */
1965 case MVT::i8: Opc = IA64::LD1; break;
1966 case MVT::i16: Opc = IA64::LD2; break;
1967 case MVT::i32: Opc = IA64::LD4; break;
1968 case MVT::i64: Opc = IA64::LD8; break;
1969
1970 case MVT::f32: Opc = IA64::LDF4; break;
1971 case MVT::f64: Opc = IA64::LDF8; break;
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001972 }
1973 } else { // this is an EXTLOAD or ZEXTLOAD
1974 MVT::ValueType TypeBeingLoaded = cast<MVTSDNode>(Node)->getExtraValueType();
1975 switch (TypeBeingLoaded) {
Misha Brukman7847fca2005-04-22 17:54:37 +00001976 default: assert(0 && "Cannot extload/zextload this type!");
1977 // FIXME: bools?
1978 case MVT::i8: Opc = IA64::LD1; break;
1979 case MVT::i16: Opc = IA64::LD2; break;
1980 case MVT::i32: Opc = IA64::LD4; break;
1981 case MVT::f32: Opc = IA64::LDF4; break;
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001982 }
1983 }
Misha Brukman4633f1c2005-04-21 23:13:11 +00001984
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001985 SDOperand Chain = N.getOperand(0);
1986 SDOperand Address = N.getOperand(1);
1987
1988 if(Address.getOpcode() == ISD::GlobalAddress) {
1989 Select(Chain);
1990 unsigned dummy = MakeReg(MVT::i64);
1991 unsigned dummy2 = MakeReg(MVT::i64);
1992 BuildMI(BB, IA64::ADD, 2, dummy)
Misha Brukman7847fca2005-04-22 17:54:37 +00001993 .addGlobalAddress(cast<GlobalAddressSDNode>(Address)->getGlobal())
1994 .addReg(IA64::r1);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001995 BuildMI(BB, IA64::LD8, 1, dummy2).addReg(dummy);
1996 if(!isBool)
Misha Brukman7847fca2005-04-22 17:54:37 +00001997 BuildMI(BB, Opc, 1, Result).addReg(dummy2);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00001998 else { // emit a little pseudocode to load a bool (stored in one byte)
Misha Brukman7847fca2005-04-22 17:54:37 +00001999 // into a predicate register
2000 assert(Opc==IA64::LD1 && "problem loading a bool");
2001 unsigned dummy3 = MakeReg(MVT::i64);
2002 BuildMI(BB, Opc, 1, dummy3).addReg(dummy2);
2003 // we compare to 0. true? 0. false? 1.
2004 BuildMI(BB, IA64::CMPNE, 2, Result).addReg(dummy3).addReg(IA64::r0);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002005 }
2006 } else if(ConstantPoolSDNode *CP = dyn_cast<ConstantPoolSDNode>(Address)) {
2007 Select(Chain);
2008 IA64Lowering.restoreGP(BB);
2009 unsigned dummy = MakeReg(MVT::i64);
2010 BuildMI(BB, IA64::ADD, 2, dummy).addConstantPoolIndex(CP->getIndex())
Misha Brukman7847fca2005-04-22 17:54:37 +00002011 .addReg(IA64::r1); // CPI+GP
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002012 if(!isBool)
Misha Brukman7847fca2005-04-22 17:54:37 +00002013 BuildMI(BB, Opc, 1, Result).addReg(dummy);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002014 else { // emit a little pseudocode to load a bool (stored in one byte)
Misha Brukman7847fca2005-04-22 17:54:37 +00002015 // into a predicate register
2016 assert(Opc==IA64::LD1 && "problem loading a bool");
2017 unsigned dummy3 = MakeReg(MVT::i64);
2018 BuildMI(BB, Opc, 1, dummy3).addReg(dummy);
2019 // we compare to 0. true? 0. false? 1.
2020 BuildMI(BB, IA64::CMPNE, 2, Result).addReg(dummy3).addReg(IA64::r0);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002021 }
2022 } else if(Address.getOpcode() == ISD::FrameIndex) {
2023 Select(Chain); // FIXME ? what about bools?
2024 unsigned dummy = MakeReg(MVT::i64);
2025 BuildMI(BB, IA64::MOV, 1, dummy)
Misha Brukman7847fca2005-04-22 17:54:37 +00002026 .addFrameIndex(cast<FrameIndexSDNode>(Address)->getIndex());
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002027 if(!isBool)
Misha Brukman7847fca2005-04-22 17:54:37 +00002028 BuildMI(BB, Opc, 1, Result).addReg(dummy);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002029 else { // emit a little pseudocode to load a bool (stored in one byte)
Misha Brukman7847fca2005-04-22 17:54:37 +00002030 // into a predicate register
2031 assert(Opc==IA64::LD1 && "problem loading a bool");
2032 unsigned dummy3 = MakeReg(MVT::i64);
2033 BuildMI(BB, Opc, 1, dummy3).addReg(dummy);
2034 // we compare to 0. true? 0. false? 1.
2035 BuildMI(BB, IA64::CMPNE, 2, Result).addReg(dummy3).addReg(IA64::r0);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002036 }
Misha Brukman4633f1c2005-04-21 23:13:11 +00002037 } else { // none of the above...
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002038 Select(Chain);
2039 Tmp2 = SelectExpr(Address);
2040 if(!isBool)
Misha Brukman7847fca2005-04-22 17:54:37 +00002041 BuildMI(BB, Opc, 1, Result).addReg(Tmp2);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002042 else { // emit a little pseudocode to load a bool (stored in one byte)
Misha Brukman7847fca2005-04-22 17:54:37 +00002043 // into a predicate register
2044 assert(Opc==IA64::LD1 && "problem loading a bool");
2045 unsigned dummy = MakeReg(MVT::i64);
2046 BuildMI(BB, Opc, 1, dummy).addReg(Tmp2);
2047 // we compare to 0. true? 0. false? 1.
2048 BuildMI(BB, IA64::CMPNE, 2, Result).addReg(dummy).addReg(IA64::r0);
2049 }
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002050 }
2051
2052 return Result;
2053 }
Misha Brukman4633f1c2005-04-21 23:13:11 +00002054
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002055 case ISD::CopyFromReg: {
2056 if (Result == 1)
Misha Brukman4633f1c2005-04-21 23:13:11 +00002057 Result = ExprMap[N.getValue(0)] =
Misha Brukman7847fca2005-04-22 17:54:37 +00002058 MakeReg(N.getValue(0).getValueType());
Misha Brukman4633f1c2005-04-21 23:13:11 +00002059
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002060 SDOperand Chain = N.getOperand(0);
2061
2062 Select(Chain);
2063 unsigned r = dyn_cast<RegSDNode>(Node)->getReg();
2064
2065 if(N.getValueType() == MVT::i1) // if a bool, we use pseudocode
Misha Brukman7847fca2005-04-22 17:54:37 +00002066 BuildMI(BB, IA64::PCMPEQUNC, 3, Result)
2067 .addReg(IA64::r0).addReg(IA64::r0).addReg(r);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002068 // (r) Result =cmp.eq.unc(r0,r0)
2069 else
Misha Brukman7847fca2005-04-22 17:54:37 +00002070 BuildMI(BB, IA64::MOV, 1, Result).addReg(r); // otherwise MOV
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002071 return Result;
2072 }
2073
2074 case ISD::CALL: {
2075 Select(N.getOperand(0));
2076
2077 // The chain for this call is now lowered.
2078 ExprMap.insert(std::make_pair(N.getValue(Node->getNumValues()-1), 1));
Misha Brukman4633f1c2005-04-21 23:13:11 +00002079
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002080 //grab the arguments
2081 std::vector<unsigned> argvregs;
2082
2083 for(int i = 2, e = Node->getNumOperands(); i < e; ++i)
Misha Brukman7847fca2005-04-22 17:54:37 +00002084 argvregs.push_back(SelectExpr(N.getOperand(i)));
Misha Brukman4633f1c2005-04-21 23:13:11 +00002085
2086 // see section 8.5.8 of "Itanium Software Conventions and
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002087 // Runtime Architecture Guide to see some examples of what's going
2088 // on here. (in short: int args get mapped 1:1 'slot-wise' to out0->out7,
2089 // while FP args get mapped to F8->F15 as needed)
2090
2091 unsigned used_FPArgs=0; // how many FP Args have been used so far?
Misha Brukman4633f1c2005-04-21 23:13:11 +00002092
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002093 // in reg args
2094 for(int i = 0, e = std::min(8, (int)argvregs.size()); i < e; ++i)
2095 {
Misha Brukman7847fca2005-04-22 17:54:37 +00002096 unsigned intArgs[] = {IA64::out0, IA64::out1, IA64::out2, IA64::out3,
2097 IA64::out4, IA64::out5, IA64::out6, IA64::out7 };
2098 unsigned FPArgs[] = {IA64::F8, IA64::F9, IA64::F10, IA64::F11,
2099 IA64::F12, IA64::F13, IA64::F14, IA64::F15 };
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002100
Misha Brukman7847fca2005-04-22 17:54:37 +00002101 switch(N.getOperand(i+2).getValueType())
2102 {
2103 default: // XXX do we need to support MVT::i1 here?
2104 Node->dump();
2105 N.getOperand(i).Val->dump();
2106 std::cerr << "Type for " << i << " is: " <<
2107 N.getOperand(i+2).getValueType() << std::endl;
2108 assert(0 && "Unknown value type for call");
2109 case MVT::i64:
2110 BuildMI(BB, IA64::MOV, 1, intArgs[i]).addReg(argvregs[i]);
2111 break;
2112 case MVT::f64:
2113 BuildMI(BB, IA64::FMOV, 1, FPArgs[used_FPArgs++])
2114 .addReg(argvregs[i]);
2115 // FIXME: we don't need to do this _all_ the time:
2116 BuildMI(BB, IA64::GETFD, 1, intArgs[i]).addReg(argvregs[i]);
2117 break;
2118 }
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002119 }
2120
2121 //in mem args
2122 for (int i = 8, e = argvregs.size(); i < e; ++i)
2123 {
Misha Brukman7847fca2005-04-22 17:54:37 +00002124 unsigned tempAddr = MakeReg(MVT::i64);
2125
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002126 switch(N.getOperand(i+2).getValueType()) {
Misha Brukman4633f1c2005-04-21 23:13:11 +00002127 default:
2128 Node->dump();
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002129 N.getOperand(i).Val->dump();
Misha Brukman4633f1c2005-04-21 23:13:11 +00002130 std::cerr << "Type for " << i << " is: " <<
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002131 N.getOperand(i+2).getValueType() << "\n";
2132 assert(0 && "Unknown value type for call");
2133 case MVT::i1: // FIXME?
2134 case MVT::i8:
2135 case MVT::i16:
2136 case MVT::i32:
2137 case MVT::i64:
Misha Brukman7847fca2005-04-22 17:54:37 +00002138 BuildMI(BB, IA64::ADDIMM22, 2, tempAddr)
2139 .addReg(IA64::r12).addImm(16 + (i - 8) * 8); // r12 is SP
2140 BuildMI(BB, IA64::ST8, 2).addReg(tempAddr).addReg(argvregs[i]);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002141 break;
2142 case MVT::f32:
2143 case MVT::f64:
2144 BuildMI(BB, IA64::ADDIMM22, 2, tempAddr)
Misha Brukman7847fca2005-04-22 17:54:37 +00002145 .addReg(IA64::r12).addImm(16 + (i - 8) * 8); // r12 is SP
2146 BuildMI(BB, IA64::STF8, 2).addReg(tempAddr).addReg(argvregs[i]);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002147 break;
2148 }
2149 }
Duraid Madinabeeaab22005-03-31 12:31:11 +00002150
2151 /* XXX we want to re-enable direct branches! crippling them now
Misha Brukman4633f1c2005-04-21 23:13:11 +00002152 * to stress-test indirect branches.:
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002153 //build the right kind of call
2154 if (GlobalAddressSDNode *GASD =
Misha Brukman4633f1c2005-04-21 23:13:11 +00002155 dyn_cast<GlobalAddressSDNode>(N.getOperand(1)))
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002156 {
Misha Brukman7847fca2005-04-22 17:54:37 +00002157 BuildMI(BB, IA64::BRCALL, 1).addGlobalAddress(GASD->getGlobal(),true);
2158 IA64Lowering.restoreGP_SP_RP(BB);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002159 }
Misha Brukman4633f1c2005-04-21 23:13:11 +00002160 ^^^^^^^^^^^^^ we want this code one day XXX */
Duraid Madinabeeaab22005-03-31 12:31:11 +00002161 if (ExternalSymbolSDNode *ESSDN =
Misha Brukman7847fca2005-04-22 17:54:37 +00002162 dyn_cast<ExternalSymbolSDNode>(N.getOperand(1)))
Duraid Madinabeeaab22005-03-31 12:31:11 +00002163 { // FIXME : currently need this case for correctness, to avoid
Misha Brukman7847fca2005-04-22 17:54:37 +00002164 // "non-pic code with imm relocation against dynamic symbol" errors
2165 BuildMI(BB, IA64::BRCALL, 1)
2166 .addExternalSymbol(ESSDN->getSymbol(), true);
2167 IA64Lowering.restoreGP_SP_RP(BB);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002168 }
2169 else {
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002170 Tmp1 = SelectExpr(N.getOperand(1));
Duraid Madinabeeaab22005-03-31 12:31:11 +00002171
2172 unsigned targetEntryPoint=MakeReg(MVT::i64);
2173 unsigned targetGPAddr=MakeReg(MVT::i64);
2174 unsigned currentGP=MakeReg(MVT::i64);
Misha Brukman4633f1c2005-04-21 23:13:11 +00002175
Duraid Madinabeeaab22005-03-31 12:31:11 +00002176 // b6 is a scratch branch register, we load the target entry point
2177 // from the base of the function descriptor
2178 BuildMI(BB, IA64::LD8, 1, targetEntryPoint).addReg(Tmp1);
2179 BuildMI(BB, IA64::MOV, 1, IA64::B6).addReg(targetEntryPoint);
2180
2181 // save the current GP:
2182 BuildMI(BB, IA64::MOV, 1, currentGP).addReg(IA64::r1);
Misha Brukman4633f1c2005-04-21 23:13:11 +00002183
Duraid Madinabeeaab22005-03-31 12:31:11 +00002184 /* TODO: we need to make sure doing this never, ever loads a
2185 * bogus value into r1 (GP). */
2186 // load the target GP (which is at mem[functiondescriptor+8])
2187 BuildMI(BB, IA64::ADDIMM22, 2, targetGPAddr)
Misha Brukman7847fca2005-04-22 17:54:37 +00002188 .addReg(Tmp1).addImm(8); // FIXME: addimm22? why not postincrement ld
Duraid Madinabeeaab22005-03-31 12:31:11 +00002189 BuildMI(BB, IA64::LD8, 1, IA64::r1).addReg(targetGPAddr);
2190
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002191 // and then jump: (well, call)
2192 BuildMI(BB, IA64::BRCALL, 1).addReg(IA64::B6);
Duraid Madinabeeaab22005-03-31 12:31:11 +00002193 // and finally restore the old GP
2194 BuildMI(BB, IA64::MOV, 1, IA64::r1).addReg(currentGP);
2195 IA64Lowering.restoreSP_RP(BB);
2196 }
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002197
2198 switch (Node->getValueType(0)) {
2199 default: assert(0 && "Unknown value type for call result!");
2200 case MVT::Other: return 1;
2201 case MVT::i1:
2202 BuildMI(BB, IA64::CMPNE, 2, Result)
Misha Brukman7847fca2005-04-22 17:54:37 +00002203 .addReg(IA64::r8).addReg(IA64::r0);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002204 break;
2205 case MVT::i8:
2206 case MVT::i16:
2207 case MVT::i32:
2208 case MVT::i64:
2209 BuildMI(BB, IA64::MOV, 1, Result).addReg(IA64::r8);
2210 break;
2211 case MVT::f64:
2212 BuildMI(BB, IA64::FMOV, 1, Result).addReg(IA64::F8);
2213 break;
2214 }
2215 return Result+N.ResNo;
2216 }
2217
Misha Brukman4633f1c2005-04-21 23:13:11 +00002218 } // <- uhhh XXX
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002219 return 0;
2220}
2221
2222void ISel::Select(SDOperand N) {
2223 unsigned Tmp1, Tmp2, Opc;
2224 unsigned opcode = N.getOpcode();
2225
Nate Begeman85fdeb22005-03-24 04:39:54 +00002226 if (!LoweredTokens.insert(N).second)
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002227 return; // Already selected.
2228
2229 SDNode *Node = N.Val;
2230
2231 switch (Node->getOpcode()) {
2232 default:
2233 Node->dump(); std::cerr << "\n";
2234 assert(0 && "Node not handled yet!");
2235
2236 case ISD::EntryToken: return; // Noop
Misha Brukman4633f1c2005-04-21 23:13:11 +00002237
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002238 case ISD::TokenFactor: {
2239 for (unsigned i = 0, e = Node->getNumOperands(); i != e; ++i)
2240 Select(Node->getOperand(i));
2241 return;
2242 }
2243
2244 case ISD::CopyToReg: {
2245 Select(N.getOperand(0));
Misha Brukman4633f1c2005-04-21 23:13:11 +00002246 Tmp1 = SelectExpr(N.getOperand(1));
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002247 Tmp2 = cast<RegSDNode>(N)->getReg();
Misha Brukman4633f1c2005-04-21 23:13:11 +00002248
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002249 if (Tmp1 != Tmp2) {
2250 if(N.getValueType() == MVT::i1) // if a bool, we use pseudocode
Misha Brukman7847fca2005-04-22 17:54:37 +00002251 BuildMI(BB, IA64::PCMPEQUNC, 3, Tmp2)
2252 .addReg(IA64::r0).addReg(IA64::r0).addReg(Tmp1);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002253 // (Tmp1) Tmp2 = cmp.eq.unc(r0,r0)
2254 else
Misha Brukman7847fca2005-04-22 17:54:37 +00002255 BuildMI(BB, IA64::MOV, 1, Tmp2).addReg(Tmp1);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002256 // XXX is this the right way 'round? ;)
2257 }
2258 return;
2259 }
Misha Brukman4633f1c2005-04-21 23:13:11 +00002260
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002261 case ISD::RET: {
2262
2263 /* what the heck is going on here:
2264
2265<_sabre_> ret with two operands is obvious: chain and value
2266<camel_> yep
2267<_sabre_> ret with 3 values happens when 'expansion' occurs
2268<_sabre_> e.g. i64 gets split into 2x i32
2269<camel_> oh right
2270<_sabre_> you don't have this case on ia64
2271<camel_> yep
2272<_sabre_> so the two returned values go into EAX/EDX on ia32
2273<camel_> ahhh *memories*
2274<_sabre_> :)
2275<camel_> ok, thanks :)
2276<_sabre_> so yeah, everything that has a side effect takes a 'token chain'
2277<_sabre_> this is the first operand always
2278<_sabre_> these operand often define chains, they are the last operand
2279<_sabre_> they are printed as 'ch' if you do DAG.dump()
2280 */
Misha Brukman4633f1c2005-04-21 23:13:11 +00002281
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002282 switch (N.getNumOperands()) {
2283 default:
2284 assert(0 && "Unknown return instruction!");
2285 case 2:
2286 Select(N.getOperand(0));
2287 Tmp1 = SelectExpr(N.getOperand(1));
2288 switch (N.getOperand(1).getValueType()) {
2289 default: assert(0 && "All other types should have been promoted!!");
Misha Brukman7847fca2005-04-22 17:54:37 +00002290 // FIXME: do I need to add support for bools here?
2291 // (return '0' or '1' r8, basically...)
2292 //
2293 // FIXME: need to round floats - 80 bits is bad, the tester
2294 // told me so
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002295 case MVT::i64:
Misha Brukman7847fca2005-04-22 17:54:37 +00002296 // we mark r8 as live on exit up above in LowerArguments()
2297 BuildMI(BB, IA64::MOV, 1, IA64::r8).addReg(Tmp1);
2298 break;
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002299 case MVT::f64:
Misha Brukman7847fca2005-04-22 17:54:37 +00002300 // we mark F8 as live on exit up above in LowerArguments()
2301 BuildMI(BB, IA64::FMOV, 1, IA64::F8).addReg(Tmp1);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002302 }
2303 break;
2304 case 1:
2305 Select(N.getOperand(0));
2306 break;
2307 }
2308 // before returning, restore the ar.pfs register (set by the 'alloc' up top)
2309 BuildMI(BB, IA64::MOV, 1).addReg(IA64::AR_PFS).addReg(IA64Lowering.VirtGPR);
2310 BuildMI(BB, IA64::RET, 0); // and then just emit a 'ret' instruction
2311 return;
2312 }
Misha Brukman4633f1c2005-04-21 23:13:11 +00002313
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002314 case ISD::BR: {
2315 Select(N.getOperand(0));
2316 MachineBasicBlock *Dest =
2317 cast<BasicBlockSDNode>(N.getOperand(1))->getBasicBlock();
2318 BuildMI(BB, IA64::BRLCOND_NOTCALL, 1).addReg(IA64::p0).addMBB(Dest);
2319 // XXX HACK! we do _not_ need long branches all the time
2320 return;
2321 }
2322
2323 case ISD::ImplicitDef: {
2324 Select(N.getOperand(0));
2325 BuildMI(BB, IA64::IDEF, 0, cast<RegSDNode>(N)->getReg());
2326 return;
2327 }
2328
2329 case ISD::BRCOND: {
2330 MachineBasicBlock *Dest =
2331 cast<BasicBlockSDNode>(N.getOperand(2))->getBasicBlock();
2332
2333 Select(N.getOperand(0));
2334 Tmp1 = SelectExpr(N.getOperand(1));
2335 BuildMI(BB, IA64::BRLCOND_NOTCALL, 1).addReg(Tmp1).addMBB(Dest);
2336 // XXX HACK! we do _not_ need long branches all the time
2337 return;
2338 }
Misha Brukman4633f1c2005-04-21 23:13:11 +00002339
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002340 case ISD::EXTLOAD:
2341 case ISD::ZEXTLOAD:
2342 case ISD::SEXTLOAD:
2343 case ISD::LOAD:
2344 case ISD::CALL:
2345 case ISD::CopyFromReg:
2346 case ISD::DYNAMIC_STACKALLOC:
2347 SelectExpr(N);
2348 return;
2349
2350 case ISD::TRUNCSTORE:
2351 case ISD::STORE: {
2352 Select(N.getOperand(0));
2353 Tmp1 = SelectExpr(N.getOperand(1)); // value
2354
2355 bool isBool=false;
Misha Brukman4633f1c2005-04-21 23:13:11 +00002356
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002357 if(opcode == ISD::STORE) {
Misha Brukman7847fca2005-04-22 17:54:37 +00002358 switch (N.getOperand(1).getValueType()) {
2359 default: assert(0 && "Cannot store this type!");
2360 case MVT::i1: Opc = IA64::ST1; isBool=true; break;
2361 // FIXME?: for now, we treat bool loads the same as i8 stores */
2362 case MVT::i8: Opc = IA64::ST1; break;
2363 case MVT::i16: Opc = IA64::ST2; break;
2364 case MVT::i32: Opc = IA64::ST4; break;
2365 case MVT::i64: Opc = IA64::ST8; break;
2366
2367 case MVT::f32: Opc = IA64::STF4; break;
2368 case MVT::f64: Opc = IA64::STF8; break;
2369 }
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002370 } else { // truncstore
Misha Brukman7847fca2005-04-22 17:54:37 +00002371 switch(cast<MVTSDNode>(Node)->getExtraValueType()) {
2372 default: assert(0 && "unknown type in truncstore");
2373 case MVT::i1: Opc = IA64::ST1; isBool=true; break;
2374 //FIXME: DAG does not promote this load?
2375 case MVT::i8: Opc = IA64::ST1; break;
2376 case MVT::i16: Opc = IA64::ST2; break;
2377 case MVT::i32: Opc = IA64::ST4; break;
2378 case MVT::f32: Opc = IA64::STF4; break;
2379 }
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002380 }
2381
2382 if(N.getOperand(2).getOpcode() == ISD::GlobalAddress) {
Misha Brukman7847fca2005-04-22 17:54:37 +00002383 unsigned dummy = MakeReg(MVT::i64);
2384 unsigned dummy2 = MakeReg(MVT::i64);
2385 BuildMI(BB, IA64::ADD, 2, dummy)
2386 .addGlobalAddress(cast<GlobalAddressSDNode>
2387 (N.getOperand(2))->getGlobal()).addReg(IA64::r1);
2388 BuildMI(BB, IA64::LD8, 1, dummy2).addReg(dummy);
Misha Brukman4633f1c2005-04-21 23:13:11 +00002389
Misha Brukman7847fca2005-04-22 17:54:37 +00002390 if(!isBool)
2391 BuildMI(BB, Opc, 2).addReg(dummy2).addReg(Tmp1);
2392 else { // we are storing a bool, so emit a little pseudocode
2393 // to store a predicate register as one byte
2394 assert(Opc==IA64::ST1);
2395 unsigned dummy3 = MakeReg(MVT::i64);
2396 unsigned dummy4 = MakeReg(MVT::i64);
2397 BuildMI(BB, IA64::MOV, 1, dummy3).addReg(IA64::r0);
2398 BuildMI(BB, IA64::TPCADDIMM22, 2, dummy4)
2399 .addReg(dummy3).addImm(1).addReg(Tmp1); // if(Tmp1) dummy=0+1;
2400 BuildMI(BB, Opc, 2).addReg(dummy2).addReg(dummy4);
2401 }
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002402 } else if(N.getOperand(2).getOpcode() == ISD::FrameIndex) {
2403
Misha Brukman7847fca2005-04-22 17:54:37 +00002404 // FIXME? (what about bools?)
2405
2406 unsigned dummy = MakeReg(MVT::i64);
2407 BuildMI(BB, IA64::MOV, 1, dummy)
2408 .addFrameIndex(cast<FrameIndexSDNode>(N.getOperand(2))->getIndex());
2409 BuildMI(BB, Opc, 2).addReg(dummy).addReg(Tmp1);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002410 } else { // otherwise
Misha Brukman7847fca2005-04-22 17:54:37 +00002411 Tmp2 = SelectExpr(N.getOperand(2)); //address
2412 if(!isBool)
2413 BuildMI(BB, Opc, 2).addReg(Tmp2).addReg(Tmp1);
2414 else { // we are storing a bool, so emit a little pseudocode
2415 // to store a predicate register as one byte
2416 assert(Opc==IA64::ST1);
2417 unsigned dummy3 = MakeReg(MVT::i64);
2418 unsigned dummy4 = MakeReg(MVT::i64);
2419 BuildMI(BB, IA64::MOV, 1, dummy3).addReg(IA64::r0);
2420 BuildMI(BB, IA64::TPCADDIMM22, 2, dummy4)
2421 .addReg(dummy3).addImm(1).addReg(Tmp1); // if(Tmp1) dummy=0+1;
2422 BuildMI(BB, Opc, 2).addReg(Tmp2).addReg(dummy4);
2423 }
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002424 }
2425 return;
2426 }
Misha Brukman4633f1c2005-04-21 23:13:11 +00002427
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002428 case ISD::ADJCALLSTACKDOWN:
2429 case ISD::ADJCALLSTACKUP: {
2430 Select(N.getOperand(0));
2431 Tmp1 = cast<ConstantSDNode>(N.getOperand(1))->getValue();
Misha Brukman4633f1c2005-04-21 23:13:11 +00002432
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002433 Opc = N.getOpcode() == ISD::ADJCALLSTACKDOWN ? IA64::ADJUSTCALLSTACKDOWN :
2434 IA64::ADJUSTCALLSTACKUP;
2435 BuildMI(BB, Opc, 1).addImm(Tmp1);
2436 return;
2437 }
2438
2439 return;
2440 }
2441 assert(0 && "GAME OVER. INSERT COIN?");
2442}
2443
2444
2445/// createIA64PatternInstructionSelector - This pass converts an LLVM function
2446/// into a machine code representation using pattern matching and a machine
2447/// description file.
2448///
2449FunctionPass *llvm::createIA64PatternInstructionSelector(TargetMachine &TM) {
Misha Brukman4633f1c2005-04-21 23:13:11 +00002450 return new ISel(TM);
Duraid Madina9b9d45f2005-03-17 18:17:03 +00002451}
2452
2453