//===-- PPCISelLowering.cpp - PPC DAG Lowering Implementation -------------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file implements the PPCISelLowering class.
//
//===----------------------------------------------------------------------===//

#include "PPCISelLowering.h"
#include "PPCMachineFunctionInfo.h"
#include "PPCPredicates.h"
#include "PPCTargetMachine.h"
#include "PPCPerfectShuffle.h"
#include "llvm/ADT/STLExtras.h"
#include "llvm/ADT/VectorExtras.h"
#include "llvm/Analysis/ScalarEvolutionExpressions.h"
#include "llvm/CodeGen/CallingConvLower.h"
#include "llvm/CodeGen/MachineFrameInfo.h"
#include "llvm/CodeGen/MachineFunction.h"
#include "llvm/CodeGen/MachineInstrBuilder.h"
#include "llvm/CodeGen/MachineRegisterInfo.h"
#include "llvm/CodeGen/PseudoSourceValue.h"
#include "llvm/CodeGen/SelectionDAG.h"
#include "llvm/CallingConv.h"
#include "llvm/Constants.h"
#include "llvm/Function.h"
#include "llvm/Intrinsics.h"
#include "llvm/ParameterAttributes.h"
#include "llvm/Support/MathExtras.h"
#include "llvm/Target/TargetOptions.h"
#include "llvm/Support/CommandLine.h"
using namespace llvm;

static cl::opt<bool> EnablePPCPreinc("enable-ppc-preinc",
  cl::desc("enable preincrement load/store generation on PPC (experimental)"),
  cl::Hidden);

PPCTargetLowering::PPCTargetLowering(PPCTargetMachine &TM)
  : TargetLowering(TM), PPCSubTarget(*TM.getSubtargetImpl()),
    PPCAtomicLabelIndex(0) {

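  // A signed divide by a power of two is a short srawi/addze sequence on PPC,
  // so keep such divides rather than having the DAG combiner expand them.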
  setPow2DivIsCheap();

  // Use _setjmp/_longjmp instead of setjmp/longjmp.
  setUseUnderscoreSetJmp(true);
  setUseUnderscoreLongJmp(true);

  // Set up the register classes.
  addRegisterClass(MVT::i32, PPC::GPRCRegisterClass);
  addRegisterClass(MVT::f32, PPC::F4RCRegisterClass);
  addRegisterClass(MVT::f64, PPC::F8RCRegisterClass);

  // PowerPC has an i16 but no i8 (or i1) SEXTLOAD
  setLoadXAction(ISD::SEXTLOAD, MVT::i1, Promote);
  setLoadXAction(ISD::SEXTLOAD, MVT::i8, Expand);

  setTruncStoreAction(MVT::f64, MVT::f32, Expand);

Dan Gohmanf17a25c2007-07-18 16:29:46 +000064 // PowerPC has pre-inc load and store's.
  setIndexedLoadAction(ISD::PRE_INC, MVT::i1, Legal);
  setIndexedLoadAction(ISD::PRE_INC, MVT::i8, Legal);
  setIndexedLoadAction(ISD::PRE_INC, MVT::i16, Legal);
  setIndexedLoadAction(ISD::PRE_INC, MVT::i32, Legal);
  setIndexedLoadAction(ISD::PRE_INC, MVT::i64, Legal);
  setIndexedStoreAction(ISD::PRE_INC, MVT::i1, Legal);
  setIndexedStoreAction(ISD::PRE_INC, MVT::i8, Legal);
  setIndexedStoreAction(ISD::PRE_INC, MVT::i16, Legal);
  setIndexedStoreAction(ISD::PRE_INC, MVT::i32, Legal);
  setIndexedStoreAction(ISD::PRE_INC, MVT::i64, Legal);

  // Shortening conversions involving ppcf128 get expanded (2 regs -> 1 reg)
  setConvertAction(MVT::ppcf128, MVT::f64, Expand);
  setConvertAction(MVT::ppcf128, MVT::f32, Expand);
  // This is used in the ppcf128->int sequence. Note it has different semantics
  // from FP_ROUND: that rounds to nearest, this rounds to zero.
  setOperationAction(ISD::FP_ROUND_INREG, MVT::ppcf128, Custom);

  // PowerPC has no intrinsics for these particular operations
  setOperationAction(ISD::MEMBARRIER, MVT::Other, Expand);

  // PowerPC has no SREM/UREM instructions
  setOperationAction(ISD::SREM, MVT::i32, Expand);
  setOperationAction(ISD::UREM, MVT::i32, Expand);
  setOperationAction(ISD::SREM, MVT::i64, Expand);
  setOperationAction(ISD::UREM, MVT::i64, Expand);

  // Don't use SMUL_LOHI/UMUL_LOHI or SDIVREM/UDIVREM to lower SREM/UREM.
  setOperationAction(ISD::UMUL_LOHI, MVT::i32, Expand);
  setOperationAction(ISD::SMUL_LOHI, MVT::i32, Expand);
  setOperationAction(ISD::UMUL_LOHI, MVT::i64, Expand);
  setOperationAction(ISD::SMUL_LOHI, MVT::i64, Expand);
  setOperationAction(ISD::UDIVREM, MVT::i32, Expand);
  setOperationAction(ISD::SDIVREM, MVT::i32, Expand);
  setOperationAction(ISD::UDIVREM, MVT::i64, Expand);
  setOperationAction(ISD::SDIVREM, MVT::i64, Expand);

  // We don't support sin/cos/sqrt/fmod/pow
  setOperationAction(ISD::FSIN , MVT::f64, Expand);
  setOperationAction(ISD::FCOS , MVT::f64, Expand);
  setOperationAction(ISD::FREM , MVT::f64, Expand);
  setOperationAction(ISD::FPOW , MVT::f64, Expand);
  setOperationAction(ISD::FSIN , MVT::f32, Expand);
  setOperationAction(ISD::FCOS , MVT::f32, Expand);
  setOperationAction(ISD::FREM , MVT::f32, Expand);
  setOperationAction(ISD::FPOW , MVT::f32, Expand);

  setOperationAction(ISD::FLT_ROUNDS_, MVT::i32, Custom);

  // If the subtarget lacks a hardware square-root instruction, expand FSQRT.
  if (!TM.getSubtarget<PPCSubtarget>().hasFSQRT()) {
    setOperationAction(ISD::FSQRT, MVT::f64, Expand);
    setOperationAction(ISD::FSQRT, MVT::f32, Expand);
  }

  setOperationAction(ISD::FCOPYSIGN, MVT::f64, Expand);
  setOperationAction(ISD::FCOPYSIGN, MVT::f32, Expand);

  // PowerPC does not have BSWAP, CTPOP or CTTZ
  setOperationAction(ISD::BSWAP, MVT::i32  , Expand);
  setOperationAction(ISD::CTPOP, MVT::i32  , Expand);
  setOperationAction(ISD::CTTZ , MVT::i32  , Expand);
  setOperationAction(ISD::BSWAP, MVT::i64  , Expand);
  setOperationAction(ISD::CTPOP, MVT::i64  , Expand);
  setOperationAction(ISD::CTTZ , MVT::i64  , Expand);

  // PowerPC does not have ROTR
  setOperationAction(ISD::ROTR, MVT::i32   , Expand);

  // PowerPC does not have Select
  setOperationAction(ISD::SELECT, MVT::i32, Expand);
  setOperationAction(ISD::SELECT, MVT::i64, Expand);
  setOperationAction(ISD::SELECT, MVT::f32, Expand);
  setOperationAction(ISD::SELECT, MVT::f64, Expand);

  // PowerPC wants to turn select_cc of FP into fsel when possible.
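  // (fsel selects on "operand >= 0.0", so e.g. select_cc(a, b, tv, fv, SETGE)
  // can become fsel(a-b, tv, fv) when the ordering semantics permit it.)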
  setOperationAction(ISD::SELECT_CC, MVT::f32, Custom);
  setOperationAction(ISD::SELECT_CC, MVT::f64, Custom);

  // PowerPC wants to optimize integer setcc a bit
  setOperationAction(ISD::SETCC, MVT::i32, Custom);

  // PowerPC does not have BRCOND which requires SetCC
  setOperationAction(ISD::BRCOND, MVT::Other, Expand);

  setOperationAction(ISD::BR_JT, MVT::Other, Expand);

  // PowerPC turns FP_TO_SINT into FCTIWZ and some load/stores.
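  // (fctiwz leaves its result in a floating-point register and classic PPC
  // has no direct FPR->GPR move, so the value goes through a stack slot.)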
  setOperationAction(ISD::FP_TO_SINT, MVT::i32, Custom);

  // PowerPC does not have [U|S]INT_TO_FP
  setOperationAction(ISD::SINT_TO_FP, MVT::i32, Expand);
  setOperationAction(ISD::UINT_TO_FP, MVT::i32, Expand);

  setOperationAction(ISD::BIT_CONVERT, MVT::f32, Expand);
  setOperationAction(ISD::BIT_CONVERT, MVT::i32, Expand);
  setOperationAction(ISD::BIT_CONVERT, MVT::i64, Expand);
  setOperationAction(ISD::BIT_CONVERT, MVT::f64, Expand);

  // We cannot sextinreg(i1).  Expand to shifts.
  setOperationAction(ISD::SIGN_EXTEND_INREG, MVT::i1, Expand);

  // Support label based line numbers.
  setOperationAction(ISD::LOCATION, MVT::Other, Expand);
  setOperationAction(ISD::DEBUG_LOC, MVT::Other, Expand);

  setOperationAction(ISD::EXCEPTIONADDR, MVT::i64, Expand);
  setOperationAction(ISD::EHSELECTION,   MVT::i64, Expand);
  setOperationAction(ISD::EXCEPTIONADDR, MVT::i32, Expand);
  setOperationAction(ISD::EHSELECTION,   MVT::i32, Expand);

  // We want to legalize GlobalAddress and ConstantPool nodes into the
  // appropriate instructions to materialize the address.
  setOperationAction(ISD::GlobalAddress, MVT::i32, Custom);
  setOperationAction(ISD::GlobalTLSAddress, MVT::i32, Custom);
  setOperationAction(ISD::ConstantPool, MVT::i32, Custom);
  setOperationAction(ISD::JumpTable, MVT::i32, Custom);
  setOperationAction(ISD::GlobalAddress, MVT::i64, Custom);
  setOperationAction(ISD::GlobalTLSAddress, MVT::i64, Custom);
  setOperationAction(ISD::ConstantPool, MVT::i64, Custom);
  setOperationAction(ISD::JumpTable, MVT::i64, Custom);

  // RET must be custom lowered, to meet ABI requirements
  setOperationAction(ISD::RET, MVT::Other, Custom);

  // VASTART needs to be custom lowered to use the VarArgsFrameIndex
  setOperationAction(ISD::VASTART, MVT::Other, Custom);

  // VAARG is custom lowered with the ELF 32 ABI
  if (TM.getSubtarget<PPCSubtarget>().isELF32_ABI())
    setOperationAction(ISD::VAARG, MVT::Other, Custom);
  else
    setOperationAction(ISD::VAARG, MVT::Other, Expand);

  // Use the default implementation.
  setOperationAction(ISD::VACOPY            , MVT::Other, Expand);
  setOperationAction(ISD::VAEND             , MVT::Other, Expand);
  setOperationAction(ISD::STACKSAVE         , MVT::Other, Expand);
  setOperationAction(ISD::STACKRESTORE      , MVT::Other, Custom);
  setOperationAction(ISD::DYNAMIC_STACKALLOC, MVT::i32  , Custom);
  setOperationAction(ISD::DYNAMIC_STACKALLOC, MVT::i64  , Custom);

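  // Atomic operations are custom lowered to load-and-reserve /
  // store-conditional (lwarx/stwcx., or ldarx/stdcx. for i64) retry loops.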
  setOperationAction(ISD::ATOMIC_LAS , MVT::i32 , Custom);
  setOperationAction(ISD::ATOMIC_LCS , MVT::i32 , Custom);
  setOperationAction(ISD::ATOMIC_SWAP, MVT::i32 , Custom);
  if (TM.getSubtarget<PPCSubtarget>().has64BitSupport()) {
    setOperationAction(ISD::ATOMIC_LAS , MVT::i64 , Custom);
    setOperationAction(ISD::ATOMIC_LCS , MVT::i64 , Custom);
    setOperationAction(ISD::ATOMIC_SWAP, MVT::i64 , Custom);
  }

  // We want to custom lower some of our intrinsics.
  setOperationAction(ISD::INTRINSIC_WO_CHAIN, MVT::Other, Custom);

  if (TM.getSubtarget<PPCSubtarget>().has64BitSupport()) {
    // They also have instructions for converting between i64 and fp.
    setOperationAction(ISD::FP_TO_SINT, MVT::i64, Custom);
    setOperationAction(ISD::FP_TO_UINT, MVT::i64, Expand);
    setOperationAction(ISD::SINT_TO_FP, MVT::i64, Custom);
    setOperationAction(ISD::UINT_TO_FP, MVT::i64, Expand);
    setOperationAction(ISD::FP_TO_UINT, MVT::i32, Expand);

    // FIXME: disable this lowered code.  This generates 64-bit register values,
    // and we don't model the fact that the top part is clobbered by calls.  We
    // need to flag these together so that the value isn't live across a call.
    //setOperationAction(ISD::SINT_TO_FP, MVT::i32, Custom);

    // To take advantage of the above i64 FP_TO_SINT, promote i32 FP_TO_UINT
    setOperationAction(ISD::FP_TO_UINT, MVT::i32, Promote);
  } else {
    // PowerPC does not have FP_TO_UINT on 32-bit implementations.
    setOperationAction(ISD::FP_TO_UINT, MVT::i32, Expand);
  }

  if (TM.getSubtarget<PPCSubtarget>().use64BitRegs()) {
    // 64-bit PowerPC implementations can support i64 types directly
    addRegisterClass(MVT::i64, PPC::G8RCRegisterClass);
    // BUILD_PAIR can't be handled natively, and should be expanded to shl/or
    setOperationAction(ISD::BUILD_PAIR, MVT::i64, Expand);
    // 64-bit PowerPC wants to expand i128 shifts itself.
    setOperationAction(ISD::SHL_PARTS, MVT::i64, Custom);
    setOperationAction(ISD::SRA_PARTS, MVT::i64, Custom);
    setOperationAction(ISD::SRL_PARTS, MVT::i64, Custom);
  } else {
    // 32-bit PowerPC wants to expand i64 shifts itself.
    setOperationAction(ISD::SHL_PARTS, MVT::i32, Custom);
    setOperationAction(ISD::SRA_PARTS, MVT::i32, Custom);
    setOperationAction(ISD::SRL_PARTS, MVT::i32, Custom);
  }

  if (TM.getSubtarget<PPCSubtarget>().hasAltivec()) {
    // First set operation action for all vector types to expand.  Then we
    // will selectively turn on ones that can be effectively codegen'd.
    for (unsigned VT = (unsigned)MVT::FIRST_VECTOR_VALUETYPE;
         VT <= (unsigned)MVT::LAST_VECTOR_VALUETYPE; ++VT) {
      // add/sub are legal for all supported vector VT's.
      setOperationAction(ISD::ADD , (MVT::ValueType)VT, Legal);
      setOperationAction(ISD::SUB , (MVT::ValueType)VT, Legal);

      // We promote all shuffles to v16i8.
      setOperationAction(ISD::VECTOR_SHUFFLE, (MVT::ValueType)VT, Promote);
      AddPromotedToType (ISD::VECTOR_SHUFFLE, (MVT::ValueType)VT, MVT::v16i8);

      // We promote all non-typed operations to v4i32.
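      // (These operations don't care about the element type, so a single
      // v4i32 pattern can cover every 128-bit vector type.)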
      setOperationAction(ISD::AND   , (MVT::ValueType)VT, Promote);
      AddPromotedToType (ISD::AND   , (MVT::ValueType)VT, MVT::v4i32);
      setOperationAction(ISD::OR    , (MVT::ValueType)VT, Promote);
      AddPromotedToType (ISD::OR    , (MVT::ValueType)VT, MVT::v4i32);
      setOperationAction(ISD::XOR   , (MVT::ValueType)VT, Promote);
      AddPromotedToType (ISD::XOR   , (MVT::ValueType)VT, MVT::v4i32);
      setOperationAction(ISD::LOAD  , (MVT::ValueType)VT, Promote);
      AddPromotedToType (ISD::LOAD  , (MVT::ValueType)VT, MVT::v4i32);
      setOperationAction(ISD::SELECT, (MVT::ValueType)VT, Promote);
      AddPromotedToType (ISD::SELECT, (MVT::ValueType)VT, MVT::v4i32);
      setOperationAction(ISD::STORE , (MVT::ValueType)VT, Promote);
      AddPromotedToType (ISD::STORE , (MVT::ValueType)VT, MVT::v4i32);

      // No other operations are legal.
      setOperationAction(ISD::MUL , (MVT::ValueType)VT, Expand);
      setOperationAction(ISD::SDIV, (MVT::ValueType)VT, Expand);
      setOperationAction(ISD::SREM, (MVT::ValueType)VT, Expand);
      setOperationAction(ISD::UDIV, (MVT::ValueType)VT, Expand);
      setOperationAction(ISD::UREM, (MVT::ValueType)VT, Expand);
      setOperationAction(ISD::FDIV, (MVT::ValueType)VT, Expand);
      setOperationAction(ISD::FNEG, (MVT::ValueType)VT, Expand);
      setOperationAction(ISD::EXTRACT_VECTOR_ELT, (MVT::ValueType)VT, Expand);
      setOperationAction(ISD::INSERT_VECTOR_ELT, (MVT::ValueType)VT, Expand);
      setOperationAction(ISD::BUILD_VECTOR, (MVT::ValueType)VT, Expand);
      setOperationAction(ISD::UMUL_LOHI, (MVT::ValueType)VT, Expand);
      setOperationAction(ISD::SMUL_LOHI, (MVT::ValueType)VT, Expand);
      setOperationAction(ISD::UDIVREM, (MVT::ValueType)VT, Expand);
      setOperationAction(ISD::SDIVREM, (MVT::ValueType)VT, Expand);
      setOperationAction(ISD::SCALAR_TO_VECTOR, (MVT::ValueType)VT, Expand);
      setOperationAction(ISD::FPOW, (MVT::ValueType)VT, Expand);
      setOperationAction(ISD::CTPOP, (MVT::ValueType)VT, Expand);
      setOperationAction(ISD::CTLZ, (MVT::ValueType)VT, Expand);
      setOperationAction(ISD::CTTZ, (MVT::ValueType)VT, Expand);
    }

    // We can custom expand all VECTOR_SHUFFLEs to VPERM, others we can handle
    // with merges, splats, etc.
    setOperationAction(ISD::VECTOR_SHUFFLE, MVT::v16i8, Custom);

    setOperationAction(ISD::AND   , MVT::v4i32, Legal);
    setOperationAction(ISD::OR    , MVT::v4i32, Legal);
    setOperationAction(ISD::XOR   , MVT::v4i32, Legal);
    setOperationAction(ISD::LOAD  , MVT::v4i32, Legal);
    setOperationAction(ISD::SELECT, MVT::v4i32, Expand);
    setOperationAction(ISD::STORE , MVT::v4i32, Legal);

    addRegisterClass(MVT::v4f32, PPC::VRRCRegisterClass);
    addRegisterClass(MVT::v4i32, PPC::VRRCRegisterClass);
    addRegisterClass(MVT::v8i16, PPC::VRRCRegisterClass);
    addRegisterClass(MVT::v16i8, PPC::VRRCRegisterClass);

    setOperationAction(ISD::MUL, MVT::v4f32, Legal);
    setOperationAction(ISD::MUL, MVT::v4i32, Custom);
    setOperationAction(ISD::MUL, MVT::v8i16, Custom);
    setOperationAction(ISD::MUL, MVT::v16i8, Custom);

    setOperationAction(ISD::SCALAR_TO_VECTOR, MVT::v4f32, Custom);
    setOperationAction(ISD::SCALAR_TO_VECTOR, MVT::v4i32, Custom);

    setOperationAction(ISD::BUILD_VECTOR, MVT::v16i8, Custom);
    setOperationAction(ISD::BUILD_VECTOR, MVT::v8i16, Custom);
    setOperationAction(ISD::BUILD_VECTOR, MVT::v4i32, Custom);
    setOperationAction(ISD::BUILD_VECTOR, MVT::v4f32, Custom);
  }

  setShiftAmountType(MVT::i32);
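  // SETCC results are materialized with mfcr+rlwinm, which yields exactly
  // 0 or 1, so advertise that result range to the optimizers.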
  setSetCCResultContents(ZeroOrOneSetCCResult);

  if (TM.getSubtarget<PPCSubtarget>().isPPC64()) {
    setStackPointerRegisterToSaveRestore(PPC::X1);
    setExceptionPointerRegister(PPC::X3);
    setExceptionSelectorRegister(PPC::X4);
  } else {
    setStackPointerRegisterToSaveRestore(PPC::R1);
    setExceptionPointerRegister(PPC::R3);
    setExceptionSelectorRegister(PPC::R4);
  }

  // We have target-specific dag combine patterns for the following nodes:
  setTargetDAGCombine(ISD::SINT_TO_FP);
  setTargetDAGCombine(ISD::STORE);
  setTargetDAGCombine(ISD::BR_CC);
  setTargetDAGCombine(ISD::BSWAP);

  // Darwin long double math library functions have $LDBL128 appended.
  if (TM.getSubtarget<PPCSubtarget>().isDarwin()) {
    setLibcallName(RTLIB::COS_PPCF128, "cosl$LDBL128");
    setLibcallName(RTLIB::POW_PPCF128, "powl$LDBL128");
    setLibcallName(RTLIB::REM_PPCF128, "fmodl$LDBL128");
    setLibcallName(RTLIB::SIN_PPCF128, "sinl$LDBL128");
    setLibcallName(RTLIB::SQRT_PPCF128, "sqrtl$LDBL128");
  }

  computeRegisterProperties();
}

/// getByValTypeAlignment - Return the desired alignment for ByVal aggregate
/// function arguments in the caller parameter area.
unsigned PPCTargetLowering::getByValTypeAlignment(const Type *Ty) const {
  TargetMachine &TM = getTargetMachine();
  // Darwin passes everything on 4 byte boundary.
  if (TM.getSubtarget<PPCSubtarget>().isDarwin())
    return 4;
  // FIXME Elf TBD
  return 4;
}

const char *PPCTargetLowering::getTargetNodeName(unsigned Opcode) const {
  switch (Opcode) {
  default: return 0;
  case PPCISD::FSEL:            return "PPCISD::FSEL";
  case PPCISD::FCFID:           return "PPCISD::FCFID";
  case PPCISD::FCTIDZ:          return "PPCISD::FCTIDZ";
  case PPCISD::FCTIWZ:          return "PPCISD::FCTIWZ";
  case PPCISD::STFIWX:          return "PPCISD::STFIWX";
  case PPCISD::VMADDFP:         return "PPCISD::VMADDFP";
  case PPCISD::VNMSUBFP:        return "PPCISD::VNMSUBFP";
  case PPCISD::VPERM:           return "PPCISD::VPERM";
  case PPCISD::Hi:              return "PPCISD::Hi";
  case PPCISD::Lo:              return "PPCISD::Lo";
  case PPCISD::DYNALLOC:        return "PPCISD::DYNALLOC";
  case PPCISD::GlobalBaseReg:   return "PPCISD::GlobalBaseReg";
  case PPCISD::SRL:             return "PPCISD::SRL";
  case PPCISD::SRA:             return "PPCISD::SRA";
  case PPCISD::SHL:             return "PPCISD::SHL";
  case PPCISD::EXTSW_32:        return "PPCISD::EXTSW_32";
  case PPCISD::STD_32:          return "PPCISD::STD_32";
  case PPCISD::CALL_ELF:        return "PPCISD::CALL_ELF";
  case PPCISD::CALL_Macho:      return "PPCISD::CALL_Macho";
  case PPCISD::MTCTR:           return "PPCISD::MTCTR";
  case PPCISD::BCTRL_Macho:     return "PPCISD::BCTRL_Macho";
  case PPCISD::BCTRL_ELF:       return "PPCISD::BCTRL_ELF";
  case PPCISD::RET_FLAG:        return "PPCISD::RET_FLAG";
  case PPCISD::MFCR:            return "PPCISD::MFCR";
  case PPCISD::VCMP:            return "PPCISD::VCMP";
  case PPCISD::VCMPo:           return "PPCISD::VCMPo";
  case PPCISD::LBRX:            return "PPCISD::LBRX";
  case PPCISD::STBRX:           return "PPCISD::STBRX";
  case PPCISD::LARX:            return "PPCISD::LARX";
  case PPCISD::STCX:            return "PPCISD::STCX";
  case PPCISD::CMP_UNRESERVE:   return "PPCISD::CMP_UNRESERVE";
  case PPCISD::COND_BRANCH:     return "PPCISD::COND_BRANCH";
  case PPCISD::MFFS:            return "PPCISD::MFFS";
  case PPCISD::MTFSB0:          return "PPCISD::MTFSB0";
  case PPCISD::MTFSB1:          return "PPCISD::MTFSB1";
  case PPCISD::FADDRTZ:         return "PPCISD::FADDRTZ";
  case PPCISD::MTFSF:           return "PPCISD::MTFSF";
  case PPCISD::TAILCALL:        return "PPCISD::TAILCALL";
  case PPCISD::TC_RETURN:       return "PPCISD::TC_RETURN";
  }
}


MVT::ValueType
PPCTargetLowering::getSetCCResultType(const SDOperand &) const {
  return MVT::i32;
}


//===----------------------------------------------------------------------===//
// Node matching predicates, for use by the tblgen matching code.
//===----------------------------------------------------------------------===//

/// isFloatingPointZero - Return true if this is 0.0 or -0.0.
static bool isFloatingPointZero(SDOperand Op) {
  if (ConstantFPSDNode *CFP = dyn_cast<ConstantFPSDNode>(Op))
    return CFP->getValueAPF().isZero();
  else if (ISD::isEXTLoad(Op.Val) || ISD::isNON_EXTLoad(Op.Val)) {
    // Maybe this has already been legalized into the constant pool?
    if (ConstantPoolSDNode *CP = dyn_cast<ConstantPoolSDNode>(Op.getOperand(1)))
      if (ConstantFP *CFP = dyn_cast<ConstantFP>(CP->getConstVal()))
        return CFP->getValueAPF().isZero();
  }
  return false;
}

/// isConstantOrUndef - Op is either an undef node or a ConstantSDNode.  Return
/// true if Op is undef or if it matches the specified value.
static bool isConstantOrUndef(SDOperand Op, unsigned Val) {
  return Op.getOpcode() == ISD::UNDEF ||
         cast<ConstantSDNode>(Op)->getValue() == Val;
}

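// The shuffle masks checked below are BUILD_VECTORs of 16 byte indices into
// the 32-byte concatenation of the two source vectors.  vpkuhum, for example,
// keeps the odd-numbered (big-endian low) byte of each halfword, which is why
// the non-unary form looks for the pattern 1,3,5,...,31.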
/// isVPKUHUMShuffleMask - Return true if this is the shuffle mask for a
/// VPKUHUM instruction.
bool PPC::isVPKUHUMShuffleMask(SDNode *N, bool isUnary) {
  if (!isUnary) {
    for (unsigned i = 0; i != 16; ++i)
      if (!isConstantOrUndef(N->getOperand(i), i*2+1))
        return false;
  } else {
    for (unsigned i = 0; i != 8; ++i)
      if (!isConstantOrUndef(N->getOperand(i),   i*2+1) ||
          !isConstantOrUndef(N->getOperand(i+8), i*2+1))
        return false;
  }
  return true;
}

/// isVPKUWUMShuffleMask - Return true if this is the shuffle mask for a
/// VPKUWUM instruction.
bool PPC::isVPKUWUMShuffleMask(SDNode *N, bool isUnary) {
  if (!isUnary) {
    for (unsigned i = 0; i != 16; i += 2)
      if (!isConstantOrUndef(N->getOperand(i  ), i*2+2) ||
          !isConstantOrUndef(N->getOperand(i+1), i*2+3))
        return false;
  } else {
    for (unsigned i = 0; i != 8; i += 2)
      if (!isConstantOrUndef(N->getOperand(i  ), i*2+2) ||
          !isConstantOrUndef(N->getOperand(i+1), i*2+3) ||
          !isConstantOrUndef(N->getOperand(i+8), i*2+2) ||
          !isConstantOrUndef(N->getOperand(i+9), i*2+3))
        return false;
  }
  return true;
}

/// isVMerge - Common function, used to match vmrg* shuffles.
///
static bool isVMerge(SDNode *N, unsigned UnitSize,
                     unsigned LHSStart, unsigned RHSStart) {
  assert(N->getOpcode() == ISD::BUILD_VECTOR &&
         N->getNumOperands() == 16 && "PPC only supports shuffles by bytes!");
  assert((UnitSize == 1 || UnitSize == 2 || UnitSize == 4) &&
         "Unsupported merge size!");

  for (unsigned i = 0; i != 8/UnitSize; ++i)     // Step over units
    for (unsigned j = 0; j != UnitSize; ++j) {   // Step over bytes within unit
      if (!isConstantOrUndef(N->getOperand(i*UnitSize*2+j),
                             LHSStart+j+i*UnitSize) ||
          !isConstantOrUndef(N->getOperand(i*UnitSize*2+UnitSize+j),
                             RHSStart+j+i*UnitSize))
        return false;
    }
  return true;
}

/// isVMRGLShuffleMask - Return true if this is a shuffle mask suitable for
/// a VRGL* instruction with the specified unit size (1,2 or 4 bytes).
bool PPC::isVMRGLShuffleMask(SDNode *N, unsigned UnitSize, bool isUnary) {
  if (!isUnary)
    return isVMerge(N, UnitSize, 8, 24);
  return isVMerge(N, UnitSize, 8, 8);
}

/// isVMRGHShuffleMask - Return true if this is a shuffle mask suitable for
/// a VRGH* instruction with the specified unit size (1,2 or 4 bytes).
bool PPC::isVMRGHShuffleMask(SDNode *N, unsigned UnitSize, bool isUnary) {
  if (!isUnary)
    return isVMerge(N, UnitSize, 0, 16);
  return isVMerge(N, UnitSize, 0, 0);
}


/// isVSLDOIShuffleMask - If this is a vsldoi shuffle mask, return the shift
/// amount, otherwise return -1.
int PPC::isVSLDOIShuffleMask(SDNode *N, bool isUnary) {
  assert(N->getOpcode() == ISD::BUILD_VECTOR &&
         N->getNumOperands() == 16 && "PPC only supports shuffles by bytes!");
  // Find the first non-undef value in the shuffle mask.
  unsigned i;
  for (i = 0; i != 16 && N->getOperand(i).getOpcode() == ISD::UNDEF; ++i)
    /*search*/;

  if (i == 16) return -1;  // all undef.
  // Otherwise, check to see if the rest of the elements are consecutively
  // numbered from this value.
  unsigned ShiftAmt = cast<ConstantSDNode>(N->getOperand(i))->getValue();
  if (ShiftAmt < i) return -1;
  ShiftAmt -= i;

  if (!isUnary) {
    // Check the rest of the elements to see if they are consecutive.
    for (++i; i != 16; ++i)
      if (!isConstantOrUndef(N->getOperand(i), ShiftAmt+i))
        return -1;
  } else {
    // Check the rest of the elements to see if they are consecutive.
    for (++i; i != 16; ++i)
      if (!isConstantOrUndef(N->getOperand(i), (ShiftAmt+i) & 15))
        return -1;
  }

  return ShiftAmt;
}

/// isSplatShuffleMask - Return true if the specified VECTOR_SHUFFLE operand
/// specifies a splat of a single element that is suitable for input to
/// VSPLTB/VSPLTH/VSPLTW.
bool PPC::isSplatShuffleMask(SDNode *N, unsigned EltSize) {
  assert(N->getOpcode() == ISD::BUILD_VECTOR &&
         N->getNumOperands() == 16 &&
         (EltSize == 1 || EltSize == 2 || EltSize == 4));

  // This is a splat operation if each element of the permute is the same, and
  // if the value doesn't reference the second vector.
  unsigned ElementBase = 0;
  SDOperand Elt = N->getOperand(0);
  if (ConstantSDNode *EltV = dyn_cast<ConstantSDNode>(Elt))
    ElementBase = EltV->getValue();
  else
    return false;   // FIXME: Handle UNDEF elements too!

  if (cast<ConstantSDNode>(Elt)->getValue() >= 16)
    return false;

  // Check that they are consecutive.
  for (unsigned i = 1; i != EltSize; ++i) {
    if (!isa<ConstantSDNode>(N->getOperand(i)) ||
        cast<ConstantSDNode>(N->getOperand(i))->getValue() != i+ElementBase)
      return false;
  }

  assert(isa<ConstantSDNode>(Elt) && "Invalid VECTOR_SHUFFLE mask!");
  for (unsigned i = EltSize, e = 16; i != e; i += EltSize) {
    if (N->getOperand(i).getOpcode() == ISD::UNDEF) continue;
    assert(isa<ConstantSDNode>(N->getOperand(i)) &&
           "Invalid VECTOR_SHUFFLE mask!");
    for (unsigned j = 0; j != EltSize; ++j)
      if (N->getOperand(i+j) != N->getOperand(j))
        return false;
  }

  return true;
}

/// isAllNegativeZeroVector - Returns true if all elements of build_vector
/// are -0.0.
bool PPC::isAllNegativeZeroVector(SDNode *N) {
  assert(N->getOpcode() == ISD::BUILD_VECTOR);
  if (PPC::isSplatShuffleMask(N, N->getNumOperands()))
    // Check the splatted element itself; dyn_cast'ing the BUILD_VECTOR node
    // can never yield a ConstantFPSDNode.
    if (ConstantFPSDNode *CFP = dyn_cast<ConstantFPSDNode>(N->getOperand(0)))
      return CFP->getValueAPF().isNegZero();
  return false;
}

/// getVSPLTImmediate - Return the appropriate VSPLT* immediate to splat the
/// specified isSplatShuffleMask VECTOR_SHUFFLE mask.
unsigned PPC::getVSPLTImmediate(SDNode *N, unsigned EltSize) {
  assert(isSplatShuffleMask(N, EltSize));
  return cast<ConstantSDNode>(N->getOperand(0))->getValue() / EltSize;
}

/// get_VSPLTI_elt - If this is a build_vector of constants which can be formed
/// by using a vspltis[bhw] instruction of the specified element size, return
/// the constant being splatted.  The ByteSize field indicates the number of
/// bytes of each element [124] -> [bhw].
SDOperand PPC::get_VSPLTI_elt(SDNode *N, unsigned ByteSize, SelectionDAG &DAG) {
  SDOperand OpVal(0, 0);

  // If ByteSize of the splat is bigger than the element size of the
  // build_vector, then we have a case where we are checking for a splat where
  // multiple elements of the buildvector are folded together into a single
  // logical element of the splat (e.g. "vspltish 1" to splat {0,1}*8).
  unsigned EltSize = 16/N->getNumOperands();
  if (EltSize < ByteSize) {
    unsigned Multiple = ByteSize/EltSize;   // Number of BV entries per spltval.
    SDOperand UniquedVals[4];
    assert(Multiple > 1 && Multiple <= 4 && "How can this happen?");

    // See if all of the elements in the buildvector agree across.
    for (unsigned i = 0, e = N->getNumOperands(); i != e; ++i) {
      if (N->getOperand(i).getOpcode() == ISD::UNDEF) continue;
      // If the element isn't a constant, bail fully out.
      if (!isa<ConstantSDNode>(N->getOperand(i))) return SDOperand();

      if (UniquedVals[i&(Multiple-1)].Val == 0)
        UniquedVals[i&(Multiple-1)] = N->getOperand(i);
      else if (UniquedVals[i&(Multiple-1)] != N->getOperand(i))
        return SDOperand();  // no match.
    }

    // Okay, if we reached this point, UniquedVals[0..Multiple-1] contains
    // either constant or undef values that are identical for each chunk.  See
    // if these chunks can form into a larger vspltis*.

    // Check to see if all of the leading entries are either 0 or -1.  If
    // neither, then this won't fit into the immediate field.
    bool LeadingZero = true;
    bool LeadingOnes = true;
    for (unsigned i = 0; i != Multiple-1; ++i) {
      if (UniquedVals[i].Val == 0) continue;  // Must have been undefs.

      LeadingZero &= cast<ConstantSDNode>(UniquedVals[i])->isNullValue();
      LeadingOnes &= cast<ConstantSDNode>(UniquedVals[i])->isAllOnesValue();
    }
    // Finally, check the least significant entry.
    if (LeadingZero) {
      if (UniquedVals[Multiple-1].Val == 0)
        return DAG.getTargetConstant(0, MVT::i32);  // 0,0,0,undef
      int Val = cast<ConstantSDNode>(UniquedVals[Multiple-1])->getValue();
      if (Val < 16)
        return DAG.getTargetConstant(Val, MVT::i32); // 0,0,0,4 -> vspltisw(4)
    }
    if (LeadingOnes) {
      if (UniquedVals[Multiple-1].Val == 0)
        return DAG.getTargetConstant(~0U, MVT::i32); // -1,-1,-1,undef
      int Val = cast<ConstantSDNode>(UniquedVals[Multiple-1])->getSignExtended();
      if (Val >= -16)  // -1,-1,-1,-2 -> vspltisw(-2)
        return DAG.getTargetConstant(Val, MVT::i32);
    }

    return SDOperand();
  }

  // Check to see if this buildvec has a single non-undef value in its elements.
  for (unsigned i = 0, e = N->getNumOperands(); i != e; ++i) {
    if (N->getOperand(i).getOpcode() == ISD::UNDEF) continue;
    if (OpVal.Val == 0)
      OpVal = N->getOperand(i);
    else if (OpVal != N->getOperand(i))
      return SDOperand();
  }

  if (OpVal.Val == 0) return SDOperand();  // All UNDEF: use implicit def.

  unsigned ValSizeInBytes = 0;
  uint64_t Value = 0;
  if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(OpVal)) {
    Value = CN->getValue();
    ValSizeInBytes = MVT::getSizeInBits(CN->getValueType(0))/8;
  } else if (ConstantFPSDNode *CN = dyn_cast<ConstantFPSDNode>(OpVal)) {
    assert(CN->getValueType(0) == MVT::f32 && "Only one legal FP vector type!");
    Value = FloatToBits(CN->getValueAPF().convertToFloat());
    ValSizeInBytes = 4;
  }

  // If the splat value is larger than the element value, then we can never do
  // this splat.  The only case that we could fit the replicated bits into our
  // immediate field for would be zero, and we prefer to use vxor for it.
  if (ValSizeInBytes < ByteSize) return SDOperand();

  // If the element value is larger than the splat value, cut it in half and
  // check to see if the two halves are equal.  Continue doing this until we
  // get to ByteSize.  This allows us to handle 0x01010101 as 0x01.
  while (ValSizeInBytes > ByteSize) {
    ValSizeInBytes >>= 1;

    // If the top half equals the bottom half, we're still ok.
    if (((Value >> (ValSizeInBytes*8)) & ((1 << (8*ValSizeInBytes))-1)) !=
         (Value & ((1 << (8*ValSizeInBytes))-1)))
      return SDOperand();
  }

  // Properly sign extend the value.
  int ShAmt = (4-ByteSize)*8;
  int MaskVal = ((int)Value << ShAmt) >> ShAmt;

  // If this is zero, don't match, zero matches ISD::isBuildVectorAllZeros.
  if (MaskVal == 0) return SDOperand();

  // Finally, if this value fits in a 5 bit sext field, return it
  if (((MaskVal << (32-5)) >> (32-5)) == MaskVal)
    return DAG.getTargetConstant(MaskVal, MVT::i32);
  return SDOperand();
}

//===----------------------------------------------------------------------===//
// Addressing Mode Selection
//===----------------------------------------------------------------------===//

/// isIntS16Immediate - This method tests to see if the node is either a 32-bit
/// or 64-bit immediate, and if the value can be accurately represented as a
/// sign extension from a 16-bit value.  If so, this returns true and the
/// immediate.
static bool isIntS16Immediate(SDNode *N, short &Imm) {
  if (N->getOpcode() != ISD::Constant)
    return false;

  Imm = (short)cast<ConstantSDNode>(N)->getValue();
  if (N->getValueType(0) == MVT::i32)
    return Imm == (int32_t)cast<ConstantSDNode>(N)->getValue();
  else
    return Imm == (int64_t)cast<ConstantSDNode>(N)->getValue();
}
static bool isIntS16Immediate(SDOperand Op, short &Imm) {
  return isIntS16Immediate(Op.Val, Imm);
}

/// SelectAddressRegReg - Given the specified address, check to see if it
/// can be represented as an indexed [r+r] operation.  Returns false if it
/// can be more efficiently represented with [r+imm].
bool PPCTargetLowering::SelectAddressRegReg(SDOperand N, SDOperand &Base,
                                            SDOperand &Index,
                                            SelectionDAG &DAG) {
  short imm = 0;
  if (N.getOpcode() == ISD::ADD) {
    if (isIntS16Immediate(N.getOperand(1), imm))
      return false;    // r+i
    if (N.getOperand(1).getOpcode() == PPCISD::Lo)
      return false;    // r+i

    Base = N.getOperand(0);
    Index = N.getOperand(1);
    return true;
  } else if (N.getOpcode() == ISD::OR) {
    if (isIntS16Immediate(N.getOperand(1), imm))
      return false;    // r+i can fold it if we can.

    // If this is an or of disjoint bitfields, we can codegen this as an add
    // (for better address arithmetic) if the LHS and RHS of the OR are provably
    // disjoint.
    APInt LHSKnownZero, LHSKnownOne;
    APInt RHSKnownZero, RHSKnownOne;
    DAG.ComputeMaskedBits(N.getOperand(0),
                          APInt::getAllOnesValue(N.getOperand(0)
                                                 .getValueSizeInBits()),
                          LHSKnownZero, LHSKnownOne);

    if (LHSKnownZero.getBoolValue()) {
      DAG.ComputeMaskedBits(N.getOperand(1),
                            APInt::getAllOnesValue(N.getOperand(1)
                                                   .getValueSizeInBits()),
                            RHSKnownZero, RHSKnownOne);
      // If all of the bits are known zero on the LHS or RHS, the add won't
      // carry.
      if (~(LHSKnownZero | RHSKnownZero) == 0) {
        Base = N.getOperand(0);
        Index = N.getOperand(1);
        return true;
      }
    }
  }

  return false;
}

/// Returns true if the address N can be represented by a base register plus
/// a signed 16-bit displacement [r+imm], and if it is not better
/// represented as reg+reg.
bool PPCTargetLowering::SelectAddressRegImm(SDOperand N, SDOperand &Disp,
                                            SDOperand &Base, SelectionDAG &DAG){
  // If this can be more profitably realized as r+r, fail.
  if (SelectAddressRegReg(N, Disp, Base, DAG))
    return false;

  if (N.getOpcode() == ISD::ADD) {
    short imm = 0;
    if (isIntS16Immediate(N.getOperand(1), imm)) {
      Disp = DAG.getTargetConstant((int)imm & 0xFFFF, MVT::i32);
      if (FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(N.getOperand(0))) {
        Base = DAG.getTargetFrameIndex(FI->getIndex(), N.getValueType());
      } else {
        Base = N.getOperand(0);
      }
      return true;  // [r+i]
    } else if (N.getOperand(1).getOpcode() == PPCISD::Lo) {
      // Match LOAD (ADD (X, Lo(G))).
      assert(!cast<ConstantSDNode>(N.getOperand(1).getOperand(1))->getValue()
             && "Cannot handle constant offsets yet!");
      Disp = N.getOperand(1).getOperand(0);  // The global address.
      assert(Disp.getOpcode() == ISD::TargetGlobalAddress ||
             Disp.getOpcode() == ISD::TargetConstantPool ||
             Disp.getOpcode() == ISD::TargetJumpTable);
      Base = N.getOperand(0);
      return true;  // [&g+r]
    }
  } else if (N.getOpcode() == ISD::OR) {
    short imm = 0;
    if (isIntS16Immediate(N.getOperand(1), imm)) {
      // If this is an or of disjoint bitfields, we can codegen this as an add
      // (for better address arithmetic) if the LHS and RHS of the OR are
      // provably disjoint.
      APInt LHSKnownZero, LHSKnownOne;
      DAG.ComputeMaskedBits(N.getOperand(0),
                            APInt::getAllOnesValue(N.getOperand(0)
                                                   .getValueSizeInBits()),
                            LHSKnownZero, LHSKnownOne);

      if ((LHSKnownZero.getZExtValue()|~(uint64_t)imm) == ~0ULL) {
        // If all of the bits are known zero on the LHS or RHS, the add won't
        // carry.
        Base = N.getOperand(0);
        Disp = DAG.getTargetConstant((int)imm & 0xFFFF, MVT::i32);
        return true;
      }
    }
  } else if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(N)) {
    // Loading from a constant address.

    // If this address fits entirely in a 16-bit sext immediate field, codegen
    // this as "d, 0"
    short Imm;
    if (isIntS16Immediate(CN, Imm)) {
      Disp = DAG.getTargetConstant(Imm, CN->getValueType(0));
      Base = DAG.getRegister(PPC::R0, CN->getValueType(0));
      return true;
    }

    // Handle 32-bit sext immediates with LIS + addr mode.
    if (CN->getValueType(0) == MVT::i32 ||
        (int64_t)CN->getValue() == (int)CN->getValue()) {
      int Addr = (int)CN->getValue();

      // Otherwise, break this down into an LIS + disp.
      Disp = DAG.getTargetConstant((short)Addr, MVT::i32);

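      // The low half is sign-extended when it is added back in, so the high
      // half must absorb the borrow: (Base << 16) + sext(Disp) == Addr.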
      Base = DAG.getTargetConstant((Addr - (signed short)Addr) >> 16, MVT::i32);
      unsigned Opc = CN->getValueType(0) == MVT::i32 ? PPC::LIS : PPC::LIS8;
      Base = SDOperand(DAG.getTargetNode(Opc, CN->getValueType(0), Base), 0);
      return true;
    }
  }

  Disp = DAG.getTargetConstant(0, getPointerTy());
  if (FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(N))
    Base = DAG.getTargetFrameIndex(FI->getIndex(), N.getValueType());
  else
    Base = N;
  return true;  // [r+0]
}

/// SelectAddressRegRegOnly - Given the specified address, force it to be
/// represented as an indexed [r+r] operation.
bool PPCTargetLowering::SelectAddressRegRegOnly(SDOperand N, SDOperand &Base,
                                                SDOperand &Index,
                                                SelectionDAG &DAG) {
  // Check to see if we can easily represent this as an [r+r] address.  This
  // will fail if it thinks that the address is more profitably represented as
  // reg+imm, e.g. where imm = 0.
  if (SelectAddressRegReg(N, Base, Index, DAG))
    return true;

  // If the operand is an addition, always emit this as [r+r], since this is
  // better (for code size, and execution, as the memop does the add for free)
  // than emitting an explicit add.
  if (N.getOpcode() == ISD::ADD) {
    Base = N.getOperand(0);
    Index = N.getOperand(1);
    return true;
  }

  // Otherwise, do it the hard way, using R0 as the base register.
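  // (R0 in the base position of the indexed forms reads as a literal zero
  // rather than the register contents, so this is always safe.)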
  Base = DAG.getRegister(PPC::R0, N.getValueType());
  Index = N;
  return true;
}

/// SelectAddressRegImmShift - Returns true if the address N can be
/// represented by a base register plus a signed 14-bit displacement
/// [r+imm*4].  Suitable for use by STD and friends.
bool PPCTargetLowering::SelectAddressRegImmShift(SDOperand N, SDOperand &Disp,
                                                 SDOperand &Base,
                                                 SelectionDAG &DAG) {
  // If this can be more profitably realized as r+r, fail.
  if (SelectAddressRegReg(N, Disp, Base, DAG))
    return false;

  if (N.getOpcode() == ISD::ADD) {
    short imm = 0;
    if (isIntS16Immediate(N.getOperand(1), imm) && (imm & 3) == 0) {
      Disp = DAG.getTargetConstant(((int)imm & 0xFFFF) >> 2, MVT::i32);
      if (FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(N.getOperand(0))) {
        Base = DAG.getTargetFrameIndex(FI->getIndex(), N.getValueType());
      } else {
        Base = N.getOperand(0);
      }
      return true;  // [r+i]
    } else if (N.getOperand(1).getOpcode() == PPCISD::Lo) {
      // Match LOAD (ADD (X, Lo(G))).
      assert(!cast<ConstantSDNode>(N.getOperand(1).getOperand(1))->getValue()
             && "Cannot handle constant offsets yet!");
      Disp = N.getOperand(1).getOperand(0);  // The global address.
      assert(Disp.getOpcode() == ISD::TargetGlobalAddress ||
             Disp.getOpcode() == ISD::TargetConstantPool ||
             Disp.getOpcode() == ISD::TargetJumpTable);
      Base = N.getOperand(0);
      return true;  // [&g+r]
    }
  } else if (N.getOpcode() == ISD::OR) {
    short imm = 0;
    if (isIntS16Immediate(N.getOperand(1), imm) && (imm & 3) == 0) {
      // If this is an or of disjoint bitfields, we can codegen this as an add
      // (for better address arithmetic) if the LHS and RHS of the OR are
      // provably disjoint.
      APInt LHSKnownZero, LHSKnownOne;
      DAG.ComputeMaskedBits(N.getOperand(0),
                            APInt::getAllOnesValue(N.getOperand(0)
                                                   .getValueSizeInBits()),
                            LHSKnownZero, LHSKnownOne);
      if ((LHSKnownZero.getZExtValue()|~(uint64_t)imm) == ~0ULL) {
        // If all of the bits are known zero on the LHS or RHS, the add won't
        // carry.
        Base = N.getOperand(0);
        Disp = DAG.getTargetConstant(((int)imm & 0xFFFF) >> 2, MVT::i32);
        return true;
      }
    }
  } else if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(N)) {
    // Loading from a constant address.  Verify low two bits are clear.
    if ((CN->getValue() & 3) == 0) {
      // If this address fits entirely in a 14-bit sext immediate field, codegen
      // this as "d, 0"
      short Imm;
      if (isIntS16Immediate(CN, Imm)) {
        Disp = DAG.getTargetConstant((unsigned short)Imm >> 2, getPointerTy());
        Base = DAG.getRegister(PPC::R0, CN->getValueType(0));
        return true;
      }

      // Fold the low-part of 32-bit absolute addresses into addr mode.
      if (CN->getValueType(0) == MVT::i32 ||
          (int64_t)CN->getValue() == (int)CN->getValue()) {
        int Addr = (int)CN->getValue();

        // Otherwise, break this down into an LIS + disp.
        Disp = DAG.getTargetConstant((short)Addr >> 2, MVT::i32);

        Base = DAG.getTargetConstant((Addr-(signed short)Addr) >> 16, MVT::i32);
        unsigned Opc = CN->getValueType(0) == MVT::i32 ? PPC::LIS : PPC::LIS8;
        Base = SDOperand(DAG.getTargetNode(Opc, CN->getValueType(0), Base), 0);
        return true;
      }
    }
  }

  Disp = DAG.getTargetConstant(0, getPointerTy());
  if (FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(N))
    Base = DAG.getTargetFrameIndex(FI->getIndex(), N.getValueType());
  else
    Base = N;
  return true;  // [r+0]
}


/// getPreIndexedAddressParts - returns true by value, base pointer and
/// offset pointer and addressing mode by reference if the node's address
/// can be legally represented as pre-indexed load / store address.
bool PPCTargetLowering::getPreIndexedAddressParts(SDNode *N, SDOperand &Base,
                                                  SDOperand &Offset,
                                                  ISD::MemIndexedMode &AM,
                                                  SelectionDAG &DAG) {
  // Disabled by default for now.
  if (!EnablePPCPreinc) return false;

  SDOperand Ptr;
  MVT::ValueType VT;
  if (LoadSDNode *LD = dyn_cast<LoadSDNode>(N)) {
    Ptr = LD->getBasePtr();
    VT = LD->getMemoryVT();
  } else if (StoreSDNode *ST = dyn_cast<StoreSDNode>(N)) {
    ST = ST;
    Ptr = ST->getBasePtr();
    VT = ST->getMemoryVT();
  } else
    return false;

  // PowerPC doesn't have preinc load/store instructions for vectors.
  if (MVT::isVector(VT))
    return false;

  // TODO: Check reg+reg first.

  // LDU/STU use reg+imm*4, others use reg+imm.
  if (VT != MVT::i64) {
    // reg + imm
    if (!SelectAddressRegImm(Ptr, Offset, Base, DAG))
      return false;
  } else {
    // reg + imm * 4.
    if (!SelectAddressRegImmShift(Ptr, Offset, Base, DAG))
      return false;
  }

  if (LoadSDNode *LD = dyn_cast<LoadSDNode>(N)) {
    // PPC64 doesn't have lwau, but it does have lwaux.  Reject preinc load of
    // sext i32 to i64 when addr mode is r+i.
    if (LD->getValueType(0) == MVT::i64 && LD->getMemoryVT() == MVT::i32 &&
        LD->getExtensionType() == ISD::SEXTLOAD &&
        isa<ConstantSDNode>(Offset))
      return false;
  }

  AM = ISD::PRE_INC;
  return true;
}

//===----------------------------------------------------------------------===//
//  LowerOperation implementation
//===----------------------------------------------------------------------===//

SDOperand PPCTargetLowering::LowerConstantPool(SDOperand Op,
                                               SelectionDAG &DAG) {
  MVT::ValueType PtrVT = Op.getValueType();
  ConstantPoolSDNode *CP = cast<ConstantPoolSDNode>(Op);
  Constant *C = CP->getConstVal();
  SDOperand CPI = DAG.getTargetConstantPool(C, PtrVT, CP->getAlignment());
  SDOperand Zero = DAG.getConstant(0, PtrVT);

  const TargetMachine &TM = DAG.getTarget();

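  // PPCISD::Hi/Lo materialize the high and low 16 bits of the address (the
  // ha16()/lo16() fixups on the lis/la instruction pair).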
  SDOperand Hi = DAG.getNode(PPCISD::Hi, PtrVT, CPI, Zero);
  SDOperand Lo = DAG.getNode(PPCISD::Lo, PtrVT, CPI, Zero);

  // If this is a non-darwin platform, we don't support non-static relo models
  // yet.
  if (TM.getRelocationModel() == Reloc::Static ||
      !TM.getSubtarget<PPCSubtarget>().isDarwin()) {
    // Generate non-pic code that has direct accesses to the constant pool.
    // The address of the global is just (hi(&g)+lo(&g)).
    return DAG.getNode(ISD::ADD, PtrVT, Hi, Lo);
  }

  if (TM.getRelocationModel() == Reloc::PIC_) {
    // With PIC, the first instruction is actually "GR+hi(&G)".
    Hi = DAG.getNode(ISD::ADD, PtrVT,
                     DAG.getNode(PPCISD::GlobalBaseReg, PtrVT), Hi);
  }

  Lo = DAG.getNode(ISD::ADD, PtrVT, Hi, Lo);
  return Lo;
}

SDOperand PPCTargetLowering::LowerJumpTable(SDOperand Op, SelectionDAG &DAG) {
  MVT::ValueType PtrVT = Op.getValueType();
  JumpTableSDNode *JT = cast<JumpTableSDNode>(Op);
  SDOperand JTI = DAG.getTargetJumpTable(JT->getIndex(), PtrVT);
  SDOperand Zero = DAG.getConstant(0, PtrVT);

  const TargetMachine &TM = DAG.getTarget();

  SDOperand Hi = DAG.getNode(PPCISD::Hi, PtrVT, JTI, Zero);
  SDOperand Lo = DAG.getNode(PPCISD::Lo, PtrVT, JTI, Zero);

  // If this is a non-darwin platform, we don't support non-static relo models
  // yet.
  if (TM.getRelocationModel() == Reloc::Static ||
      !TM.getSubtarget<PPCSubtarget>().isDarwin()) {
    // Generate non-pic code that has direct accesses to the constant pool.
    // The address of the global is just (hi(&g)+lo(&g)).
    return DAG.getNode(ISD::ADD, PtrVT, Hi, Lo);
  }

  if (TM.getRelocationModel() == Reloc::PIC_) {
    // With PIC, the first instruction is actually "GR+hi(&G)".
    Hi = DAG.getNode(ISD::ADD, PtrVT,
                     DAG.getNode(PPCISD::GlobalBaseReg, PtrVT), Hi);
  }

  Lo = DAG.getNode(ISD::ADD, PtrVT, Hi, Lo);
  return Lo;
}

SDOperand PPCTargetLowering::LowerGlobalTLSAddress(SDOperand Op,
                                                   SelectionDAG &DAG) {
  assert(0 && "TLS not implemented for PPC.");
  return SDOperand();  // Not reached
}

SDOperand PPCTargetLowering::LowerGlobalAddress(SDOperand Op,
                                                SelectionDAG &DAG) {
  MVT::ValueType PtrVT = Op.getValueType();
  GlobalAddressSDNode *GSDN = cast<GlobalAddressSDNode>(Op);
  GlobalValue *GV = GSDN->getGlobal();
  SDOperand GA = DAG.getTargetGlobalAddress(GV, PtrVT, GSDN->getOffset());
  // If it's a debug information descriptor, don't mess with it.
  if (DAG.isVerifiedDebugInfoDesc(Op))
    return GA;
  SDOperand Zero = DAG.getConstant(0, PtrVT);

  const TargetMachine &TM = DAG.getTarget();

  SDOperand Hi = DAG.getNode(PPCISD::Hi, PtrVT, GA, Zero);
  SDOperand Lo = DAG.getNode(PPCISD::Lo, PtrVT, GA, Zero);

  // If this is a non-darwin platform, we don't support non-static relo models
  // yet.
  if (TM.getRelocationModel() == Reloc::Static ||
      !TM.getSubtarget<PPCSubtarget>().isDarwin()) {
    // Generate non-pic code that has direct accesses to globals.
    // The address of the global is just (hi(&g)+lo(&g)).
    return DAG.getNode(ISD::ADD, PtrVT, Hi, Lo);
  }

  if (TM.getRelocationModel() == Reloc::PIC_) {
    // With PIC, the first instruction is actually "GR+hi(&G)".
    Hi = DAG.getNode(ISD::ADD, PtrVT,
                     DAG.getNode(PPCISD::GlobalBaseReg, PtrVT), Hi);
  }

  Lo = DAG.getNode(ISD::ADD, PtrVT, Hi, Lo);

  if (!TM.getSubtarget<PPCSubtarget>().hasLazyResolverStub(GV))
    return Lo;

  // If the global is weak or external, we have to go through the lazy
  // resolution stub.
  return DAG.getLoad(PtrVT, DAG.getEntryNode(), Lo, NULL, 0);
}

SDOperand PPCTargetLowering::LowerSETCC(SDOperand Op, SelectionDAG &DAG) {
  ISD::CondCode CC = cast<CondCodeSDNode>(Op.getOperand(2))->get();

  // If we're comparing for equality to zero, expose the fact that this is
  // implemented as a ctlz/srl pair on ppc, so that the dag combiner can
  // fold the new nodes.
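  // (e.g. (i32 seteq X, 0) becomes (srl (ctlz X), 5): cntlzw yields 32 only
  // for X == 0, so the shifted result is exactly the 0/1 compare result.)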
  if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op.getOperand(1))) {
    if (C->isNullValue() && CC == ISD::SETEQ) {
      MVT::ValueType VT = Op.getOperand(0).getValueType();
      SDOperand Zext = Op.getOperand(0);
      if (VT < MVT::i32) {
        VT = MVT::i32;
        Zext = DAG.getNode(ISD::ZERO_EXTEND, VT, Op.getOperand(0));
      }
      unsigned Log2b = Log2_32(MVT::getSizeInBits(VT));
      SDOperand Clz = DAG.getNode(ISD::CTLZ, VT, Zext);
      SDOperand Scc = DAG.getNode(ISD::SRL, VT, Clz,
                                  DAG.getConstant(Log2b, MVT::i32));
      return DAG.getNode(ISD::TRUNCATE, MVT::i32, Scc);
    }
    // Leave comparisons against 0 and -1 alone for now, since they're usually
    // optimized.  FIXME: revisit this when we can custom lower all setcc
    // optimizations.
    if (C->isAllOnesValue() || C->isNullValue())
      return SDOperand();
  }

  // If we have an integer seteq/setne, turn it into a compare against zero
  // by xor'ing the rhs with the lhs, which is faster than setting a
  // condition register, reading it back out, and masking the correct bit.  The
  // normal approach here uses sub to do this instead of xor.  Using xor exposes
  // the result to other bit-twiddling opportunities.
  MVT::ValueType LHSVT = Op.getOperand(0).getValueType();
  if (MVT::isInteger(LHSVT) && (CC == ISD::SETEQ || CC == ISD::SETNE)) {
    MVT::ValueType VT = Op.getValueType();
    SDOperand Sub = DAG.getNode(ISD::XOR, LHSVT, Op.getOperand(0),
                                Op.getOperand(1));
    return DAG.getSetCC(VT, Sub, DAG.getConstant(0, LHSVT), CC);
  }
  return SDOperand();
}

SDOperand PPCTargetLowering::LowerVAARG(SDOperand Op, SelectionDAG &DAG,
                                        int VarArgsFrameIndex,
                                        int VarArgsStackOffset,
                                        unsigned VarArgsNumGPR,
                                        unsigned VarArgsNumFPR,
                                        const PPCSubtarget &Subtarget) {

  assert(0 && "VAARG in ELF32 ABI not implemented yet!");
  return SDOperand();  // Not reached
}

SDOperand PPCTargetLowering::LowerVASTART(SDOperand Op, SelectionDAG &DAG,
                                          int VarArgsFrameIndex,
                                          int VarArgsStackOffset,
                                          unsigned VarArgsNumGPR,
                                          unsigned VarArgsNumFPR,
                                          const PPCSubtarget &Subtarget) {

  if (Subtarget.isMachoABI()) {
    // vastart just stores the address of the VarArgsFrameIndex slot into the
    // memory location argument.
    MVT::ValueType PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
    SDOperand FR = DAG.getFrameIndex(VarArgsFrameIndex, PtrVT);
    const Value *SV = cast<SrcValueSDNode>(Op.getOperand(2))->getValue();
    return DAG.getStore(Op.getOperand(0), FR, Op.getOperand(1), SV, 0);
  }

  // For ELF 32 ABI we follow the layout of the va_list struct.
  // We assume the given va_list has already been allocated.
1236 //
1237 // typedef struct {
1238 // char gpr; /* index into the array of 8 GPRs
1239 // * stored in the register save area
1240 // * gpr=0 corresponds to r3,
1241 // * gpr=1 to r4, etc.
1242 // */
1243 // char fpr; /* index into the array of 8 FPRs
1244 // * stored in the register save area
1245 // * fpr=0 corresponds to f1,
1246 // * fpr=1 to f2, etc.
1247 // */
1248 // char *overflow_arg_area;
1249 // /* location on stack that holds
1250 // * the next overflow argument
1251 // */
1252 // char *reg_save_area;
1253 // /* where r3:r10 and f1:f8 (if saved)
1254 // * are stored
1255 // */
1256 // } va_list[1];
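  //
  // For illustration: with 32-bit pointers, the stores below write gpr at
  // byte offset 0, fpr at 1, overflow_arg_area at 4, and reg_save_area at 8,
  // which is what the FPROffset/StackOffset/FrameOffset constants encode.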


  SDOperand ArgGPR = DAG.getConstant(VarArgsNumGPR, MVT::i8);
  SDOperand ArgFPR = DAG.getConstant(VarArgsNumFPR, MVT::i8);


  MVT::ValueType PtrVT = DAG.getTargetLoweringInfo().getPointerTy();

  SDOperand StackOffsetFI = DAG.getFrameIndex(VarArgsStackOffset, PtrVT);
  SDOperand FR = DAG.getFrameIndex(VarArgsFrameIndex, PtrVT);

  uint64_t FrameOffset = MVT::getSizeInBits(PtrVT)/8;
  SDOperand ConstFrameOffset = DAG.getConstant(FrameOffset, PtrVT);

  uint64_t StackOffset = MVT::getSizeInBits(PtrVT)/8 - 1;
  SDOperand ConstStackOffset = DAG.getConstant(StackOffset, PtrVT);

  uint64_t FPROffset = 1;
  SDOperand ConstFPROffset = DAG.getConstant(FPROffset, PtrVT);

  const Value *SV = cast<SrcValueSDNode>(Op.getOperand(2))->getValue();

  // Store first byte: number of int regs.
  SDOperand firstStore = DAG.getStore(Op.getOperand(0), ArgGPR,
                                      Op.getOperand(1), SV, 0);
  uint64_t nextOffset = FPROffset;
  SDOperand nextPtr = DAG.getNode(ISD::ADD, PtrVT, Op.getOperand(1),
                                  ConstFPROffset);

  // Store second byte: number of float regs.
  SDOperand secondStore =
    DAG.getStore(firstStore, ArgFPR, nextPtr, SV, nextOffset);
  nextOffset += StackOffset;
  nextPtr = DAG.getNode(ISD::ADD, PtrVT, nextPtr, ConstStackOffset);

  // Store second word: arguments given on stack.
  SDOperand thirdStore =
    DAG.getStore(secondStore, StackOffsetFI, nextPtr, SV, nextOffset);
  nextOffset += FrameOffset;
  nextPtr = DAG.getNode(ISD::ADD, PtrVT, nextPtr, ConstFrameOffset);

  // Store third word: arguments given in registers.
  return DAG.getStore(thirdStore, FR, nextPtr, SV, nextOffset);

}

#include "PPCGenCallingConv.inc"

/// GetFPR - Get the set of FP registers that should be allocated for
/// arguments, depending on which subtarget is selected.
static const unsigned *GetFPR(const PPCSubtarget &Subtarget) {
  if (Subtarget.isMachoABI()) {
    static const unsigned FPR[] = {
      PPC::F1, PPC::F2, PPC::F3, PPC::F4, PPC::F5, PPC::F6, PPC::F7,
      PPC::F8, PPC::F9, PPC::F10, PPC::F11, PPC::F12, PPC::F13
    };
    return FPR;
  }


  static const unsigned FPR[] = {
    PPC::F1, PPC::F2, PPC::F3, PPC::F4, PPC::F5, PPC::F6, PPC::F7,
    PPC::F8
  };
  return FPR;
}

/// CalculateStackSlotSize - Calculates the size reserved for this argument on
/// the stack.
static unsigned CalculateStackSlotSize(SDOperand Arg, SDOperand Flag,
                                       bool isVarArg, unsigned PtrByteSize) {
  MVT::ValueType ArgVT = Arg.getValueType();
  ISD::ArgFlagsTy Flags = cast<ARG_FLAGSSDNode>(Flag)->getArgFlags();
  unsigned ArgSize = MVT::getSizeInBits(ArgVT)/8;
  if (Flags.isByVal())
    ArgSize = Flags.getByValSize();
  ArgSize = ((ArgSize + PtrByteSize - 1)/PtrByteSize) * PtrByteSize;

  return ArgSize;
}
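// For example, with PtrByteSize == 4 a 13-byte by-value aggregate is
// rounded up to a 16-byte slot, while a plain i32 occupies 4 bytes.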

SDOperand
PPCTargetLowering::LowerFORMAL_ARGUMENTS(SDOperand Op,
                                         SelectionDAG &DAG,
                                         int &VarArgsFrameIndex,
                                         int &VarArgsStackOffset,
                                         unsigned &VarArgsNumGPR,
                                         unsigned &VarArgsNumFPR,
                                         const PPCSubtarget &Subtarget) {
  // TODO: add a description of the PPC stack frame format, or at least some
  // docs.
  //
  MachineFunction &MF = DAG.getMachineFunction();
  MachineFrameInfo *MFI = MF.getFrameInfo();
  MachineRegisterInfo &RegInfo = MF.getRegInfo();
  SmallVector<SDOperand, 8> ArgValues;
  SDOperand Root = Op.getOperand(0);
  bool isVarArg = cast<ConstantSDNode>(Op.getOperand(2))->getValue() != 0;

  MVT::ValueType PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
  bool isPPC64 = PtrVT == MVT::i64;
  bool isMachoABI = Subtarget.isMachoABI();
  bool isELF32_ABI = Subtarget.isELF32_ABI();
  // Potential tail calls could cause overwriting of argument stack slots.
  unsigned CC = MF.getFunction()->getCallingConv();
  bool isImmutable = !(PerformTailCallOpt && (CC==CallingConv::Fast));
  unsigned PtrByteSize = isPPC64 ? 8 : 4;

  unsigned ArgOffset = PPCFrameInfo::getLinkageSize(isPPC64, isMachoABI);
  // Area that is at least reserved in the caller of this function.
  unsigned MinReservedArea = ArgOffset;

  static const unsigned GPR_32[] = {           // 32-bit registers.
    PPC::R3, PPC::R4, PPC::R5, PPC::R6,
    PPC::R7, PPC::R8, PPC::R9, PPC::R10,
  };
  static const unsigned GPR_64[] = {           // 64-bit registers.
    PPC::X3, PPC::X4, PPC::X5, PPC::X6,
    PPC::X7, PPC::X8, PPC::X9, PPC::X10,
  };

  static const unsigned *FPR = GetFPR(Subtarget);

  static const unsigned VR[] = {
    PPC::V2, PPC::V3, PPC::V4, PPC::V5, PPC::V6, PPC::V7, PPC::V8,
    PPC::V9, PPC::V10, PPC::V11, PPC::V12, PPC::V13
  };

  const unsigned Num_GPR_Regs = array_lengthof(GPR_32);
  const unsigned Num_FPR_Regs = isMachoABI ? 13 : 8;
  const unsigned Num_VR_Regs  = array_lengthof(VR);

  unsigned GPR_idx = 0, FPR_idx = 0, VR_idx = 0;

  const unsigned *GPR = isPPC64 ? GPR_64 : GPR_32;

  // In 32-bit non-varargs functions, the stack space for vectors is after the
  // stack space for non-vectors.  We do not use this space unless we have
  // too many vectors to fit in registers, something that only occurs in
  // constructed examples; but we have to walk the arglist to figure that
  // out... for the pathological case, compute VecArgOffset as the start of
  // the vector parameter area.  Computing VecArgOffset is the entire point
  // of the following loop.
  // Altivec is not mentioned in the ppc32 ELF Supplement, so I'm not trying
  // to handle ELF here.
  unsigned VecArgOffset = ArgOffset;
  if (!isVarArg && !isPPC64) {
    for (unsigned ArgNo = 0, e = Op.Val->getNumValues()-1; ArgNo != e;
         ++ArgNo) {
      MVT::ValueType ObjectVT = Op.getValue(ArgNo).getValueType();
      unsigned ObjSize = MVT::getSizeInBits(ObjectVT)/8;
      ISD::ArgFlagsTy Flags =
        cast<ARG_FLAGSSDNode>(Op.getOperand(ArgNo+3))->getArgFlags();

      if (Flags.isByVal()) {
        // ObjSize is the true size; ArgSize is rounded up to a multiple of
        // registers.
        ObjSize = Flags.getByValSize();
        unsigned ArgSize =
          ((ObjSize + PtrByteSize - 1)/PtrByteSize) * PtrByteSize;
        VecArgOffset += ArgSize;
        continue;
      }

      switch(ObjectVT) {
      default: assert(0 && "Unhandled argument type!");
      case MVT::i32:
      case MVT::f32:
        VecArgOffset += isPPC64 ? 8 : 4;
        break;
      case MVT::i64:  // PPC64
      case MVT::f64:
        VecArgOffset += 8;
        break;
      case MVT::v4f32:
      case MVT::v4i32:
      case MVT::v8i16:
      case MVT::v16i8:
        // Nothing to do; we're only looking at non-vector args here.
        break;
      }
    }
  }
  // We've found where the vector parameter area in memory is.  Skip the
  // first 12 parameters; these don't use that memory.
  VecArgOffset = ((VecArgOffset+15)/16)*16;
  VecArgOffset += 12*16;
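  // As a sketch: with a 24-byte linkage area and two i32 fixed arguments,
  // VecArgOffset is 24 + 4 + 4 = 32, already 16-byte aligned, and becomes
  // 32 + 12*16 = 224, the first offset a 13th vector argument could use.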

  // Add DAG nodes to load the arguments or copy them out of registers.  On
  // entry to a function on PPC, the arguments start after the linkage area,
  // although the first ones are often in registers.
  //
  // In the ELF 32 ABI, GPRs and stack are double-word aligned: an argument
  // represented with two words (long long or double) must be copied to an
  // even GPR_idx value or to an even ArgOffset value.

  SmallVector<SDOperand, 8> MemOps;
  unsigned nAltivecParamsAtEnd = 0;
  for (unsigned ArgNo = 0, e = Op.Val->getNumValues()-1; ArgNo != e; ++ArgNo) {
    SDOperand ArgVal;
    bool needsLoad = false;
    MVT::ValueType ObjectVT = Op.getValue(ArgNo).getValueType();
    unsigned ObjSize = MVT::getSizeInBits(ObjectVT)/8;
    unsigned ArgSize = ObjSize;
    ISD::ArgFlagsTy Flags =
      cast<ARG_FLAGSSDNode>(Op.getOperand(ArgNo+3))->getArgFlags();
    // See if the next argument requires stack alignment in ELF.
    bool Align = Flags.isSplit();

    unsigned CurArgOffset = ArgOffset;

    // Varargs or 64-bit Altivec parameters are padded to a 16-byte boundary.
    if (ObjectVT==MVT::v4f32 || ObjectVT==MVT::v4i32 ||
        ObjectVT==MVT::v8i16 || ObjectVT==MVT::v16i8) {
      if (isVarArg || isPPC64) {
        MinReservedArea = ((MinReservedArea+15)/16)*16;
        MinReservedArea += CalculateStackSlotSize(Op.getValue(ArgNo),
                                                  Op.getOperand(ArgNo+3),
                                                  isVarArg,
                                                  PtrByteSize);
      } else  nAltivecParamsAtEnd++;
    } else
      // Calculate the minimum reserved area.
      MinReservedArea += CalculateStackSlotSize(Op.getValue(ArgNo),
                                                Op.getOperand(ArgNo+3),
                                                isVarArg,
                                                PtrByteSize);

    // FIXME: alignment for ELF may not be right.
    // FIXME: the codegen can be much improved in some cases.
    // We do not have to keep everything in memory.
    if (Flags.isByVal()) {
      // ObjSize is the true size; ArgSize is rounded up to a multiple of
      // registers.
      ObjSize = Flags.getByValSize();
      ArgSize = ((ObjSize + PtrByteSize - 1)/PtrByteSize) * PtrByteSize;
      // Double-word align in ELF.
      if (Align && isELF32_ABI) GPR_idx += (GPR_idx % 2);
      // Objects of size 1 and 2 are right-justified; everything else is
      // left-justified.  This means the memory address is adjusted forwards.
      if (ObjSize==1 || ObjSize==2) {
        CurArgOffset = CurArgOffset + (4 - ObjSize);
      }
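      // For example, a 2-byte struct whose 4-byte slot starts at offset 24
      // is placed at bytes 26..27, right-justified within the slot.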
      // The value of the object is its address.
      int FI = MFI->CreateFixedObject(ObjSize, CurArgOffset);
      SDOperand FIN = DAG.getFrameIndex(FI, PtrVT);
      ArgValues.push_back(FIN);
      if (ObjSize==1 || ObjSize==2) {
        if (GPR_idx != Num_GPR_Regs) {
          unsigned VReg = RegInfo.createVirtualRegister(&PPC::GPRCRegClass);
          RegInfo.addLiveIn(GPR[GPR_idx], VReg);
          SDOperand Val = DAG.getCopyFromReg(Root, VReg, PtrVT);
          SDOperand Store = DAG.getTruncStore(Val.getValue(1), Val, FIN,
                                      NULL, 0, ObjSize==1 ? MVT::i8 : MVT::i16);
          MemOps.push_back(Store);
          ++GPR_idx;
          if (isMachoABI) ArgOffset += PtrByteSize;
        } else {
          ArgOffset += PtrByteSize;
        }
        continue;
      }
      for (unsigned j = 0; j < ArgSize; j += PtrByteSize) {
        // Store whatever pieces of the object are in registers to memory.
        // ArgVal will be the address of the beginning of the object.
        if (GPR_idx != Num_GPR_Regs) {
          unsigned VReg = RegInfo.createVirtualRegister(&PPC::GPRCRegClass);
          RegInfo.addLiveIn(GPR[GPR_idx], VReg);
          int FI = MFI->CreateFixedObject(PtrByteSize, ArgOffset);
          SDOperand FIN = DAG.getFrameIndex(FI, PtrVT);
          SDOperand Val = DAG.getCopyFromReg(Root, VReg, PtrVT);
          SDOperand Store = DAG.getStore(Val.getValue(1), Val, FIN, NULL, 0);
          MemOps.push_back(Store);
          ++GPR_idx;
          if (isMachoABI) ArgOffset += PtrByteSize;
        } else {
          ArgOffset += ArgSize - (ArgOffset-CurArgOffset);
          break;
        }
      }
      continue;
    }

    switch (ObjectVT) {
    default: assert(0 && "Unhandled argument type!");
    case MVT::i32:
      if (!isPPC64) {
        // Double-word align in ELF.
        if (Align && isELF32_ABI) GPR_idx += (GPR_idx % 2);

        if (GPR_idx != Num_GPR_Regs) {
          unsigned VReg = RegInfo.createVirtualRegister(&PPC::GPRCRegClass);
          RegInfo.addLiveIn(GPR[GPR_idx], VReg);
          ArgVal = DAG.getCopyFromReg(Root, VReg, MVT::i32);
          ++GPR_idx;
        } else {
          needsLoad = true;
          ArgSize = PtrByteSize;
        }
        // Stack align in ELF.
        if (needsLoad && Align && isELF32_ABI)
          ArgOffset += ((ArgOffset/4) % 2) * PtrByteSize;
        // All int arguments reserve stack space in the Macho ABI.
        if (isMachoABI || needsLoad) ArgOffset += PtrByteSize;
        break;
      }
      // FALLTHROUGH
    case MVT::i64:  // PPC64
      if (GPR_idx != Num_GPR_Regs) {
        unsigned VReg = RegInfo.createVirtualRegister(&PPC::G8RCRegClass);
        RegInfo.addLiveIn(GPR[GPR_idx], VReg);
        ArgVal = DAG.getCopyFromReg(Root, VReg, MVT::i64);

        if (ObjectVT == MVT::i32) {
          // PPC64 passes i8, i16, and i32 values in i64 registers.  Promote
          // the value to MVT::i64 and then truncate to the correct register
          // size.
          if (Flags.isSExt())
            ArgVal = DAG.getNode(ISD::AssertSext, MVT::i64, ArgVal,
                                 DAG.getValueType(ObjectVT));
          else if (Flags.isZExt())
            ArgVal = DAG.getNode(ISD::AssertZext, MVT::i64, ArgVal,
                                 DAG.getValueType(ObjectVT));

          ArgVal = DAG.getNode(ISD::TRUNCATE, MVT::i32, ArgVal);
        }

        ++GPR_idx;
      } else {
        needsLoad = true;
      }
      // All int arguments reserve stack space in the Macho ABI.
      if (isMachoABI || needsLoad) ArgOffset += 8;
      break;

    case MVT::f32:
    case MVT::f64:
      // Every 4 bytes of argument space consumes one of the GPRs available
      // for argument passing.
      if (GPR_idx != Num_GPR_Regs && isMachoABI) {
        ++GPR_idx;
        if (ObjSize == 8 && GPR_idx != Num_GPR_Regs && !isPPC64)
          ++GPR_idx;
      }
      if (FPR_idx != Num_FPR_Regs) {
        unsigned VReg;
        if (ObjectVT == MVT::f32)
          VReg = RegInfo.createVirtualRegister(&PPC::F4RCRegClass);
        else
          VReg = RegInfo.createVirtualRegister(&PPC::F8RCRegClass);
        RegInfo.addLiveIn(FPR[FPR_idx], VReg);
        ArgVal = DAG.getCopyFromReg(Root, VReg, ObjectVT);
        ++FPR_idx;
      } else {
        needsLoad = true;
      }

      // Stack align in ELF.
      if (needsLoad && Align && isELF32_ABI)
        ArgOffset += ((ArgOffset/4) % 2) * PtrByteSize;
      // All FP arguments reserve stack space in the Macho ABI.
      if (isMachoABI || needsLoad) ArgOffset += isPPC64 ? 8 : ObjSize;
      break;
    case MVT::v4f32:
    case MVT::v4i32:
    case MVT::v8i16:
    case MVT::v16i8:
      // Note that vector arguments in registers don't reserve stack space,
      // except in varargs functions.
      if (VR_idx != Num_VR_Regs) {
        unsigned VReg = RegInfo.createVirtualRegister(&PPC::VRRCRegClass);
        RegInfo.addLiveIn(VR[VR_idx], VReg);
        ArgVal = DAG.getCopyFromReg(Root, VReg, ObjectVT);
        if (isVarArg) {
          while ((ArgOffset % 16) != 0) {
            ArgOffset += PtrByteSize;
            if (GPR_idx != Num_GPR_Regs)
              GPR_idx++;
          }
          ArgOffset += 16;
          GPR_idx = std::min(GPR_idx+4, Num_GPR_Regs);
        }
        ++VR_idx;
      } else {
        if (!isVarArg && !isPPC64) {
          // Vectors go after all the non-vectors.
          CurArgOffset = VecArgOffset;
          VecArgOffset += 16;
        } else {
          // Vectors are aligned.
          ArgOffset = ((ArgOffset+15)/16)*16;
          CurArgOffset = ArgOffset;
          ArgOffset += 16;
        }
        needsLoad = true;
      }
      break;
    }

    // We need to load the argument to a virtual register if we determined
    // above that we ran out of physical registers of the appropriate type.
    if (needsLoad) {
      int FI = MFI->CreateFixedObject(ObjSize,
                                      CurArgOffset + (ArgSize - ObjSize),
                                      isImmutable);
      SDOperand FIN = DAG.getFrameIndex(FI, PtrVT);
      ArgVal = DAG.getLoad(ObjectVT, Root, FIN, NULL, 0);
    }

    ArgValues.push_back(ArgVal);
  }

  // Set the size that is at least reserved in the caller of this function.
  // A tail-call-optimized function's reserved stack space needs to be aligned
  // so that taking the difference between two stack areas will result in an
  // aligned stack.
  PPCFunctionInfo *FI = MF.getInfo<PPCFunctionInfo>();
  // Add the Altivec parameters at the end, if needed.
  if (nAltivecParamsAtEnd) {
    MinReservedArea = ((MinReservedArea+15)/16)*16;
    MinReservedArea += 16*nAltivecParamsAtEnd;
  }
  MinReservedArea =
    std::max(MinReservedArea,
             PPCFrameInfo::getMinCallFrameSize(isPPC64, isMachoABI));
  unsigned TargetAlign = DAG.getMachineFunction().getTarget().getFrameInfo()->
    getStackAlignment();
  unsigned AlignMask = TargetAlign-1;
  MinReservedArea = (MinReservedArea + AlignMask) & ~AlignMask;
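  // For example, with a 16-byte stack alignment AlignMask is 15, so a
  // MinReservedArea of 52 would be rounded up to 64 here.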
  FI->setMinReservedArea(MinReservedArea);

  // If the function takes a variable number of arguments, make a frame index
  // for the start of the first vararg value... for expansion of
  // llvm.va_start.
  if (isVarArg) {

    int depth;
    if (isELF32_ABI) {
      VarArgsNumGPR = GPR_idx;
      VarArgsNumFPR = FPR_idx;

      // Make room for Num_GPR_Regs, Num_FPR_Regs and for a possible frame
      // pointer.
      depth = -(Num_GPR_Regs * MVT::getSizeInBits(PtrVT)/8 +
                Num_FPR_Regs * MVT::getSizeInBits(MVT::f64)/8 +
                MVT::getSizeInBits(PtrVT)/8);

      VarArgsStackOffset = MFI->CreateFixedObject(MVT::getSizeInBits(PtrVT)/8,
                                                  ArgOffset);

    } else
      depth = ArgOffset;

    VarArgsFrameIndex = MFI->CreateFixedObject(MVT::getSizeInBits(PtrVT)/8,
                                               depth);
    SDOperand FIN = DAG.getFrameIndex(VarArgsFrameIndex, PtrVT);

    // In the ELF 32 ABI, the fixed integer arguments of a variadic function
    // are stored to the VarArgsFrameIndex on the stack.
    if (isELF32_ABI) {
      for (GPR_idx = 0; GPR_idx != VarArgsNumGPR; ++GPR_idx) {
        SDOperand Val = DAG.getRegister(GPR[GPR_idx], PtrVT);
        SDOperand Store = DAG.getStore(Root, Val, FIN, NULL, 0);
        MemOps.push_back(Store);
        // Increment the address by four for the next argument to store.
        SDOperand PtrOff = DAG.getConstant(MVT::getSizeInBits(PtrVT)/8, PtrVT);
        FIN = DAG.getNode(ISD::ADD, PtrOff.getValueType(), FIN, PtrOff);
      }
    }

    // If this function is vararg, store any remaining integer argument regs
    // to their spots on the stack so that they may be loaded by dereferencing
    // the result of va_next.
    for (; GPR_idx != Num_GPR_Regs; ++GPR_idx) {
      unsigned VReg;
      if (isPPC64)
        VReg = RegInfo.createVirtualRegister(&PPC::G8RCRegClass);
      else
        VReg = RegInfo.createVirtualRegister(&PPC::GPRCRegClass);

      RegInfo.addLiveIn(GPR[GPR_idx], VReg);
      SDOperand Val = DAG.getCopyFromReg(Root, VReg, PtrVT);
      SDOperand Store = DAG.getStore(Val.getValue(1), Val, FIN, NULL, 0);
      MemOps.push_back(Store);
      // Increment the address by four for the next argument to store.
      SDOperand PtrOff = DAG.getConstant(MVT::getSizeInBits(PtrVT)/8, PtrVT);
      FIN = DAG.getNode(ISD::ADD, PtrOff.getValueType(), FIN, PtrOff);
    }

    // In the ELF 32 ABI, the double arguments are stored to the
    // VarArgsFrameIndex on the stack.
    if (isELF32_ABI) {
      for (FPR_idx = 0; FPR_idx != VarArgsNumFPR; ++FPR_idx) {
        SDOperand Val = DAG.getRegister(FPR[FPR_idx], MVT::f64);
        SDOperand Store = DAG.getStore(Root, Val, FIN, NULL, 0);
        MemOps.push_back(Store);
        // Increment the address by eight for the next argument to store.
        SDOperand PtrOff = DAG.getConstant(MVT::getSizeInBits(MVT::f64)/8,
                                           PtrVT);
        FIN = DAG.getNode(ISD::ADD, PtrOff.getValueType(), FIN, PtrOff);
      }

      for (; FPR_idx != Num_FPR_Regs; ++FPR_idx) {
        unsigned VReg;
        VReg = RegInfo.createVirtualRegister(&PPC::F8RCRegClass);

        RegInfo.addLiveIn(FPR[FPR_idx], VReg);
        SDOperand Val = DAG.getCopyFromReg(Root, VReg, MVT::f64);
        SDOperand Store = DAG.getStore(Val.getValue(1), Val, FIN, NULL, 0);
        MemOps.push_back(Store);
        // Increment the address by eight for the next argument to store.
        SDOperand PtrOff = DAG.getConstant(MVT::getSizeInBits(MVT::f64)/8,
                                           PtrVT);
        FIN = DAG.getNode(ISD::ADD, PtrOff.getValueType(), FIN, PtrOff);
      }
    }
  }

  if (!MemOps.empty())
    Root = DAG.getNode(ISD::TokenFactor, MVT::Other, &MemOps[0], MemOps.size());

  ArgValues.push_back(Root);

  // Return the new list of results.
  std::vector<MVT::ValueType> RetVT(Op.Val->value_begin(),
                                    Op.Val->value_end());
  return DAG.getNode(ISD::MERGE_VALUES, RetVT, &ArgValues[0], ArgValues.size());
}

/// CalculateParameterAndLinkageAreaSize - Get the size of the parameter plus
/// linkage area.
static unsigned
CalculateParameterAndLinkageAreaSize(SelectionDAG &DAG,
                                     bool isPPC64,
                                     bool isMachoABI,
                                     bool isVarArg,
                                     unsigned CC,
                                     SDOperand Call,
                                     unsigned &nAltivecParamsAtEnd) {
  // Count how many bytes are to be pushed on the stack, including the linkage
  // area and the parameter passing area.  We start with 24/48 bytes, which is
  // prereserved space for [SP][CR][LR][3 x unused].
  unsigned NumBytes = PPCFrameInfo::getLinkageSize(isPPC64, isMachoABI);
  unsigned NumOps = (Call.getNumOperands() - 5) / 2;
  unsigned PtrByteSize = isPPC64 ? 8 : 4;

  // Add up all the space actually used.
  // In 32-bit non-varargs calls, Altivec parameters all go at the end;
  // usually they all go in registers, but we must reserve stack space for
  // them for possible use by the caller.  In varargs or 64-bit calls,
  // parameters are assigned stack space in order, with padding so Altivec
  // parameters are 16-byte aligned.
  nAltivecParamsAtEnd = 0;
  for (unsigned i = 0; i != NumOps; ++i) {
    SDOperand Arg = Call.getOperand(5+2*i);
    SDOperand Flag = Call.getOperand(5+2*i+1);
    MVT::ValueType ArgVT = Arg.getValueType();
    // Varargs Altivec parameters are padded to a 16-byte boundary.
    if (ArgVT==MVT::v4f32 || ArgVT==MVT::v4i32 ||
        ArgVT==MVT::v8i16 || ArgVT==MVT::v16i8) {
      if (!isVarArg && !isPPC64) {
        // Non-varargs Altivec parameters go after all the non-Altivec
        // parameters; handle those later so we know how much padding we need.
        nAltivecParamsAtEnd++;
        continue;
      }
      // Varargs and 64-bit Altivec parameters are padded to a 16-byte
      // boundary.
      NumBytes = ((NumBytes+15)/16)*16;
    }
    NumBytes += CalculateStackSlotSize(Arg, Flag, isVarArg, PtrByteSize);
  }

  // Allow for Altivec parameters at the end, if needed.
  if (nAltivecParamsAtEnd) {
    NumBytes = ((NumBytes+15)/16)*16;
    NumBytes += 16*nAltivecParamsAtEnd;
  }

  // The prolog code of the callee may store up to 8 GPR argument registers to
  // the stack, allowing va_start to index over them in memory if it is a
  // varargs function.  Because we cannot tell if this is needed on the caller
  // side, we have to conservatively assume that it is needed.  As such, make
  // sure we have at least enough stack space for the caller to store the 8
  // GPRs.
  NumBytes = std::max(NumBytes,
                      PPCFrameInfo::getMinCallFrameSize(isPPC64, isMachoABI));

  // Tail calls need the stack to be aligned.
  if (CC==CallingConv::Fast && PerformTailCallOpt) {
    unsigned TargetAlign = DAG.getMachineFunction().getTarget().getFrameInfo()->
      getStackAlignment();
    unsigned AlignMask = TargetAlign-1;
    NumBytes = (NumBytes + AlignMask) & ~AlignMask;
  }

  return NumBytes;
}
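// As a rough sketch: a 32-bit Macho call passing two i32s starts from the
// 24-byte linkage area, adds 8 bytes of parameters, and is then raised to
// getMinCallFrameSize, which as noted above reserves room for the callee to
// store all eight GPR argument registers.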

/// CalculateTailCallSPDiff - Get the amount the stack pointer has to be
/// adjusted to accommodate the arguments for the tail call.
static int CalculateTailCallSPDiff(SelectionDAG& DAG, bool IsTailCall,
                                   unsigned ParamSize) {

  if (!IsTailCall) return 0;

  PPCFunctionInfo *FI = DAG.getMachineFunction().getInfo<PPCFunctionInfo>();
  unsigned CallerMinReservedArea = FI->getMinReservedArea();
  int SPDiff = (int)CallerMinReservedArea - (int)ParamSize;
  // Remember only if the new adjustment is bigger.
  if (SPDiff < FI->getTailCallSPDelta())
    FI->setTailCallSPDelta(SPDiff);

  return SPDiff;
}
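// For example, if the caller reserved 64 bytes but the tail call needs 80,
// SPDiff is -16 and the stack must grow by 16 bytes before the jump; only
// the most negative adjustment seen so far is recorded.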

/// IsEligibleForTailCallOptimization - Check to see whether the next
/// instruction following the call is a return.  A function is eligible if
/// caller/callee calling conventions match, currently only fastcc supports
/// tail calls, and the function CALL is immediately followed by a RET.
bool
PPCTargetLowering::IsEligibleForTailCallOptimization(SDOperand Call,
                                                     SDOperand Ret,
                                                     SelectionDAG& DAG) const {
  // Variable argument functions are not supported.
  if (!PerformTailCallOpt ||
      cast<ConstantSDNode>(Call.getOperand(2))->getValue() != 0) return false;

  if (CheckTailCallReturnConstraints(Call, Ret)) {
    MachineFunction &MF = DAG.getMachineFunction();
    unsigned CallerCC = MF.getFunction()->getCallingConv();
    unsigned CalleeCC = cast<ConstantSDNode>(Call.getOperand(1))->getValue();
    if (CalleeCC == CallingConv::Fast && CallerCC == CalleeCC) {
      // Functions containing byval parameters are not supported.
      for (unsigned i = 0; i != ((Call.getNumOperands()-5)/2); i++) {
        ISD::ArgFlagsTy Flags = cast<ARG_FLAGSSDNode>(Call.getOperand(5+2*i+1))
                                  ->getArgFlags();
        if (Flags.isByVal()) return false;
      }

      SDOperand Callee = Call.getOperand(4);
      // Non-PIC/GOT tail calls are supported.
      if (getTargetMachine().getRelocationModel() != Reloc::PIC_)
        return true;

      // At the moment we can only do local tail calls (in the same module,
      // hidden or protected) if we are generating PIC.
      if (GlobalAddressSDNode *G = dyn_cast<GlobalAddressSDNode>(Callee))
        return G->getGlobal()->hasHiddenVisibility()
               || G->getGlobal()->hasProtectedVisibility();
    }
  }

  return false;
}

/// isBLACompatibleAddress - Return the immediate to use if the specified
/// 32-bit value is representable in the immediate field of a BxA instruction.
static SDNode *isBLACompatibleAddress(SDOperand Op, SelectionDAG &DAG) {
  ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op);
  if (!C) return 0;

  int Addr = C->getValue();
  if ((Addr & 3) != 0 ||  // Low 2 bits are implicitly zero.
      (Addr << 6 >> 6) != Addr)
    return 0;  // Top 6 bits have to be sext of immediate.

  return DAG.getConstant((int)C->getValue() >> 2,
                         DAG.getTargetLoweringInfo().getPointerTy()).Val;
}
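
// (Example for isBLACompatibleAddress: 0x01FFFFFC is 4-byte aligned and
// survives the sign-extension check, so 0x007FFFFF is returned; 0x04000000
// fails the (Addr << 6 >> 6) test because bits 31..26 do not replicate
// bit 25.)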

struct TailCallArgumentInfo {
  SDOperand Arg;
  SDOperand FrameIdxOp;
  int       FrameIdx;

  TailCallArgumentInfo() : FrameIdx(0) {}
};

/// StoreTailCallArgumentsToStackSlot - Stores arguments to their stack slot.
static void
StoreTailCallArgumentsToStackSlot(SelectionDAG &DAG,
                                  SDOperand Chain,
                    const SmallVector<TailCallArgumentInfo, 8> &TailCallArgs,
                                  SmallVector<SDOperand, 8> &MemOpChains) {
  for (unsigned i = 0, e = TailCallArgs.size(); i != e; ++i) {
    SDOperand Arg = TailCallArgs[i].Arg;
    SDOperand FIN = TailCallArgs[i].FrameIdxOp;
    int FI = TailCallArgs[i].FrameIdx;
    // Store relative to the frame pointer.
    MemOpChains.push_back(DAG.getStore(Chain, Arg, FIN,
                                       PseudoSourceValue::getFixedStack(),
                                       FI));
  }
}

/// EmitTailCallStoreFPAndRetAddr - Move the frame pointer and return address
/// to the appropriate stack slot for the tail call optimized function call.
static SDOperand EmitTailCallStoreFPAndRetAddr(SelectionDAG &DAG,
                                               MachineFunction &MF,
                                               SDOperand Chain,
                                               SDOperand OldRetAddr,
                                               SDOperand OldFP,
                                               int SPDiff,
                                               bool isPPC64,
                                               bool isMachoABI) {
  if (SPDiff) {
    // Calculate the new stack slot for the return address.
    int SlotSize = isPPC64 ? 8 : 4;
    int NewRetAddrLoc = SPDiff + PPCFrameInfo::getReturnSaveOffset(isPPC64,
                                                                   isMachoABI);
    int NewRetAddr = MF.getFrameInfo()->CreateFixedObject(SlotSize,
                                                          NewRetAddrLoc);
    int NewFPLoc = SPDiff + PPCFrameInfo::getFramePointerSaveOffset(isPPC64,
                                                                    isMachoABI);
    int NewFPIdx = MF.getFrameInfo()->CreateFixedObject(SlotSize, NewFPLoc);

    MVT::ValueType VT = isPPC64 ? MVT::i64 : MVT::i32;
    SDOperand NewRetAddrFrIdx = DAG.getFrameIndex(NewRetAddr, VT);
    Chain = DAG.getStore(Chain, OldRetAddr, NewRetAddrFrIdx,
                         PseudoSourceValue::getFixedStack(), NewRetAddr);
    SDOperand NewFramePtrIdx = DAG.getFrameIndex(NewFPIdx, VT);
    Chain = DAG.getStore(Chain, OldFP, NewFramePtrIdx,
                         PseudoSourceValue::getFixedStack(), NewFPIdx);
  }
  return Chain;
}

/// CalculateTailCallArgDest - Remember the argument for later processing, and
/// calculate the position of the argument.
static void
CalculateTailCallArgDest(SelectionDAG &DAG, MachineFunction &MF, bool isPPC64,
                         SDOperand Arg, int SPDiff, unsigned ArgOffset,
                     SmallVector<TailCallArgumentInfo, 8>& TailCallArguments) {
  int Offset = ArgOffset + SPDiff;
  uint32_t OpSize = (MVT::getSizeInBits(Arg.getValueType())+7)/8;
  int FI = MF.getFrameInfo()->CreateFixedObject(OpSize, Offset);
  MVT::ValueType VT = isPPC64 ? MVT::i64 : MVT::i32;
  SDOperand FIN = DAG.getFrameIndex(FI, VT);
  TailCallArgumentInfo Info;
  Info.Arg = Arg;
  Info.FrameIdxOp = FIN;
  Info.FrameIdx = FI;
  TailCallArguments.push_back(Info);
}

/// EmitTailCallLoadFPAndRetAddr - Emit loads from the frame pointer and
/// return address stack slots. Returns the chain as result and the loaded
/// values in LROpOut/FPOpOut. Used when tail calling.
SDOperand PPCTargetLowering::EmitTailCallLoadFPAndRetAddr(SelectionDAG &DAG,
                                                          int SPDiff,
                                                          SDOperand Chain,
                                                          SDOperand &LROpOut,
                                                          SDOperand &FPOpOut) {
  if (SPDiff) {
    // Load the LR and FP stack slots for later adjusting.
    MVT::ValueType VT = PPCSubTarget.isPPC64() ? MVT::i64 : MVT::i32;
    LROpOut = getReturnAddrFrameIndex(DAG);
    LROpOut = DAG.getLoad(VT, Chain, LROpOut, NULL, 0);
    Chain = SDOperand(LROpOut.Val, 1);
    FPOpOut = getFramePointerFrameIndex(DAG);
    FPOpOut = DAG.getLoad(VT, Chain, FPOpOut, NULL, 0);
    Chain = SDOperand(FPOpOut.Val, 1);
  }
  return Chain;
}

/// CreateCopyOfByValArgument - Make a copy of an aggregate at the address
/// specified by "Src" to address "Dst" of size "Size".  Alignment information
/// is specified by the specific parameter attribute. The copy will be passed
/// as a byval function parameter.
/// Sometimes what we are copying is the end of a larger object, the part that
/// does not fit in registers.
static SDOperand
CreateCopyOfByValArgument(SDOperand Src, SDOperand Dst, SDOperand Chain,
                          ISD::ArgFlagsTy Flags, SelectionDAG &DAG,
                          unsigned Size) {
  SDOperand SizeNode = DAG.getConstant(Size, MVT::i32);
  return DAG.getMemcpy(Chain, Dst, Src, SizeNode, Flags.getByValAlign(), false,
                       NULL, 0, NULL, 0);
}

/// LowerMemOpCallTo - Store the argument to the stack, or remember it in case
/// of tail calls.
static void
LowerMemOpCallTo(SelectionDAG &DAG, MachineFunction &MF, SDOperand Chain,
                 SDOperand Arg, SDOperand PtrOff, int SPDiff,
                 unsigned ArgOffset, bool isPPC64, bool isTailCall,
                 bool isVector, SmallVector<SDOperand, 8> &MemOpChains,
                 SmallVector<TailCallArgumentInfo, 8>& TailCallArguments) {
  MVT::ValueType PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
  if (!isTailCall) {
    if (isVector) {
      SDOperand StackPtr;
      if (isPPC64)
        StackPtr = DAG.getRegister(PPC::X1, MVT::i64);
      else
        StackPtr = DAG.getRegister(PPC::R1, MVT::i32);
      PtrOff = DAG.getNode(ISD::ADD, PtrVT, StackPtr,
                           DAG.getConstant(ArgOffset, PtrVT));
    }
    MemOpChains.push_back(DAG.getStore(Chain, Arg, PtrOff, NULL, 0));
  // Calculate and remember the argument location.
  } else CalculateTailCallArgDest(DAG, MF, isPPC64, Arg, SPDiff, ArgOffset,
                                  TailCallArguments);
}

SDOperand PPCTargetLowering::LowerCALL(SDOperand Op, SelectionDAG &DAG,
                                       const PPCSubtarget &Subtarget,
                                       TargetMachine &TM) {
  SDOperand Chain = Op.getOperand(0);
  bool isVarArg = cast<ConstantSDNode>(Op.getOperand(2))->getValue() != 0;
  unsigned CC = cast<ConstantSDNode>(Op.getOperand(1))->getValue();
  bool isTailCall = cast<ConstantSDNode>(Op.getOperand(3))->getValue() != 0 &&
                    CC == CallingConv::Fast && PerformTailCallOpt;
  SDOperand Callee = Op.getOperand(4);
  unsigned NumOps = (Op.getNumOperands() - 5) / 2;

  bool isMachoABI = Subtarget.isMachoABI();
  bool isELF32_ABI = Subtarget.isELF32_ABI();

  MVT::ValueType PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
  bool isPPC64 = PtrVT == MVT::i64;
  unsigned PtrByteSize = isPPC64 ? 8 : 4;

  MachineFunction &MF = DAG.getMachineFunction();

  // args_to_use will accumulate outgoing args for the PPCISD::CALL case in
  // SelectExpr to use to put the arguments in the appropriate registers.
  std::vector<SDOperand> args_to_use;

  // Mark this function as potentially containing a tail call.  As a
  // consequence, the frame pointer will be used for dynamic stack allocation
  // and for restoring the caller's stack pointer in this function's epilogue.
  // This is done because, by tail calling, the called function might
  // overwrite the value in this function's (MF) stack pointer stack slot
  // 0(SP).
  if (PerformTailCallOpt && CC==CallingConv::Fast)
    MF.getInfo<PPCFunctionInfo>()->setHasFastCall();

  unsigned nAltivecParamsAtEnd = 0;

  // Count how many bytes are to be pushed on the stack, including the linkage
  // area, and parameter passing area.  We start with 24/48 bytes, which is
  // prereserved space for [SP][CR][LR][3 x unused].
  unsigned NumBytes =
    CalculateParameterAndLinkageAreaSize(DAG, isPPC64, isMachoABI, isVarArg,
                                         CC, Op, nAltivecParamsAtEnd);

  // Calculate by how many bytes the stack has to be adjusted in case of tail
  // call optimization.
  int SPDiff = CalculateTailCallSPDiff(DAG, isTailCall, NumBytes);

  // Adjust the stack pointer for the new arguments...
  // These operations are automatically eliminated by the prolog/epilog pass.
  Chain = DAG.getCALLSEQ_START(Chain,
                               DAG.getConstant(NumBytes, PtrVT));
  SDOperand CallSeqStart = Chain;

  // Load the return address and frame pointer so they can be moved somewhere
  // else later.
  SDOperand LROp, FPOp;
  Chain = EmitTailCallLoadFPAndRetAddr(DAG, SPDiff, Chain, LROp, FPOp);

  // Set up a copy of the stack pointer for use loading and storing any
  // arguments that may not fit in the registers available for argument
  // passing.
  SDOperand StackPtr;
  if (isPPC64)
    StackPtr = DAG.getRegister(PPC::X1, MVT::i64);
  else
    StackPtr = DAG.getRegister(PPC::R1, MVT::i32);

  // Figure out which arguments are going to go in registers, and which in
  // memory.  Also, if this is a vararg function, floating point operations
  // must be stored to our stack, and loaded into integer regs as well, if
  // any integer regs are available for argument passing.
  unsigned ArgOffset = PPCFrameInfo::getLinkageSize(isPPC64, isMachoABI);
  unsigned GPR_idx = 0, FPR_idx = 0, VR_idx = 0;

  static const unsigned GPR_32[] = {           // 32-bit registers.
    PPC::R3, PPC::R4, PPC::R5, PPC::R6,
    PPC::R7, PPC::R8, PPC::R9, PPC::R10,
  };
  static const unsigned GPR_64[] = {           // 64-bit registers.
    PPC::X3, PPC::X4, PPC::X5, PPC::X6,
    PPC::X7, PPC::X8, PPC::X9, PPC::X10,
  };

  static const unsigned *FPR = GetFPR(Subtarget);

  static const unsigned VR[] = {
    PPC::V2, PPC::V3, PPC::V4, PPC::V5, PPC::V6, PPC::V7, PPC::V8,
    PPC::V9, PPC::V10, PPC::V11, PPC::V12, PPC::V13
  };
  const unsigned NumGPRs = array_lengthof(GPR_32);
  const unsigned NumFPRs = isMachoABI ? 13 : 8;
  const unsigned NumVRs  = array_lengthof(VR);

  const unsigned *GPR = isPPC64 ? GPR_64 : GPR_32;

  std::vector<std::pair<unsigned, SDOperand> > RegsToPass;
  SmallVector<TailCallArgumentInfo, 8> TailCallArguments;

  SmallVector<SDOperand, 8> MemOpChains;
  for (unsigned i = 0; i != NumOps; ++i) {
    bool inMem = false;
    SDOperand Arg = Op.getOperand(5+2*i);
    ISD::ArgFlagsTy Flags =
      cast<ARG_FLAGSSDNode>(Op.getOperand(5+2*i+1))->getArgFlags();
    // See if the next argument requires stack alignment in ELF.
    bool Align = Flags.isSplit();

    // PtrOff will be used to store the current argument to the stack if a
    // register cannot be found for it.
    SDOperand PtrOff;

    // Stack align in ELF 32.
    if (isELF32_ABI && Align)
      PtrOff = DAG.getConstant(ArgOffset + ((ArgOffset/4) % 2) * PtrByteSize,
                               StackPtr.getValueType());
    else
      PtrOff = DAG.getConstant(ArgOffset, StackPtr.getValueType());

    PtrOff = DAG.getNode(ISD::ADD, PtrVT, StackPtr, PtrOff);

    // On PPC64, promote integers to 64-bit values.
    if (isPPC64 && Arg.getValueType() == MVT::i32) {
      // FIXME: Should this use ANY_EXTEND if neither sext nor zext?
      unsigned ExtOp = Flags.isSExt() ? ISD::SIGN_EXTEND : ISD::ZERO_EXTEND;
      Arg = DAG.getNode(ExtOp, MVT::i64, Arg);
    }

    // FIXME: ELF is untested; what are the alignment rules?
    // FIXME: memcpy is used way more than necessary.  Correctness first.
    if (Flags.isByVal()) {
      unsigned Size = Flags.getByValSize();
      if (isELF32_ABI && Align) GPR_idx += (GPR_idx % 2);
      if (Size==1 || Size==2) {
        // Very small objects are passed right-justified.
        // Everything else is passed left-justified.
        MVT::ValueType VT = (Size==1) ? MVT::i8 : MVT::i16;
        if (GPR_idx != NumGPRs) {
          SDOperand Load = DAG.getExtLoad(ISD::EXTLOAD, PtrVT, Chain, Arg,
                                          NULL, 0, VT);
          MemOpChains.push_back(Load.getValue(1));
          RegsToPass.push_back(std::make_pair(GPR[GPR_idx++], Load));
          if (isMachoABI)
            ArgOffset += PtrByteSize;
        } else {
          SDOperand Const = DAG.getConstant(4 - Size, PtrOff.getValueType());
          SDOperand AddPtr = DAG.getNode(ISD::ADD, PtrVT, PtrOff, Const);
          SDOperand MemcpyCall = CreateCopyOfByValArgument(Arg, AddPtr,
                                     CallSeqStart.Val->getOperand(0),
                                     Flags, DAG, Size);
          // This must go outside the CALLSEQ_START..END.
          SDOperand NewCallSeqStart = DAG.getCALLSEQ_START(MemcpyCall,
                                          CallSeqStart.Val->getOperand(1));
          DAG.ReplaceAllUsesWith(CallSeqStart.Val, NewCallSeqStart.Val);
          Chain = CallSeqStart = NewCallSeqStart;
          ArgOffset += PtrByteSize;
        }
        continue;
      }
      // Copy the entire object into memory.  There are cases where
      // gcc-generated code assumes it is there, even if it could be put
      // entirely into registers.  (This is not what the doc says.)
      SDOperand MemcpyCall = CreateCopyOfByValArgument(Arg, PtrOff,
                                 CallSeqStart.Val->getOperand(0),
                                 Flags, DAG, Size);
      // This must go outside the CALLSEQ_START..END.
      SDOperand NewCallSeqStart = DAG.getCALLSEQ_START(MemcpyCall,
                                      CallSeqStart.Val->getOperand(1));
      DAG.ReplaceAllUsesWith(CallSeqStart.Val, NewCallSeqStart.Val);
      Chain = CallSeqStart = NewCallSeqStart;
      // And copy the pieces of it that fit into registers.
      for (unsigned j=0; j<Size; j+=PtrByteSize) {
        SDOperand Const = DAG.getConstant(j, PtrOff.getValueType());
        SDOperand AddArg = DAG.getNode(ISD::ADD, PtrVT, Arg, Const);
        if (GPR_idx != NumGPRs) {
          SDOperand Load = DAG.getLoad(PtrVT, Chain, AddArg, NULL, 0);
          MemOpChains.push_back(Load.getValue(1));
          RegsToPass.push_back(std::make_pair(GPR[GPR_idx++], Load));
          if (isMachoABI)
            ArgOffset += PtrByteSize;
        } else {
          ArgOffset += ((Size - j + PtrByteSize-1)/PtrByteSize)*PtrByteSize;
          break;
        }
      }
      continue;
    }

    switch (Arg.getValueType()) {
    default: assert(0 && "Unexpected ValueType for argument!");
    case MVT::i32:
    case MVT::i64:
      // Double-word align in ELF.
      if (isELF32_ABI && Align) GPR_idx += (GPR_idx % 2);
      if (GPR_idx != NumGPRs) {
        RegsToPass.push_back(std::make_pair(GPR[GPR_idx++], Arg));
      } else {
        LowerMemOpCallTo(DAG, MF, Chain, Arg, PtrOff, SPDiff, ArgOffset,
                         isPPC64, isTailCall, false, MemOpChains,
                         TailCallArguments);
        inMem = true;
      }
      if (inMem || isMachoABI) {
        // Stack align in ELF.
        if (isELF32_ABI && Align)
          ArgOffset += ((ArgOffset/4) % 2) * PtrByteSize;

        ArgOffset += PtrByteSize;
      }
      break;
    case MVT::f32:
    case MVT::f64:
      if (FPR_idx != NumFPRs) {
        RegsToPass.push_back(std::make_pair(FPR[FPR_idx++], Arg));

        if (isVarArg) {
          SDOperand Store = DAG.getStore(Chain, Arg, PtrOff, NULL, 0);
          MemOpChains.push_back(Store);

          // Float varargs are always shadowed in available integer registers.
          if (GPR_idx != NumGPRs) {
            SDOperand Load = DAG.getLoad(PtrVT, Store, PtrOff, NULL, 0);
            MemOpChains.push_back(Load.getValue(1));
            if (isMachoABI) RegsToPass.push_back(std::make_pair(GPR[GPR_idx++],
                                                                Load));
          }
          if (GPR_idx != NumGPRs && Arg.getValueType() == MVT::f64 &&
              !isPPC64) {
            SDOperand ConstFour = DAG.getConstant(4, PtrOff.getValueType());
            PtrOff = DAG.getNode(ISD::ADD, PtrVT, PtrOff, ConstFour);
            SDOperand Load = DAG.getLoad(PtrVT, Store, PtrOff, NULL, 0);
            MemOpChains.push_back(Load.getValue(1));
            if (isMachoABI) RegsToPass.push_back(std::make_pair(GPR[GPR_idx++],
                                                                Load));
          }
        } else {
          // If we have any FPRs remaining, we may also have GPRs remaining.
          // Args passed in FPRs consume either 1 (f32) or 2 (f64) available
          // GPRs.
          if (isMachoABI) {
            if (GPR_idx != NumGPRs)
              ++GPR_idx;
            if (GPR_idx != NumGPRs && Arg.getValueType() == MVT::f64 &&
                !isPPC64)  // PPC64 has 64-bit GPRs, obviously :)
              ++GPR_idx;
          }
        }
      } else {
        LowerMemOpCallTo(DAG, MF, Chain, Arg, PtrOff, SPDiff, ArgOffset,
                         isPPC64, isTailCall, false, MemOpChains,
                         TailCallArguments);
        inMem = true;
      }
      if (inMem || isMachoABI) {
        // Stack align in ELF.
        if (isELF32_ABI && Align)
          ArgOffset += ((ArgOffset/4) % 2) * PtrByteSize;
        if (isPPC64)
          ArgOffset += 8;
        else
          ArgOffset += Arg.getValueType() == MVT::f32 ? 4 : 8;
      }
      break;
    case MVT::v4f32:
    case MVT::v4i32:
    case MVT::v8i16:
    case MVT::v16i8:
      if (isVarArg) {
        // These go aligned on the stack, or in the corresponding R registers
        // when within range.  The Darwin PPC ABI doc claims they also go in
        // V registers; in fact gcc does this only for arguments that are
        // prototyped, not for those that match the ...  We do it for all
        // arguments, which seems to work.
        while (ArgOffset % 16 != 0) {
          ArgOffset += PtrByteSize;
          if (GPR_idx != NumGPRs)
            GPR_idx++;
        }
        // We could elide this store in the case where the object fits
        // entirely in R registers.  Maybe later.
        PtrOff = DAG.getNode(ISD::ADD, PtrVT, StackPtr,
                             DAG.getConstant(ArgOffset, PtrVT));
        SDOperand Store = DAG.getStore(Chain, Arg, PtrOff, NULL, 0);
        MemOpChains.push_back(Store);
        if (VR_idx != NumVRs) {
          SDOperand Load = DAG.getLoad(MVT::v4f32, Store, PtrOff, NULL, 0);
          MemOpChains.push_back(Load.getValue(1));
          RegsToPass.push_back(std::make_pair(VR[VR_idx++], Load));
        }
        ArgOffset += 16;
        for (unsigned i=0; i<16; i+=PtrByteSize) {
          if (GPR_idx == NumGPRs)
            break;
          SDOperand Ix = DAG.getNode(ISD::ADD, PtrVT, PtrOff,
                                     DAG.getConstant(i, PtrVT));
          SDOperand Load = DAG.getLoad(PtrVT, Store, Ix, NULL, 0);
          MemOpChains.push_back(Load.getValue(1));
          RegsToPass.push_back(std::make_pair(GPR[GPR_idx++], Load));
        }
        break;
      }

      // Non-varargs Altivec params generally go in registers, but have
      // stack space allocated at the end.
      if (VR_idx != NumVRs) {
        // Doesn't have GPR space allocated.
        RegsToPass.push_back(std::make_pair(VR[VR_idx++], Arg));
      } else if (nAltivecParamsAtEnd==0) {
        // We are emitting Altivec params in order.
        LowerMemOpCallTo(DAG, MF, Chain, Arg, PtrOff, SPDiff, ArgOffset,
                         isPPC64, isTailCall, true, MemOpChains,
                         TailCallArguments);
        ArgOffset += 16;
      }
      break;
    }
  }
  // If all Altivec parameters fit in registers, as they usually do,
  // they get stack space following the non-Altivec parameters.  We
  // don't track this here because nobody below needs it.
  // If there are more Altivec parameters than fit in registers, emit
  // the stores here.
  if (!isVarArg && nAltivecParamsAtEnd > NumVRs) {
    unsigned j = 0;
    // Offset is aligned; skip the first 12 params, which go in V registers.
    ArgOffset = ((ArgOffset+15)/16)*16;
    ArgOffset += 12*16;
    for (unsigned i = 0; i != NumOps; ++i) {
      SDOperand Arg = Op.getOperand(5+2*i);
      MVT::ValueType ArgType = Arg.getValueType();
      if (ArgType==MVT::v4f32 || ArgType==MVT::v4i32 ||
          ArgType==MVT::v8i16 || ArgType==MVT::v16i8) {
        if (++j > NumVRs) {
          SDOperand PtrOff;
          // We are emitting Altivec params in order.
          LowerMemOpCallTo(DAG, MF, Chain, Arg, PtrOff, SPDiff, ArgOffset,
                           isPPC64, isTailCall, true, MemOpChains,
                           TailCallArguments);
          ArgOffset += 16;
        }
      }
    }
  }

  if (!MemOpChains.empty())
    Chain = DAG.getNode(ISD::TokenFactor, MVT::Other,
                        &MemOpChains[0], MemOpChains.size());

  // Build a sequence of copy-to-reg nodes chained together with token chain
  // and flag operands which copy the outgoing args into the appropriate regs.
  SDOperand InFlag;
  for (unsigned i = 0, e = RegsToPass.size(); i != e; ++i) {
    Chain = DAG.getCopyToReg(Chain, RegsToPass[i].first, RegsToPass[i].second,
                             InFlag);
    InFlag = Chain.getValue(1);
  }

  // With the ELF 32 ABI, set CR6 to true if this is a vararg call.
  if (isVarArg && isELF32_ABI) {
    SDOperand SetCR(DAG.getTargetNode(PPC::CRSET, MVT::i32), 0);
    Chain = DAG.getCopyToReg(Chain, PPC::CR1EQ, SetCR, InFlag);
    InFlag = Chain.getValue(1);
  }

  // Emit a sequence of copyto/copyfrom virtual registers for arguments that
  // might overwrite each other in case of tail call optimization.
  if (isTailCall) {
    SmallVector<SDOperand, 8> MemOpChains2;
    // Do not flag preceding copytoreg stuff together with the following stuff.
    InFlag = SDOperand();
    StoreTailCallArgumentsToStackSlot(DAG, Chain, TailCallArguments,
                                      MemOpChains2);
    if (!MemOpChains2.empty())
      Chain = DAG.getNode(ISD::TokenFactor, MVT::Other,
                          &MemOpChains2[0], MemOpChains2.size());

    // Store the return address to the appropriate stack slot.
    Chain = EmitTailCallStoreFPAndRetAddr(DAG, MF, Chain, LROp, FPOp, SPDiff,
                                          isPPC64, isMachoABI);
  }

  // Emit callseq_end just before the tail call node.
  if (isTailCall) {
    SmallVector<SDOperand, 8> CallSeqOps;
    SDVTList CallSeqNodeTys = DAG.getVTList(MVT::Other, MVT::Flag);
    CallSeqOps.push_back(Chain);
    CallSeqOps.push_back(DAG.getIntPtrConstant(NumBytes));
    CallSeqOps.push_back(DAG.getIntPtrConstant(0));
    if (InFlag.Val)
      CallSeqOps.push_back(InFlag);
    Chain = DAG.getNode(ISD::CALLSEQ_END, CallSeqNodeTys, &CallSeqOps[0],
                        CallSeqOps.size());
    InFlag = Chain.getValue(1);
  }
2448
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002449 std::vector<MVT::ValueType> NodeTys;
2450 NodeTys.push_back(MVT::Other); // Returns a chain
2451 NodeTys.push_back(MVT::Flag); // Returns a flag for retval copy to use.
2452
2453 SmallVector<SDOperand, 8> Ops;
2454 unsigned CallOpc = isMachoABI? PPCISD::CALL_Macho : PPCISD::CALL_ELF;
2455
2456 // If the callee is a GlobalAddress/ExternalSymbol node (quite common, every
2457 // direct call is) turn it into a TargetGlobalAddress/TargetExternalSymbol
2458 // node so that legalize doesn't hack it.
Nicolas Geoffray455a2e02007-12-21 12:22:29 +00002459 if (GlobalAddressSDNode *G = dyn_cast<GlobalAddressSDNode>(Callee))
2460 Callee = DAG.getTargetGlobalAddress(G->getGlobal(), Callee.getValueType());
2461 else if (ExternalSymbolSDNode *S = dyn_cast<ExternalSymbolSDNode>(Callee))
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002462 Callee = DAG.getTargetExternalSymbol(S->getSymbol(), Callee.getValueType());
2463 else if (SDNode *Dest = isBLACompatibleAddress(Callee, DAG))
2464 // If this is an absolute destination address, use the munged value.
2465 Callee = SDOperand(Dest, 0);
2466 else {
2467     // Otherwise, this is an indirect call.  We have to use an MTCTR/BCTRL
2468     // pair to do the call; we can't use PPCISD::CALL.
2469 SDOperand MTCTROps[] = {Chain, Callee, InFlag};
2470 Chain = DAG.getNode(PPCISD::MTCTR, NodeTys, MTCTROps, 2+(InFlag.Val!=0));
2471 InFlag = Chain.getValue(1);
2472
Chris Lattner6eae8c62008-03-09 20:49:33 +00002473 // Copy the callee address into R12/X12 on darwin.
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002474 if (isMachoABI) {
Chris Lattner6eae8c62008-03-09 20:49:33 +00002475 unsigned Reg = Callee.getValueType() == MVT::i32 ? PPC::R12 : PPC::X12;
2476 Chain = DAG.getCopyToReg(Chain, Reg, Callee, InFlag);
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002477 InFlag = Chain.getValue(1);
2478 }
2479
2480 NodeTys.clear();
2481 NodeTys.push_back(MVT::Other);
2482 NodeTys.push_back(MVT::Flag);
2483 Ops.push_back(Chain);
2484 CallOpc = isMachoABI ? PPCISD::BCTRL_Macho : PPCISD::BCTRL_ELF;
2485 Callee.Val = 0;
Arnold Schwaighofera0032722008-04-30 09:16:33 +00002486 // Add CTR register as callee so a bctr can be emitted later.
2487 if (isTailCall)
2488 Ops.push_back(DAG.getRegister(PPC::CTR, getPointerTy()));
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002489 }
2490
2491 // If this is a direct call, pass the chain and the callee.
2492 if (Callee.Val) {
2493 Ops.push_back(Chain);
2494 Ops.push_back(Callee);
2495 }
Arnold Schwaighofera0032722008-04-30 09:16:33 +00002496   // If this is a tail call, add the stack pointer delta.
2497 if (isTailCall)
2498 Ops.push_back(DAG.getConstant(SPDiff, MVT::i32));
2499
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002500 // Add argument registers to the end of the list so that they are known live
2501 // into the call.
2502 for (unsigned i = 0, e = RegsToPass.size(); i != e; ++i)
2503 Ops.push_back(DAG.getRegister(RegsToPass[i].first,
2504 RegsToPass[i].second.getValueType()));
Arnold Schwaighofera0032722008-04-30 09:16:33 +00002505
2506 // When performing tail call optimization the callee pops its arguments off
2507 // the stack. Account for this here so these bytes can be pushed back on in
2508 // PPCRegisterInfo::eliminateCallFramePseudoInstr.
2509 int BytesCalleePops =
2510 (CC==CallingConv::Fast && PerformTailCallOpt) ? NumBytes : 0;
2511
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002512 if (InFlag.Val)
2513 Ops.push_back(InFlag);
Arnold Schwaighofera0032722008-04-30 09:16:33 +00002514
2515 // Emit tail call.
2516 if (isTailCall) {
2517 assert(InFlag.Val &&
2518 "Flag must be set. Depend on flag being set in LowerRET");
2519 Chain = DAG.getNode(PPCISD::TAILCALL,
2520 Op.Val->getVTList(), &Ops[0], Ops.size());
2521 return SDOperand(Chain.Val, Op.ResNo);
2522 }
2523
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002524 Chain = DAG.getNode(CallOpc, NodeTys, &Ops[0], Ops.size());
2525 InFlag = Chain.getValue(1);
2526
Bill Wendling22f8deb2007-11-13 00:44:25 +00002527 Chain = DAG.getCALLSEQ_END(Chain,
2528 DAG.getConstant(NumBytes, PtrVT),
Arnold Schwaighofera0032722008-04-30 09:16:33 +00002529 DAG.getConstant(BytesCalleePops, PtrVT),
Bill Wendling22f8deb2007-11-13 00:44:25 +00002530 InFlag);
2531 if (Op.Val->getValueType(0) != MVT::Other)
2532 InFlag = Chain.getValue(1);
2533
Dan Gohman9f153572008-03-19 21:39:28 +00002534 SmallVector<SDOperand, 16> ResultVals;
2535 SmallVector<CCValAssign, 16> RVLocs;
Arnold Schwaighofera0032722008-04-30 09:16:33 +00002536 unsigned CallerCC = DAG.getMachineFunction().getFunction()->getCallingConv();
2537 CCState CCInfo(CallerCC, isVarArg, TM, RVLocs);
Dan Gohman9f153572008-03-19 21:39:28 +00002538 CCInfo.AnalyzeCallResult(Op.Val, RetCC_PPC);
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002539
Dan Gohman9f153572008-03-19 21:39:28 +00002540 // Copy all of the result registers out of their specified physreg.
2541 for (unsigned i = 0, e = RVLocs.size(); i != e; ++i) {
2542 CCValAssign &VA = RVLocs[i];
2543 MVT::ValueType VT = VA.getValVT();
2544 assert(VA.isRegLoc() && "Can only return in registers!");
2545 Chain = DAG.getCopyFromReg(Chain, VA.getLocReg(), VT, InFlag).getValue(1);
2546 ResultVals.push_back(Chain.getValue(0));
2547 InFlag = Chain.getValue(2);
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002548 }
Dan Gohman9f153572008-03-19 21:39:28 +00002549
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002550 // If the function returns void, just return the chain.
Dan Gohman9f153572008-03-19 21:39:28 +00002551 if (RVLocs.empty())
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002552 return Chain;
2553
2554 // Otherwise, merge everything together with a MERGE_VALUES node.
Dan Gohman9f153572008-03-19 21:39:28 +00002555 ResultVals.push_back(Chain);
2556 SDOperand Res = DAG.getNode(ISD::MERGE_VALUES, Op.Val->getVTList(),
2557 &ResultVals[0], ResultVals.size());
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002558 return Res.getValue(Op.ResNo);
2559}
2560
Dale Johannesen8be83a72008-03-04 23:17:14 +00002561SDOperand PPCTargetLowering::LowerRET(SDOperand Op, SelectionDAG &DAG,
2562 TargetMachine &TM) {
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002563 SmallVector<CCValAssign, 16> RVLocs;
2564 unsigned CC = DAG.getMachineFunction().getFunction()->getCallingConv();
2565 bool isVarArg = DAG.getMachineFunction().getFunction()->isVarArg();
2566 CCState CCInfo(CC, isVarArg, TM, RVLocs);
2567 CCInfo.AnalyzeReturn(Op.Val, RetCC_PPC);
2568
2569 // If this is the first return lowered for this function, add the regs to the
2570 // liveout set for the function.
Chris Lattner1b989192007-12-31 04:13:23 +00002571 if (DAG.getMachineFunction().getRegInfo().liveout_empty()) {
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002572 for (unsigned i = 0; i != RVLocs.size(); ++i)
Chris Lattner1b989192007-12-31 04:13:23 +00002573 DAG.getMachineFunction().getRegInfo().addLiveOut(RVLocs[i].getLocReg());
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002574 }
2575
2576 SDOperand Chain = Op.getOperand(0);
Arnold Schwaighofera0032722008-04-30 09:16:33 +00002577
2578 Chain = GetPossiblePreceedingTailCall(Chain, PPCISD::TAILCALL);
2579 if (Chain.getOpcode() == PPCISD::TAILCALL) {
2580 SDOperand TailCall = Chain;
2581 SDOperand TargetAddress = TailCall.getOperand(1);
2582 SDOperand StackAdjustment = TailCall.getOperand(2);
2583
2584 assert(((TargetAddress.getOpcode() == ISD::Register &&
2585 cast<RegisterSDNode>(TargetAddress)->getReg() == PPC::CTR) ||
2586 TargetAddress.getOpcode() == ISD::TargetExternalSymbol ||
2587 TargetAddress.getOpcode() == ISD::TargetGlobalAddress ||
2588 isa<ConstantSDNode>(TargetAddress)) &&
2589 "Expecting an global address, external symbol, absolute value or register");
2590
2591 assert(StackAdjustment.getOpcode() == ISD::Constant &&
2592 "Expecting a const value");
2593
2594 SmallVector<SDOperand,8> Operands;
2595 Operands.push_back(Chain.getOperand(0));
2596 Operands.push_back(TargetAddress);
2597 Operands.push_back(StackAdjustment);
2598 // Copy registers used by the call. Last operand is a flag so it is not
2599 // copied.
2600 for (unsigned i=3; i < TailCall.getNumOperands()-1; i++) {
2601 Operands.push_back(Chain.getOperand(i));
2602 }
2603 return DAG.getNode(PPCISD::TC_RETURN, MVT::Other, &Operands[0],
2604 Operands.size());
2605 }
2606
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002607 SDOperand Flag;
2608
2609 // Copy the result values into the output registers.
2610 for (unsigned i = 0; i != RVLocs.size(); ++i) {
2611 CCValAssign &VA = RVLocs[i];
2612 assert(VA.isRegLoc() && "Can only return in registers!");
2613 Chain = DAG.getCopyToReg(Chain, VA.getLocReg(), Op.getOperand(i*2+1), Flag);
2614 Flag = Chain.getValue(1);
2615 }
2616
2617 if (Flag.Val)
2618 return DAG.getNode(PPCISD::RET_FLAG, MVT::Other, Chain, Flag);
2619 else
2620 return DAG.getNode(PPCISD::RET_FLAG, MVT::Other, Chain);
2621}
2622
Dale Johannesen8be83a72008-03-04 23:17:14 +00002623SDOperand PPCTargetLowering::LowerSTACKRESTORE(SDOperand Op, SelectionDAG &DAG,
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002624 const PPCSubtarget &Subtarget) {
2625 // When we pop the dynamic allocation we need to restore the SP link.
2626
2627   // Get the correct type for pointers.
2628 MVT::ValueType PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
2629
2630 // Construct the stack pointer operand.
2631 bool IsPPC64 = Subtarget.isPPC64();
2632 unsigned SP = IsPPC64 ? PPC::X1 : PPC::R1;
2633 SDOperand StackPtr = DAG.getRegister(SP, PtrVT);
2634
2635 // Get the operands for the STACKRESTORE.
2636 SDOperand Chain = Op.getOperand(0);
2637 SDOperand SaveSP = Op.getOperand(1);
2638
2639 // Load the old link SP.
2640 SDOperand LoadLinkSP = DAG.getLoad(PtrVT, Chain, StackPtr, NULL, 0);
2641
2642 // Restore the stack pointer.
2643 Chain = DAG.getCopyToReg(LoadLinkSP.getValue(1), SP, SaveSP);
2644
2645 // Store the old link SP.
2646 return DAG.getStore(Chain, LoadLinkSP, StackPtr, NULL, 0);
2647}
2648
Arnold Schwaighofera0032722008-04-30 09:16:33 +00002649
2650
2651SDOperand
2652PPCTargetLowering::getReturnAddrFrameIndex(SelectionDAG & DAG) const {
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002653 MachineFunction &MF = DAG.getMachineFunction();
Arnold Schwaighofera0032722008-04-30 09:16:33 +00002654 bool IsPPC64 = PPCSubTarget.isPPC64();
2655 bool isMachoABI = PPCSubTarget.isMachoABI();
2656 MVT::ValueType PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
2657
2658   // Get the current return address save index; it is created on first
2659   // use below.
2660 PPCFunctionInfo *FI = MF.getInfo<PPCFunctionInfo>();
2661 int RASI = FI->getReturnAddrSaveIndex();
2662
2663   // If the return address save index hasn't been defined yet.
2664 if (!RASI) {
2665     // Find out the fixed offset of the return address save area.
2666 int LROffset = PPCFrameInfo::getReturnSaveOffset(IsPPC64, isMachoABI);
2667     // Allocate the frame index for the return address save area.
2668 RASI = MF.getFrameInfo()->CreateFixedObject(IsPPC64? 8 : 4, LROffset);
2669 // Save the result.
2670 FI->setReturnAddrSaveIndex(RASI);
2671 }
2672 return DAG.getFrameIndex(RASI, PtrVT);
2673}
2674
2675SDOperand
2676PPCTargetLowering::getFramePointerFrameIndex(SelectionDAG & DAG) const {
2677 MachineFunction &MF = DAG.getMachineFunction();
2678 bool IsPPC64 = PPCSubTarget.isPPC64();
2679 bool isMachoABI = PPCSubTarget.isMachoABI();
2680 MVT::ValueType PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002681
2682 // Get current frame pointer save index. The users of this index will be
2683 // primarily DYNALLOC instructions.
2684 PPCFunctionInfo *FI = MF.getInfo<PPCFunctionInfo>();
2685 int FPSI = FI->getFramePointerSaveIndex();
Arnold Schwaighofera0032722008-04-30 09:16:33 +00002686
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002687 // If the frame pointer save index hasn't been defined yet.
2688 if (!FPSI) {
2689     // Find out the fixed offset of the frame pointer save area.
2690 int FPOffset = PPCFrameInfo::getFramePointerSaveOffset(IsPPC64, isMachoABI);
2691
2692 // Allocate the frame index for frame pointer save area.
2693 FPSI = MF.getFrameInfo()->CreateFixedObject(IsPPC64? 8 : 4, FPOffset);
2694 // Save the result.
2695 FI->setFramePointerSaveIndex(FPSI);
2696 }
Arnold Schwaighofera0032722008-04-30 09:16:33 +00002697 return DAG.getFrameIndex(FPSI, PtrVT);
2698}
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002699
Arnold Schwaighofera0032722008-04-30 09:16:33 +00002700SDOperand PPCTargetLowering::LowerDYNAMIC_STACKALLOC(SDOperand Op,
2701 SelectionDAG &DAG,
2702 const PPCSubtarget &Subtarget) {
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002703 // Get the inputs.
2704 SDOperand Chain = Op.getOperand(0);
2705 SDOperand Size = Op.getOperand(1);
2706
2707   // Get the correct type for pointers.
2708 MVT::ValueType PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
2709 // Negate the size.
2710 SDOperand NegSize = DAG.getNode(ISD::SUB, PtrVT,
2711 DAG.getConstant(0, PtrVT), Size);
2712 // Construct a node for the frame pointer save index.
Arnold Schwaighofera0032722008-04-30 09:16:33 +00002713 SDOperand FPSIdx = getFramePointerFrameIndex(DAG);
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002714 // Build a DYNALLOC node.
2715 SDOperand Ops[3] = { Chain, NegSize, FPSIdx };
2716 SDVTList VTs = DAG.getVTList(PtrVT, MVT::Other);
2717 return DAG.getNode(PPCISD::DYNALLOC, VTs, Ops, 3);
2718}
2719
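// The three atomic lowerings below all follow the classic PowerPC
// reservation-loop pattern: a "load and reserve" (lwarx/ldarx, modeled as
// PPCISD::LARX), the update, and a "store conditional" (stwcx./stdcx.,
// modeled as PPCISD::STCX) that retries on failure.  The shared Label
// operand ties each LARX/STCX pair to the same loop head.  Roughly, a
// fetch-and-add comes out as:
//   Ln:  lwarx  rT, 0, rPtr
//        add    rU, rT, rIncr
//        stwcx. rU, 0, rPtr
//        bne-   Ln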
Evan Cheng4df1f9d2008-04-19 01:30:48 +00002720SDOperand PPCTargetLowering::LowerAtomicLAS(SDOperand Op, SelectionDAG &DAG) {
Evan Cheng0589b512008-04-19 02:30:38 +00002721 MVT::ValueType VT = Op.Val->getValueType(0);
Evan Cheng4df1f9d2008-04-19 01:30:48 +00002722 SDOperand Chain = Op.getOperand(0);
2723 SDOperand Ptr = Op.getOperand(1);
2724 SDOperand Incr = Op.getOperand(2);
2725
2726 // Issue a "load and reserve".
2727 std::vector<MVT::ValueType> VTs;
2728 VTs.push_back(VT);
2729 VTs.push_back(MVT::Other);
2730
2731 SDOperand Label = DAG.getConstant(PPCAtomicLabelIndex++, MVT::i32);
2732 SDOperand Ops[] = {
Evan Cheng0589b512008-04-19 02:30:38 +00002733 Chain, // Chain
2734 Ptr, // Ptr
2735 Label, // Label
Evan Cheng4df1f9d2008-04-19 01:30:48 +00002736 };
Evan Cheng0589b512008-04-19 02:30:38 +00002737 SDOperand Load = DAG.getNode(PPCISD::LARX, VTs, Ops, 3);
Evan Cheng4df1f9d2008-04-19 01:30:48 +00002738 Chain = Load.getValue(1);
2739
2740 // Compute new value.
2741 SDOperand NewVal = DAG.getNode(ISD::ADD, VT, Load, Incr);
2742
2743 // Issue a "store and check".
2744 SDOperand Ops2[] = {
Evan Cheng0589b512008-04-19 02:30:38 +00002745 Chain, // Chain
2746 NewVal, // Value
2747 Ptr, // Ptr
2748 Label, // Label
Evan Cheng4df1f9d2008-04-19 01:30:48 +00002749 };
Evan Cheng0589b512008-04-19 02:30:38 +00002750 SDOperand Store = DAG.getNode(PPCISD::STCX, MVT::Other, Ops2, 4);
Evan Cheng4df1f9d2008-04-19 01:30:48 +00002751 SDOperand OutOps[] = { Load, Store };
2752 return DAG.getNode(ISD::MERGE_VALUES, DAG.getVTList(VT, MVT::Other),
2753 OutOps, 2);
2754}
2755
2756SDOperand PPCTargetLowering::LowerAtomicLCS(SDOperand Op, SelectionDAG &DAG) {
Evan Cheng0589b512008-04-19 02:30:38 +00002757 MVT::ValueType VT = Op.Val->getValueType(0);
Evan Cheng4df1f9d2008-04-19 01:30:48 +00002758 SDOperand Chain = Op.getOperand(0);
2759 SDOperand Ptr = Op.getOperand(1);
2760 SDOperand NewVal = Op.getOperand(2);
2761 SDOperand OldVal = Op.getOperand(3);
2762
2763 // Issue a "load and reserve".
2764 std::vector<MVT::ValueType> VTs;
2765 VTs.push_back(VT);
2766 VTs.push_back(MVT::Other);
2767
2768 SDOperand Label = DAG.getConstant(PPCAtomicLabelIndex++, MVT::i32);
2769 SDOperand Ops[] = {
Evan Cheng0589b512008-04-19 02:30:38 +00002770 Chain, // Chain
2771 Ptr, // Ptr
2772 Label, // Label
Evan Cheng4df1f9d2008-04-19 01:30:48 +00002773 };
Evan Cheng0589b512008-04-19 02:30:38 +00002774 SDOperand Load = DAG.getNode(PPCISD::LARX, VTs, Ops, 3);
Evan Cheng4df1f9d2008-04-19 01:30:48 +00002775 Chain = Load.getValue(1);
2776
2777 // Compare and unreserve if not equal.
2778 SDOperand Ops2[] = {
Evan Cheng0589b512008-04-19 02:30:38 +00002779 Chain, // Chain
2780 OldVal, // Old value
2781 Load, // Value in memory
2782 Label, // Label
Evan Cheng4df1f9d2008-04-19 01:30:48 +00002783 };
2784 Chain = DAG.getNode(PPCISD::CMP_UNRESERVE, MVT::Other, Ops2, 4);
2785
2786 // Issue a "store and check".
2787 SDOperand Ops3[] = {
Evan Cheng0589b512008-04-19 02:30:38 +00002788 Chain, // Chain
2789 NewVal, // Value
2790 Ptr, // Ptr
2791 Label, // Label
Evan Cheng4df1f9d2008-04-19 01:30:48 +00002792 };
Evan Cheng0589b512008-04-19 02:30:38 +00002793 SDOperand Store = DAG.getNode(PPCISD::STCX, MVT::Other, Ops3, 4);
Evan Cheng4df1f9d2008-04-19 01:30:48 +00002794 SDOperand OutOps[] = { Load, Store };
2795 return DAG.getNode(ISD::MERGE_VALUES, DAG.getVTList(VT, MVT::Other),
2796 OutOps, 2);
2797}
2798
2799SDOperand PPCTargetLowering::LowerAtomicSWAP(SDOperand Op, SelectionDAG &DAG) {
Evan Cheng0589b512008-04-19 02:30:38 +00002800 MVT::ValueType VT = Op.Val->getValueType(0);
Evan Cheng4df1f9d2008-04-19 01:30:48 +00002801 SDOperand Chain = Op.getOperand(0);
2802 SDOperand Ptr = Op.getOperand(1);
2803 SDOperand NewVal = Op.getOperand(2);
2804
2805 // Issue a "load and reserve".
2806 std::vector<MVT::ValueType> VTs;
2807 VTs.push_back(VT);
2808 VTs.push_back(MVT::Other);
2809
2810 SDOperand Label = DAG.getConstant(PPCAtomicLabelIndex++, MVT::i32);
2811 SDOperand Ops[] = {
Evan Cheng0589b512008-04-19 02:30:38 +00002812 Chain, // Chain
2813 Ptr, // Ptr
2814 Label, // Label
Evan Cheng4df1f9d2008-04-19 01:30:48 +00002815 };
Evan Cheng0589b512008-04-19 02:30:38 +00002816 SDOperand Load = DAG.getNode(PPCISD::LARX, VTs, Ops, 3);
Evan Cheng4df1f9d2008-04-19 01:30:48 +00002817 Chain = Load.getValue(1);
2818
2819 // Issue a "store and check".
2820 SDOperand Ops2[] = {
Evan Cheng0589b512008-04-19 02:30:38 +00002821 Chain, // Chain
2822 NewVal, // Value
2823 Ptr, // Ptr
2824 Label, // Label
Evan Cheng4df1f9d2008-04-19 01:30:48 +00002825 };
Evan Cheng0589b512008-04-19 02:30:38 +00002826 SDOperand Store = DAG.getNode(PPCISD::STCX, MVT::Other, Ops2, 4);
Evan Cheng4df1f9d2008-04-19 01:30:48 +00002827 SDOperand OutOps[] = { Load, Store };
2828 return DAG.getNode(ISD::MERGE_VALUES, DAG.getVTList(VT, MVT::Other),
2829 OutOps, 2);
2830}
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002831
2832/// LowerSELECT_CC - Lower a floating-point select_cc into an fsel
2833/// instruction when possible.
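// (fsel FRT,FRA,FRC,FRB computes FRT = (FRA >= 0.0) ? FRC : FRB, so a
// select_cc on "LHS setge RHS" maps onto fsel(LHS - RHS, TV, FV); the other
// orderings below are derived by swapping TV/FV and/or negating the input.)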
Dale Johannesen8be83a72008-03-04 23:17:14 +00002834SDOperand PPCTargetLowering::LowerSELECT_CC(SDOperand Op, SelectionDAG &DAG) {
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002835 // Not FP? Not a fsel.
2836 if (!MVT::isFloatingPoint(Op.getOperand(0).getValueType()) ||
2837 !MVT::isFloatingPoint(Op.getOperand(2).getValueType()))
2838 return SDOperand();
2839
2840 ISD::CondCode CC = cast<CondCodeSDNode>(Op.getOperand(4))->get();
2841
2842 // Cannot handle SETEQ/SETNE.
2843 if (CC == ISD::SETEQ || CC == ISD::SETNE) return SDOperand();
2844
2845 MVT::ValueType ResVT = Op.getValueType();
2846 MVT::ValueType CmpVT = Op.getOperand(0).getValueType();
2847 SDOperand LHS = Op.getOperand(0), RHS = Op.getOperand(1);
2848 SDOperand TV = Op.getOperand(2), FV = Op.getOperand(3);
2849
2850 // If the RHS of the comparison is a 0.0, we don't need to do the
2851 // subtraction at all.
2852 if (isFloatingPointZero(RHS))
2853 switch (CC) {
2854 default: break; // SETUO etc aren't handled by fsel.
2855 case ISD::SETULT:
2856 case ISD::SETOLT:
2857 case ISD::SETLT:
2858     std::swap(TV, FV);  // fsel is natively setge; swap so setlt uses the setge path
2859 case ISD::SETUGE:
2860 case ISD::SETOGE:
2861 case ISD::SETGE:
2862 if (LHS.getValueType() == MVT::f32) // Comparison is always 64-bits
2863 LHS = DAG.getNode(ISD::FP_EXTEND, MVT::f64, LHS);
2864 return DAG.getNode(PPCISD::FSEL, ResVT, LHS, TV, FV);
2865 case ISD::SETUGT:
2866 case ISD::SETOGT:
2867 case ISD::SETGT:
2868     std::swap(TV, FV);  // fsel is natively setge; swap so setgt uses the setle path
2869 case ISD::SETULE:
2870 case ISD::SETOLE:
2871 case ISD::SETLE:
2872 if (LHS.getValueType() == MVT::f32) // Comparison is always 64-bits
2873 LHS = DAG.getNode(ISD::FP_EXTEND, MVT::f64, LHS);
2874 return DAG.getNode(PPCISD::FSEL, ResVT,
2875 DAG.getNode(ISD::FNEG, MVT::f64, LHS), TV, FV);
2876 }
2877
Chris Lattnera216bee2007-10-15 20:14:52 +00002878 SDOperand Cmp;
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002879 switch (CC) {
2880 default: break; // SETUO etc aren't handled by fsel.
2881 case ISD::SETULT:
2882 case ISD::SETOLT:
2883 case ISD::SETLT:
2884 Cmp = DAG.getNode(ISD::FSUB, CmpVT, LHS, RHS);
2885 if (Cmp.getValueType() == MVT::f32) // Comparison is always 64-bits
2886 Cmp = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Cmp);
2887 return DAG.getNode(PPCISD::FSEL, ResVT, Cmp, FV, TV);
2888 case ISD::SETUGE:
2889 case ISD::SETOGE:
2890 case ISD::SETGE:
2891 Cmp = DAG.getNode(ISD::FSUB, CmpVT, LHS, RHS);
2892 if (Cmp.getValueType() == MVT::f32) // Comparison is always 64-bits
2893 Cmp = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Cmp);
2894 return DAG.getNode(PPCISD::FSEL, ResVT, Cmp, TV, FV);
2895 case ISD::SETUGT:
2896 case ISD::SETOGT:
2897 case ISD::SETGT:
2898 Cmp = DAG.getNode(ISD::FSUB, CmpVT, RHS, LHS);
2899 if (Cmp.getValueType() == MVT::f32) // Comparison is always 64-bits
2900 Cmp = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Cmp);
2901 return DAG.getNode(PPCISD::FSEL, ResVT, Cmp, FV, TV);
2902 case ISD::SETULE:
2903 case ISD::SETOLE:
2904 case ISD::SETLE:
2905 Cmp = DAG.getNode(ISD::FSUB, CmpVT, RHS, LHS);
2906 if (Cmp.getValueType() == MVT::f32) // Comparison is always 64-bits
2907 Cmp = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Cmp);
2908 return DAG.getNode(PPCISD::FSEL, ResVT, Cmp, TV, FV);
2909 }
2910 return SDOperand();
2911}
2912
Chris Lattner28771092007-11-28 18:44:47 +00002913// FIXME: Split this code up when LegalizeDAGTypes lands.
Dale Johannesen8be83a72008-03-04 23:17:14 +00002914SDOperand PPCTargetLowering::LowerFP_TO_SINT(SDOperand Op, SelectionDAG &DAG) {
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002915 assert(MVT::isFloatingPoint(Op.getOperand(0).getValueType()));
2916 SDOperand Src = Op.getOperand(0);
2917 if (Src.getValueType() == MVT::f32)
2918 Src = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Src);
2919
2920 SDOperand Tmp;
2921 switch (Op.getValueType()) {
2922 default: assert(0 && "Unhandled FP_TO_SINT type in custom expander!");
2923 case MVT::i32:
2924 Tmp = DAG.getNode(PPCISD::FCTIWZ, MVT::f64, Src);
2925 break;
2926 case MVT::i64:
2927 Tmp = DAG.getNode(PPCISD::FCTIDZ, MVT::f64, Src);
2928 break;
2929 }
2930
2931 // Convert the FP value to an int value through memory.
Chris Lattnera216bee2007-10-15 20:14:52 +00002932 SDOperand FIPtr = DAG.CreateStackTemporary(MVT::f64);
2933
2934 // Emit a store to the stack slot.
2935 SDOperand Chain = DAG.getStore(DAG.getEntryNode(), Tmp, FIPtr, NULL, 0);
2936
2937 // Result is a load from the stack slot. If loading 4 bytes, make sure to
2938 // add in a bias.
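  // (fctiwz leaves its 32-bit result in the low-order word of the f64 slot;
  // on big-endian PowerPC that word is at byte offset 4, hence the bias.)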
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002939 if (Op.getValueType() == MVT::i32)
Chris Lattnera216bee2007-10-15 20:14:52 +00002940 FIPtr = DAG.getNode(ISD::ADD, FIPtr.getValueType(), FIPtr,
2941 DAG.getConstant(4, FIPtr.getValueType()));
2942 return DAG.getLoad(Op.getValueType(), Chain, FIPtr, NULL, 0);
Dan Gohmanf17a25c2007-07-18 16:29:46 +00002943}
2944
Dale Johannesen8be83a72008-03-04 23:17:14 +00002945SDOperand PPCTargetLowering::LowerFP_ROUND_INREG(SDOperand Op,
2946 SelectionDAG &DAG) {
Dale Johannesen3d8578b2007-10-10 01:01:31 +00002947 assert(Op.getValueType() == MVT::ppcf128);
2948 SDNode *Node = Op.Val;
2949 assert(Node->getOperand(0).getValueType() == MVT::ppcf128);
Chris Lattnerc882caf2007-10-19 04:08:28 +00002950 assert(Node->getOperand(0).Val->getOpcode() == ISD::BUILD_PAIR);
Dale Johannesen3d8578b2007-10-10 01:01:31 +00002951 SDOperand Lo = Node->getOperand(0).Val->getOperand(0);
2952 SDOperand Hi = Node->getOperand(0).Val->getOperand(1);
2953
2954 // This sequence changes FPSCR to do round-to-zero, adds the two halves
2955 // of the long double, and puts FPSCR back the way it was. We do not
2956 // actually model FPSCR.
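  // Roughly: mffs saves the FPSCR, mtfsb1 31 and mtfsb0 30 force the
  // rounding-mode field to 0b01 (round toward zero), the FADDRTZ performs
  // the add under that mode, and mtfsf restores the saved FPSCR.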
2957 std::vector<MVT::ValueType> NodeTys;
2958 SDOperand Ops[4], Result, MFFSreg, InFlag, FPreg;
2959
2960 NodeTys.push_back(MVT::f64); // Return register
2961 NodeTys.push_back(MVT::Flag); // Returns a flag for later insns
2962 Result = DAG.getNode(PPCISD::MFFS, NodeTys, &InFlag, 0);
2963 MFFSreg = Result.getValue(0);
2964 InFlag = Result.getValue(1);
2965
2966 NodeTys.clear();
2967 NodeTys.push_back(MVT::Flag); // Returns a flag
2968 Ops[0] = DAG.getConstant(31, MVT::i32);
2969 Ops[1] = InFlag;
2970 Result = DAG.getNode(PPCISD::MTFSB1, NodeTys, Ops, 2);
2971 InFlag = Result.getValue(0);
2972
2973 NodeTys.clear();
2974 NodeTys.push_back(MVT::Flag); // Returns a flag
2975 Ops[0] = DAG.getConstant(30, MVT::i32);
2976 Ops[1] = InFlag;
2977 Result = DAG.getNode(PPCISD::MTFSB0, NodeTys, Ops, 2);
2978 InFlag = Result.getValue(0);
2979
2980 NodeTys.clear();
2981 NodeTys.push_back(MVT::f64); // result of add
2982 NodeTys.push_back(MVT::Flag); // Returns a flag
2983 Ops[0] = Lo;
2984 Ops[1] = Hi;
2985 Ops[2] = InFlag;
2986 Result = DAG.getNode(PPCISD::FADDRTZ, NodeTys, Ops, 3);
2987 FPreg = Result.getValue(0);
2988 InFlag = Result.getValue(1);
2989
2990 NodeTys.clear();
2991 NodeTys.push_back(MVT::f64);
2992 Ops[0] = DAG.getConstant(1, MVT::i32);
2993 Ops[1] = MFFSreg;
2994 Ops[2] = FPreg;
2995 Ops[3] = InFlag;
2996 Result = DAG.getNode(PPCISD::MTFSF, NodeTys, Ops, 4);
2997 FPreg = Result.getValue(0);
2998
2999 // We know the low half is about to be thrown away, so just use something
3000 // convenient.
3001 return DAG.getNode(ISD::BUILD_PAIR, Lo.getValueType(), FPreg, FPreg);
3002}
3003
Dale Johannesen8be83a72008-03-04 23:17:14 +00003004SDOperand PPCTargetLowering::LowerSINT_TO_FP(SDOperand Op, SelectionDAG &DAG) {
Dan Gohman8b232ff2008-03-11 01:59:03 +00003005 // Don't handle ppc_fp128 here; let it be lowered to a libcall.
3006 if (Op.getValueType() != MVT::f32 && Op.getValueType() != MVT::f64)
3007 return SDOperand();
3008
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003009 if (Op.getOperand(0).getValueType() == MVT::i64) {
3010 SDOperand Bits = DAG.getNode(ISD::BIT_CONVERT, MVT::f64, Op.getOperand(0));
3011 SDOperand FP = DAG.getNode(PPCISD::FCFID, MVT::f64, Bits);
3012 if (Op.getValueType() == MVT::f32)
Chris Lattner5872a362008-01-17 07:00:52 +00003013 FP = DAG.getNode(ISD::FP_ROUND, MVT::f32, FP, DAG.getIntPtrConstant(0));
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003014 return FP;
3015 }
3016
3017 assert(Op.getOperand(0).getValueType() == MVT::i32 &&
3018 "Unhandled SINT_TO_FP type in custom expander!");
3019 // Since we only generate this in 64-bit mode, we can take advantage of
3020 // 64-bit registers. In particular, sign extend the input value into the
3021 // 64-bit register with extsw, store the WHOLE 64-bit value into the stack
3022 // then lfd it and fcfid it.
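  // The emitted sequence is roughly:
  //   extsw rT, rSrc ; std rT, slot ; lfd fT, slot ; fcfid fD, fT
  // with a trailing frsp when the result type is f32.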
3023 MachineFrameInfo *FrameInfo = DAG.getMachineFunction().getFrameInfo();
3024 int FrameIdx = FrameInfo->CreateStackObject(8, 8);
3025 MVT::ValueType PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
3026 SDOperand FIdx = DAG.getFrameIndex(FrameIdx, PtrVT);
3027
3028 SDOperand Ext64 = DAG.getNode(PPCISD::EXTSW_32, MVT::i32,
3029 Op.getOperand(0));
3030
3031 // STD the extended value into the stack slot.
Dan Gohman1fad9e62008-04-07 19:35:22 +00003032 MachineMemOperand MO(PseudoSourceValue::getFixedStack(),
3033 MachineMemOperand::MOStore, FrameIdx, 8, 8);
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003034 SDOperand Store = DAG.getNode(PPCISD::STD_32, MVT::Other,
3035 DAG.getEntryNode(), Ext64, FIdx,
Dan Gohman12a9c082008-02-06 22:27:42 +00003036 DAG.getMemOperand(MO));
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003037 // Load the value as a double.
3038 SDOperand Ld = DAG.getLoad(MVT::f64, Store, FIdx, NULL, 0);
3039
3040 // FCFID it and return it.
3041 SDOperand FP = DAG.getNode(PPCISD::FCFID, MVT::f64, Ld);
3042 if (Op.getValueType() == MVT::f32)
Chris Lattner5872a362008-01-17 07:00:52 +00003043 FP = DAG.getNode(ISD::FP_ROUND, MVT::f32, FP, DAG.getIntPtrConstant(0));
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003044 return FP;
3045}
3046
Dale Johannesen8be83a72008-03-04 23:17:14 +00003047SDOperand PPCTargetLowering::LowerFLT_ROUNDS_(SDOperand Op, SelectionDAG &DAG) {
Dale Johannesen436e3802008-01-18 19:55:37 +00003048 /*
3049 The rounding mode is in bits 30:31 of FPSR, and has the following
3050 settings:
3051 00 Round to nearest
3052 01 Round to 0
3053 10 Round to +inf
3054 11 Round to -inf
3055
3056 FLT_ROUNDS, on the other hand, expects the following:
3057 -1 Undefined
3058 0 Round to 0
3059 1 Round to nearest
3060 2 Round to +inf
3061 3 Round to -inf
3062
3063 To perform the conversion, we do:
3064 ((FPSCR & 0x3) ^ ((~FPSCR & 0x3) >> 1))
3065 */
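  // Spot-checking the formula: FPSCR bits 0b00 (round to nearest) give
  // (0 ^ (3 >> 1)) = 1, and 0b01 (round to 0) give (1 ^ (2 >> 1)) = 0,
  // matching the FLT_ROUNDS encoding above.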
3066
3067 MachineFunction &MF = DAG.getMachineFunction();
3068 MVT::ValueType VT = Op.getValueType();
3069 MVT::ValueType PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
3070 std::vector<MVT::ValueType> NodeTys;
3071 SDOperand MFFSreg, InFlag;
3072
3073 // Save FP Control Word to register
3074 NodeTys.push_back(MVT::f64); // return register
3075 NodeTys.push_back(MVT::Flag); // unused in this context
3076 SDOperand Chain = DAG.getNode(PPCISD::MFFS, NodeTys, &InFlag, 0);
3077
3078 // Save FP register to stack slot
3079 int SSFI = MF.getFrameInfo()->CreateStackObject(8, 8);
3080 SDOperand StackSlot = DAG.getFrameIndex(SSFI, PtrVT);
3081 SDOperand Store = DAG.getStore(DAG.getEntryNode(), Chain,
3082 StackSlot, NULL, 0);
3083
3084 // Load FP Control Word from low 32 bits of stack slot.
3085 SDOperand Four = DAG.getConstant(4, PtrVT);
3086 SDOperand Addr = DAG.getNode(ISD::ADD, PtrVT, StackSlot, Four);
3087 SDOperand CWD = DAG.getLoad(MVT::i32, Store, Addr, NULL, 0);
3088
3089 // Transform as necessary
3090 SDOperand CWD1 =
3091 DAG.getNode(ISD::AND, MVT::i32,
3092 CWD, DAG.getConstant(3, MVT::i32));
3093 SDOperand CWD2 =
3094 DAG.getNode(ISD::SRL, MVT::i32,
3095 DAG.getNode(ISD::AND, MVT::i32,
3096 DAG.getNode(ISD::XOR, MVT::i32,
3097 CWD, DAG.getConstant(3, MVT::i32)),
3098 DAG.getConstant(3, MVT::i32)),
3099 DAG.getConstant(1, MVT::i8));
3100
3101 SDOperand RetVal =
3102 DAG.getNode(ISD::XOR, MVT::i32, CWD1, CWD2);
3103
3104 return DAG.getNode((MVT::getSizeInBits(VT) < 16 ?
3105 ISD::TRUNCATE : ISD::ZERO_EXTEND), VT, RetVal);
3106}
3107
Dale Johannesen8be83a72008-03-04 23:17:14 +00003108SDOperand PPCTargetLowering::LowerSHL_PARTS(SDOperand Op, SelectionDAG &DAG) {
Dan Gohman71619ec2008-03-07 20:36:53 +00003109 MVT::ValueType VT = Op.getValueType();
3110 unsigned BitWidth = MVT::getSizeInBits(VT);
3111 assert(Op.getNumOperands() == 3 &&
3112 VT == Op.getOperand(1).getValueType() &&
3113 "Unexpected SHL!");
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003114
3115 // Expand into a bunch of logical ops. Note that these ops
3116 // depend on the PPC behavior for oversized shift amounts.
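  // Concretely, OutHi = (Hi << Amt) | (Lo >> (BitWidth - Amt))
  //                   | (Lo << (Amt - BitWidth)).
  // PPC shifts by an amount in [BitWidth, 2*BitWidth) produce zero instead
  // of shifting modulo BitWidth, so exactly one of the last two terms
  // survives; e.g. with 32-bit parts and Amt == 40, OutHi = Lo << 8 and
  // OutLo = 0.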
3117 SDOperand Lo = Op.getOperand(0);
3118 SDOperand Hi = Op.getOperand(1);
3119 SDOperand Amt = Op.getOperand(2);
Dan Gohman71619ec2008-03-07 20:36:53 +00003120 MVT::ValueType AmtVT = Amt.getValueType();
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003121
Dan Gohman71619ec2008-03-07 20:36:53 +00003122 SDOperand Tmp1 = DAG.getNode(ISD::SUB, AmtVT,
3123 DAG.getConstant(BitWidth, AmtVT), Amt);
3124 SDOperand Tmp2 = DAG.getNode(PPCISD::SHL, VT, Hi, Amt);
3125 SDOperand Tmp3 = DAG.getNode(PPCISD::SRL, VT, Lo, Tmp1);
3126 SDOperand Tmp4 = DAG.getNode(ISD::OR , VT, Tmp2, Tmp3);
3127 SDOperand Tmp5 = DAG.getNode(ISD::ADD, AmtVT, Amt,
3128 DAG.getConstant(-BitWidth, AmtVT));
3129 SDOperand Tmp6 = DAG.getNode(PPCISD::SHL, VT, Lo, Tmp5);
3130 SDOperand OutHi = DAG.getNode(ISD::OR, VT, Tmp4, Tmp6);
3131 SDOperand OutLo = DAG.getNode(PPCISD::SHL, VT, Lo, Amt);
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003132 SDOperand OutOps[] = { OutLo, OutHi };
Dan Gohman71619ec2008-03-07 20:36:53 +00003133 return DAG.getNode(ISD::MERGE_VALUES, DAG.getVTList(VT, VT),
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003134 OutOps, 2);
3135}
3136
Dale Johannesen8be83a72008-03-04 23:17:14 +00003137SDOperand PPCTargetLowering::LowerSRL_PARTS(SDOperand Op, SelectionDAG &DAG) {
Dan Gohman71619ec2008-03-07 20:36:53 +00003138 MVT::ValueType VT = Op.getValueType();
3139 unsigned BitWidth = MVT::getSizeInBits(VT);
3140 assert(Op.getNumOperands() == 3 &&
3141 VT == Op.getOperand(1).getValueType() &&
3142 "Unexpected SRL!");
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003143
Dan Gohman71619ec2008-03-07 20:36:53 +00003144 // Expand into a bunch of logical ops. Note that these ops
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003145 // depend on the PPC behavior for oversized shift amounts.
3146 SDOperand Lo = Op.getOperand(0);
3147 SDOperand Hi = Op.getOperand(1);
3148 SDOperand Amt = Op.getOperand(2);
Dan Gohman71619ec2008-03-07 20:36:53 +00003149 MVT::ValueType AmtVT = Amt.getValueType();
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003150
Dan Gohman71619ec2008-03-07 20:36:53 +00003151 SDOperand Tmp1 = DAG.getNode(ISD::SUB, AmtVT,
3152 DAG.getConstant(BitWidth, AmtVT), Amt);
3153 SDOperand Tmp2 = DAG.getNode(PPCISD::SRL, VT, Lo, Amt);
3154 SDOperand Tmp3 = DAG.getNode(PPCISD::SHL, VT, Hi, Tmp1);
3155 SDOperand Tmp4 = DAG.getNode(ISD::OR , VT, Tmp2, Tmp3);
3156 SDOperand Tmp5 = DAG.getNode(ISD::ADD, AmtVT, Amt,
3157 DAG.getConstant(-BitWidth, AmtVT));
3158 SDOperand Tmp6 = DAG.getNode(PPCISD::SRL, VT, Hi, Tmp5);
3159 SDOperand OutLo = DAG.getNode(ISD::OR, VT, Tmp4, Tmp6);
3160 SDOperand OutHi = DAG.getNode(PPCISD::SRL, VT, Hi, Amt);
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003161 SDOperand OutOps[] = { OutLo, OutHi };
Dan Gohman71619ec2008-03-07 20:36:53 +00003162 return DAG.getNode(ISD::MERGE_VALUES, DAG.getVTList(VT, VT),
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003163 OutOps, 2);
3164}
3165
Dale Johannesen8be83a72008-03-04 23:17:14 +00003166SDOperand PPCTargetLowering::LowerSRA_PARTS(SDOperand Op, SelectionDAG &DAG) {
Dan Gohman71619ec2008-03-07 20:36:53 +00003167 MVT::ValueType VT = Op.getValueType();
3168 unsigned BitWidth = MVT::getSizeInBits(VT);
3169 assert(Op.getNumOperands() == 3 &&
3170 VT == Op.getOperand(1).getValueType() &&
3171 "Unexpected SRA!");
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003172
Dan Gohman71619ec2008-03-07 20:36:53 +00003173 // Expand into a bunch of logical ops, followed by a select_cc.
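  // A select is needed here, unlike SRL_PARTS, because sra with an
  // oversized amount sign-fills rather than zero-fills: for Amt > BitWidth
  // the low result must be sra(Hi, Amt - BitWidth), not an OR of pieces.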
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003174 SDOperand Lo = Op.getOperand(0);
3175 SDOperand Hi = Op.getOperand(1);
3176 SDOperand Amt = Op.getOperand(2);
Dan Gohman71619ec2008-03-07 20:36:53 +00003177 MVT::ValueType AmtVT = Amt.getValueType();
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003178
Dan Gohman71619ec2008-03-07 20:36:53 +00003179 SDOperand Tmp1 = DAG.getNode(ISD::SUB, AmtVT,
3180 DAG.getConstant(BitWidth, AmtVT), Amt);
3181 SDOperand Tmp2 = DAG.getNode(PPCISD::SRL, VT, Lo, Amt);
3182 SDOperand Tmp3 = DAG.getNode(PPCISD::SHL, VT, Hi, Tmp1);
3183 SDOperand Tmp4 = DAG.getNode(ISD::OR , VT, Tmp2, Tmp3);
3184 SDOperand Tmp5 = DAG.getNode(ISD::ADD, AmtVT, Amt,
3185 DAG.getConstant(-BitWidth, AmtVT));
3186 SDOperand Tmp6 = DAG.getNode(PPCISD::SRA, VT, Hi, Tmp5);
3187 SDOperand OutHi = DAG.getNode(PPCISD::SRA, VT, Hi, Amt);
3188 SDOperand OutLo = DAG.getSelectCC(Tmp5, DAG.getConstant(0, AmtVT),
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003189 Tmp4, Tmp6, ISD::SETLE);
3190 SDOperand OutOps[] = { OutLo, OutHi };
Dan Gohman71619ec2008-03-07 20:36:53 +00003191 return DAG.getNode(ISD::MERGE_VALUES, DAG.getVTList(VT, VT),
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003192 OutOps, 2);
3193}
3194
3195//===----------------------------------------------------------------------===//
3196// Vector related lowering.
3197//
3198
3199// If this is a vector of constants or undefs, get the bits. A bit in
3200// UndefBits is set if the corresponding element of the vector is an
3201// ISD::UNDEF value. For undefs, the corresponding VectorBits values are
3202// zero. Return true if this is not an array of constants, false if it is.
3203//
3204static bool GetConstantBuildVectorBits(SDNode *BV, uint64_t VectorBits[2],
3205 uint64_t UndefBits[2]) {
3206 // Start with zero'd results.
3207 VectorBits[0] = VectorBits[1] = UndefBits[0] = UndefBits[1] = 0;
3208
3209 unsigned EltBitSize = MVT::getSizeInBits(BV->getOperand(0).getValueType());
3210 for (unsigned i = 0, e = BV->getNumOperands(); i != e; ++i) {
3211 SDOperand OpVal = BV->getOperand(i);
3212
3213     unsigned PartNo = i >= e/2;     // Which uint64_t half of the 128 bits?
3214 unsigned SlotNo = e/2 - (i & (e/2-1))-1; // Which subpiece of the uint64_t.
3215
3216 uint64_t EltBits = 0;
3217 if (OpVal.getOpcode() == ISD::UNDEF) {
3218 uint64_t EltUndefBits = ~0U >> (32-EltBitSize);
3219 UndefBits[PartNo] |= EltUndefBits << (SlotNo*EltBitSize);
3220 continue;
3221 } else if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(OpVal)) {
3222 EltBits = CN->getValue() & (~0U >> (32-EltBitSize));
3223 } else if (ConstantFPSDNode *CN = dyn_cast<ConstantFPSDNode>(OpVal)) {
3224 assert(CN->getValueType(0) == MVT::f32 &&
3225 "Only one legal FP vector type!");
Dale Johannesendf8a8312007-08-31 04:03:46 +00003226 EltBits = FloatToBits(CN->getValueAPF().convertToFloat());
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003227 } else {
3228 // Nonconstant element.
3229 return true;
3230 }
3231
3232 VectorBits[PartNo] |= EltBits << (SlotNo*EltBitSize);
3233 }
3234
3235 //printf("%llx %llx %llx %llx\n",
3236 // VectorBits[0], VectorBits[1], UndefBits[0], UndefBits[1]);
3237 return false;
3238}
3239
3240// If this is a splat (repetition) of a value across the whole vector, return
3241// the smallest size that splats it. For example, "0x01010101010101..." is a
3242// splat of 0x01, 0x0101, and 0x01010101. We return SplatBits = 0x01 and
3243// SplatSize = 1 byte.
3244static bool isConstantSplat(const uint64_t Bits128[2],
3245 const uint64_t Undef128[2],
3246 unsigned &SplatBits, unsigned &SplatUndef,
3247 unsigned &SplatSize) {
3248
3249 // Don't let undefs prevent splats from matching. See if the top 64-bits are
3250 // the same as the lower 64-bits, ignoring undefs.
3251 if ((Bits128[0] & ~Undef128[1]) != (Bits128[1] & ~Undef128[0]))
3252 return false; // Can't be a splat if two pieces don't match.
3253
3254 uint64_t Bits64 = Bits128[0] | Bits128[1];
3255 uint64_t Undef64 = Undef128[0] & Undef128[1];
3256
3257 // Check that the top 32-bits are the same as the lower 32-bits, ignoring
3258 // undefs.
3259 if ((Bits64 & (~Undef64 >> 32)) != ((Bits64 >> 32) & ~Undef64))
3260 return false; // Can't be a splat if two pieces don't match.
3261
3262 uint32_t Bits32 = uint32_t(Bits64) | uint32_t(Bits64 >> 32);
3263 uint32_t Undef32 = uint32_t(Undef64) & uint32_t(Undef64 >> 32);
3264
3265   // If the top 16-bits are different from the lower 16-bits, ignoring
3266 // undefs, we have an i32 splat.
3267 if ((Bits32 & (~Undef32 >> 16)) != ((Bits32 >> 16) & ~Undef32)) {
3268 SplatBits = Bits32;
3269 SplatUndef = Undef32;
3270 SplatSize = 4;
3271 return true;
3272 }
3273
3274 uint16_t Bits16 = uint16_t(Bits32) | uint16_t(Bits32 >> 16);
3275 uint16_t Undef16 = uint16_t(Undef32) & uint16_t(Undef32 >> 16);
3276
3277   // If the top 8-bits are different from the lower 8-bits, ignoring
3278 // undefs, we have an i16 splat.
3279 if ((Bits16 & (uint16_t(~Undef16) >> 8)) != ((Bits16 >> 8) & ~Undef16)) {
3280 SplatBits = Bits16;
3281 SplatUndef = Undef16;
3282 SplatSize = 2;
3283 return true;
3284 }
3285
3286 // Otherwise, we have an 8-bit splat.
3287 SplatBits = uint8_t(Bits16) | uint8_t(Bits16 >> 8);
3288 SplatUndef = uint8_t(Undef16) & uint8_t(Undef16 >> 8);
3289 SplatSize = 1;
3290 return true;
3291}
3292
3293/// BuildSplatI - Build a canonical splati of Val with an element size of
3294/// SplatSize. Cast the result to VT.
3295static SDOperand BuildSplatI(int Val, unsigned SplatSize, MVT::ValueType VT,
3296 SelectionDAG &DAG) {
3297 assert(Val >= -16 && Val <= 15 && "vsplti is out of range!");
3298
3299 static const MVT::ValueType VTys[] = { // canonical VT to use for each size.
3300 MVT::v16i8, MVT::v8i16, MVT::Other, MVT::v4i32
3301 };
3302
3303 MVT::ValueType ReqVT = VT != MVT::Other ? VT : VTys[SplatSize-1];
3304
3305 // Force vspltis[hw] -1 to vspltisb -1 to canonicalize.
3306 if (Val == -1)
3307 SplatSize = 1;
3308
3309 MVT::ValueType CanonicalVT = VTys[SplatSize-1];
3310
3311 // Build a canonical splat for this value.
3312 SDOperand Elt = DAG.getConstant(Val, MVT::getVectorElementType(CanonicalVT));
3313 SmallVector<SDOperand, 8> Ops;
3314 Ops.assign(MVT::getVectorNumElements(CanonicalVT), Elt);
3315 SDOperand Res = DAG.getNode(ISD::BUILD_VECTOR, CanonicalVT,
3316 &Ops[0], Ops.size());
3317 return DAG.getNode(ISD::BIT_CONVERT, ReqVT, Res);
3318}
3319
3320/// BuildIntrinsicOp - Return a binary operator intrinsic node with the
3321/// specified intrinsic ID.
3322static SDOperand BuildIntrinsicOp(unsigned IID, SDOperand LHS, SDOperand RHS,
3323 SelectionDAG &DAG,
3324 MVT::ValueType DestVT = MVT::Other) {
3325 if (DestVT == MVT::Other) DestVT = LHS.getValueType();
3326 return DAG.getNode(ISD::INTRINSIC_WO_CHAIN, DestVT,
3327 DAG.getConstant(IID, MVT::i32), LHS, RHS);
3328}
3329
3330/// BuildIntrinsicOp - Return a ternary operator intrinsic node with the
3331/// specified intrinsic ID.
3332static SDOperand BuildIntrinsicOp(unsigned IID, SDOperand Op0, SDOperand Op1,
3333 SDOperand Op2, SelectionDAG &DAG,
3334 MVT::ValueType DestVT = MVT::Other) {
3335 if (DestVT == MVT::Other) DestVT = Op0.getValueType();
3336 return DAG.getNode(ISD::INTRINSIC_WO_CHAIN, DestVT,
3337 DAG.getConstant(IID, MVT::i32), Op0, Op1, Op2);
3338}
3339
3340
3341/// BuildVSLDOI - Return a VECTOR_SHUFFLE that is a vsldoi of the specified
3342/// amount. The result has the specified value type.
3343static SDOperand BuildVSLDOI(SDOperand LHS, SDOperand RHS, unsigned Amt,
3344 MVT::ValueType VT, SelectionDAG &DAG) {
3345 // Force LHS/RHS to be the right type.
3346 LHS = DAG.getNode(ISD::BIT_CONVERT, MVT::v16i8, LHS);
3347 RHS = DAG.getNode(ISD::BIT_CONVERT, MVT::v16i8, RHS);
3348
3349 SDOperand Ops[16];
3350 for (unsigned i = 0; i != 16; ++i)
3351 Ops[i] = DAG.getConstant(i+Amt, MVT::i32);
3352 SDOperand T = DAG.getNode(ISD::VECTOR_SHUFFLE, MVT::v16i8, LHS, RHS,
3353 DAG.getNode(ISD::BUILD_VECTOR, MVT::v16i8, Ops,16));
3354 return DAG.getNode(ISD::BIT_CONVERT, VT, T);
3355}
3356
3357// If this is a case we can't handle, return null and let the default
3358// expansion code take care of it. If we CAN select this case, and if it
3359// selects to a single instruction, return Op. Otherwise, if we can codegen
3360// this case more efficiently than a constant pool load, lower it to the
3361// sequence of ops that should be used.
Dale Johannesen8be83a72008-03-04 23:17:14 +00003362SDOperand PPCTargetLowering::LowerBUILD_VECTOR(SDOperand Op,
3363 SelectionDAG &DAG) {
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003364 // If this is a vector of constants or undefs, get the bits. A bit in
3365 // UndefBits is set if the corresponding element of the vector is an
3366 // ISD::UNDEF value. For undefs, the corresponding VectorBits values are
3367 // zero.
3368 uint64_t VectorBits[2];
3369 uint64_t UndefBits[2];
3370 if (GetConstantBuildVectorBits(Op.Val, VectorBits, UndefBits))
3371 return SDOperand(); // Not a constant vector.
3372
3373 // If this is a splat (repetition) of a value across the whole vector, return
3374 // the smallest size that splats it. For example, "0x01010101010101..." is a
3375 // splat of 0x01, 0x0101, and 0x01010101. We return SplatBits = 0x01 and
3376 // SplatSize = 1 byte.
3377 unsigned SplatBits, SplatUndef, SplatSize;
3378 if (isConstantSplat(VectorBits, UndefBits, SplatBits, SplatUndef, SplatSize)){
3379 bool HasAnyUndefs = (UndefBits[0] | UndefBits[1]) != 0;
3380
3381 // First, handle single instruction cases.
3382
3383 // All zeros?
3384 if (SplatBits == 0) {
3385 // Canonicalize all zero vectors to be v4i32.
3386 if (Op.getValueType() != MVT::v4i32 || HasAnyUndefs) {
3387 SDOperand Z = DAG.getConstant(0, MVT::i32);
3388 Z = DAG.getNode(ISD::BUILD_VECTOR, MVT::v4i32, Z, Z, Z, Z);
3389 Op = DAG.getNode(ISD::BIT_CONVERT, Op.getValueType(), Z);
3390 }
3391 return Op;
3392 }
3393
3394 // If the sign extended value is in the range [-16,15], use VSPLTI[bhw].
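    // (e.g. with SplatSize == 1, SplatBits == 0xF0 sign-extends to -16,
    // which a single vspltisb can materialize.)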
3395 int32_t SextVal= int32_t(SplatBits << (32-8*SplatSize)) >> (32-8*SplatSize);
3396 if (SextVal >= -16 && SextVal <= 15)
3397 return BuildSplatI(SextVal, SplatSize, Op.getValueType(), DAG);
3398
3399
3400 // Two instruction sequences.
3401
3402 // If this value is in the range [-32,30] and is even, use:
3403 // tmp = VSPLTI[bhw], result = add tmp, tmp
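    // (e.g. a splat of 24 becomes vspltisb 12 followed by a vaddubm of the
    // result with itself.)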
3404 if (SextVal >= -32 && SextVal <= 30 && (SextVal & 1) == 0) {
3405 Op = BuildSplatI(SextVal >> 1, SplatSize, Op.getValueType(), DAG);
3406 return DAG.getNode(ISD::ADD, Op.getValueType(), Op, Op);
3407 }
3408
3409 // If this is 0x8000_0000 x 4, turn into vspltisw + vslw. If it is
3410 // 0x7FFF_FFFF x 4, turn it into not(0x8000_0000). This is important
3411 // for fneg/fabs.
3412 if (SplatSize == 4 && SplatBits == (0x7FFFFFFF&~SplatUndef)) {
3413       // Make an all-ones vector with vspltisw -1:
3414 SDOperand OnesV = BuildSplatI(-1, 4, MVT::v4i32, DAG);
3415
3416 // Make the VSLW intrinsic, computing 0x8000_0000.
3417 SDOperand Res = BuildIntrinsicOp(Intrinsic::ppc_altivec_vslw, OnesV,
3418 OnesV, DAG);
3419
3420 // xor by OnesV to invert it.
3421 Res = DAG.getNode(ISD::XOR, MVT::v4i32, Res, OnesV);
3422 return DAG.getNode(ISD::BIT_CONVERT, Op.getValueType(), Res);
3423 }
3424
3425 // Check to see if this is a wide variety of vsplti*, binop self cases.
3426 unsigned SplatBitSize = SplatSize*8;
3427 static const signed char SplatCsts[] = {
3428 -1, 1, -2, 2, -3, 3, -4, 4, -5, 5, -6, 6, -7, 7,
3429 -8, 8, -9, 9, -10, 10, -11, 11, -12, 12, -13, 13, 14, -14, 15, -15, -16
3430 };
3431
Owen Anderson1636de92007-09-07 04:06:50 +00003432 for (unsigned idx = 0; idx < array_lengthof(SplatCsts); ++idx) {
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003433 // Indirect through the SplatCsts array so that we favor 'vsplti -1' for
3434 // cases which are ambiguous (e.g. formation of 0x8000_0000). 'vsplti -1'
3435 int i = SplatCsts[idx];
3436
3437 // Figure out what shift amount will be used by altivec if shifted by i in
3438 // this splat size.
3439 unsigned TypeShiftAmt = i & (SplatBitSize-1);
3440
3441 // vsplti + shl self.
3442 if (SextVal == (i << (int)TypeShiftAmt)) {
3443 SDOperand Res = BuildSplatI(i, SplatSize, MVT::Other, DAG);
3444 static const unsigned IIDs[] = { // Intrinsic to use for each size.
3445 Intrinsic::ppc_altivec_vslb, Intrinsic::ppc_altivec_vslh, 0,
3446 Intrinsic::ppc_altivec_vslw
3447 };
3448 Res = BuildIntrinsicOp(IIDs[SplatSize-1], Res, Res, DAG);
3449 return DAG.getNode(ISD::BIT_CONVERT, Op.getValueType(), Res);
3450 }
3451
3452 // vsplti + srl self.
3453 if (SextVal == (int)((unsigned)i >> TypeShiftAmt)) {
3454 SDOperand Res = BuildSplatI(i, SplatSize, MVT::Other, DAG);
3455 static const unsigned IIDs[] = { // Intrinsic to use for each size.
3456 Intrinsic::ppc_altivec_vsrb, Intrinsic::ppc_altivec_vsrh, 0,
3457 Intrinsic::ppc_altivec_vsrw
3458 };
3459 Res = BuildIntrinsicOp(IIDs[SplatSize-1], Res, Res, DAG);
3460 return DAG.getNode(ISD::BIT_CONVERT, Op.getValueType(), Res);
3461 }
3462
3463 // vsplti + sra self.
3464 if (SextVal == (int)((unsigned)i >> TypeShiftAmt)) {
3465 SDOperand Res = BuildSplatI(i, SplatSize, MVT::Other, DAG);
3466 static const unsigned IIDs[] = { // Intrinsic to use for each size.
3467 Intrinsic::ppc_altivec_vsrab, Intrinsic::ppc_altivec_vsrah, 0,
3468 Intrinsic::ppc_altivec_vsraw
3469 };
3470 Res = BuildIntrinsicOp(IIDs[SplatSize-1], Res, Res, DAG);
3471 return DAG.getNode(ISD::BIT_CONVERT, Op.getValueType(), Res);
3472 }
3473
3474 // vsplti + rol self.
3475 if (SextVal == (int)(((unsigned)i << TypeShiftAmt) |
3476 ((unsigned)i >> (SplatBitSize-TypeShiftAmt)))) {
3477 SDOperand Res = BuildSplatI(i, SplatSize, MVT::Other, DAG);
3478 static const unsigned IIDs[] = { // Intrinsic to use for each size.
3479 Intrinsic::ppc_altivec_vrlb, Intrinsic::ppc_altivec_vrlh, 0,
3480 Intrinsic::ppc_altivec_vrlw
3481 };
3482 Res = BuildIntrinsicOp(IIDs[SplatSize-1], Res, Res, DAG);
3483 return DAG.getNode(ISD::BIT_CONVERT, Op.getValueType(), Res);
3484 }
3485
3486 // t = vsplti c, result = vsldoi t, t, 1
3487 if (SextVal == ((i << 8) | (i >> (TypeShiftAmt-8)))) {
3488 SDOperand T = BuildSplatI(i, SplatSize, MVT::v16i8, DAG);
3489 return BuildVSLDOI(T, T, 1, Op.getValueType(), DAG);
3490 }
3491 // t = vsplti c, result = vsldoi t, t, 2
3492 if (SextVal == ((i << 16) | (i >> (TypeShiftAmt-16)))) {
3493 SDOperand T = BuildSplatI(i, SplatSize, MVT::v16i8, DAG);
3494 return BuildVSLDOI(T, T, 2, Op.getValueType(), DAG);
3495 }
3496 // t = vsplti c, result = vsldoi t, t, 3
3497 if (SextVal == ((i << 24) | (i >> (TypeShiftAmt-24)))) {
3498 SDOperand T = BuildSplatI(i, SplatSize, MVT::v16i8, DAG);
3499 return BuildVSLDOI(T, T, 3, Op.getValueType(), DAG);
3500 }
3501 }
3502
3503 // Three instruction sequences.
3504
3505 // Odd, in range [17,31]: (vsplti C)-(vsplti -16).
3506 if (SextVal >= 0 && SextVal <= 31) {
3507 SDOperand LHS = BuildSplatI(SextVal-16, SplatSize, MVT::Other, DAG);
3508 SDOperand RHS = BuildSplatI(-16, SplatSize, MVT::Other, DAG);
Dale Johannesen6fdf9312007-10-14 01:58:32 +00003509 LHS = DAG.getNode(ISD::SUB, LHS.getValueType(), LHS, RHS);
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003510 return DAG.getNode(ISD::BIT_CONVERT, Op.getValueType(), LHS);
3511 }
3512 // Odd, in range [-31,-17]: (vsplti C)+(vsplti -16).
3513 if (SextVal >= -31 && SextVal <= 0) {
3514 SDOperand LHS = BuildSplatI(SextVal+16, SplatSize, MVT::Other, DAG);
3515 SDOperand RHS = BuildSplatI(-16, SplatSize, MVT::Other, DAG);
Dale Johannesen6fdf9312007-10-14 01:58:32 +00003516 LHS = DAG.getNode(ISD::ADD, LHS.getValueType(), LHS, RHS);
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003517 return DAG.getNode(ISD::BIT_CONVERT, Op.getValueType(), LHS);
3518 }
3519 }
3520
3521 return SDOperand();
3522}
3523
3524/// GeneratePerfectShuffle - Given an entry in the perfect-shuffle table, emit
3525/// the specified operations to build the shuffle.
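/// Each 32-bit table entry packs a cost in bits 31:30, an opcode in bits
/// 29:26, and two 13-bit indices (bits 25:13 and 12:0) that recursively
/// name the table entries producing the left and right inputs.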
3526static SDOperand GeneratePerfectShuffle(unsigned PFEntry, SDOperand LHS,
3527 SDOperand RHS, SelectionDAG &DAG) {
3528 unsigned OpNum = (PFEntry >> 26) & 0x0F;
3529 unsigned LHSID = (PFEntry >> 13) & ((1 << 13)-1);
3530 unsigned RHSID = (PFEntry >> 0) & ((1 << 13)-1);
3531
3532 enum {
3533 OP_COPY = 0, // Copy, used for things like <u,u,u,3> to say it is <0,1,2,3>
3534 OP_VMRGHW,
3535 OP_VMRGLW,
3536 OP_VSPLTISW0,
3537 OP_VSPLTISW1,
3538 OP_VSPLTISW2,
3539 OP_VSPLTISW3,
3540 OP_VSLDOI4,
3541 OP_VSLDOI8,
3542 OP_VSLDOI12
3543 };
3544
3545 if (OpNum == OP_COPY) {
3546 if (LHSID == (1*9+2)*9+3) return LHS;
3547 assert(LHSID == ((4*9+5)*9+6)*9+7 && "Illegal OP_COPY!");
3548 return RHS;
3549 }
3550
3551 SDOperand OpLHS, OpRHS;
3552 OpLHS = GeneratePerfectShuffle(PerfectShuffleTable[LHSID], LHS, RHS, DAG);
3553 OpRHS = GeneratePerfectShuffle(PerfectShuffleTable[RHSID], LHS, RHS, DAG);
3554
3555 unsigned ShufIdxs[16];
3556 switch (OpNum) {
3557 default: assert(0 && "Unknown i32 permute!");
3558 case OP_VMRGHW:
3559 ShufIdxs[ 0] = 0; ShufIdxs[ 1] = 1; ShufIdxs[ 2] = 2; ShufIdxs[ 3] = 3;
3560 ShufIdxs[ 4] = 16; ShufIdxs[ 5] = 17; ShufIdxs[ 6] = 18; ShufIdxs[ 7] = 19;
3561 ShufIdxs[ 8] = 4; ShufIdxs[ 9] = 5; ShufIdxs[10] = 6; ShufIdxs[11] = 7;
3562 ShufIdxs[12] = 20; ShufIdxs[13] = 21; ShufIdxs[14] = 22; ShufIdxs[15] = 23;
3563 break;
3564 case OP_VMRGLW:
3565 ShufIdxs[ 0] = 8; ShufIdxs[ 1] = 9; ShufIdxs[ 2] = 10; ShufIdxs[ 3] = 11;
3566 ShufIdxs[ 4] = 24; ShufIdxs[ 5] = 25; ShufIdxs[ 6] = 26; ShufIdxs[ 7] = 27;
3567 ShufIdxs[ 8] = 12; ShufIdxs[ 9] = 13; ShufIdxs[10] = 14; ShufIdxs[11] = 15;
3568 ShufIdxs[12] = 28; ShufIdxs[13] = 29; ShufIdxs[14] = 30; ShufIdxs[15] = 31;
3569 break;
3570 case OP_VSPLTISW0:
3571 for (unsigned i = 0; i != 16; ++i)
3572 ShufIdxs[i] = (i&3)+0;
3573 break;
3574 case OP_VSPLTISW1:
3575 for (unsigned i = 0; i != 16; ++i)
3576 ShufIdxs[i] = (i&3)+4;
3577 break;
3578 case OP_VSPLTISW2:
3579 for (unsigned i = 0; i != 16; ++i)
3580 ShufIdxs[i] = (i&3)+8;
3581 break;
3582 case OP_VSPLTISW3:
3583 for (unsigned i = 0; i != 16; ++i)
3584 ShufIdxs[i] = (i&3)+12;
3585 break;
3586 case OP_VSLDOI4:
3587 return BuildVSLDOI(OpLHS, OpRHS, 4, OpLHS.getValueType(), DAG);
3588 case OP_VSLDOI8:
3589 return BuildVSLDOI(OpLHS, OpRHS, 8, OpLHS.getValueType(), DAG);
3590 case OP_VSLDOI12:
3591 return BuildVSLDOI(OpLHS, OpRHS, 12, OpLHS.getValueType(), DAG);
3592 }
3593 SDOperand Ops[16];
3594 for (unsigned i = 0; i != 16; ++i)
3595 Ops[i] = DAG.getConstant(ShufIdxs[i], MVT::i32);
3596
3597 return DAG.getNode(ISD::VECTOR_SHUFFLE, OpLHS.getValueType(), OpLHS, OpRHS,
3598 DAG.getNode(ISD::BUILD_VECTOR, MVT::v16i8, Ops, 16));
3599}
3600
3601/// LowerVECTOR_SHUFFLE - Return the code we lower for VECTOR_SHUFFLE. If this
3602/// is a shuffle we can handle in a single instruction, return it. Otherwise,
3603/// return the code it can be lowered into. Worst case, it can always be
3604/// lowered into a vperm.
Dale Johannesen8be83a72008-03-04 23:17:14 +00003605SDOperand PPCTargetLowering::LowerVECTOR_SHUFFLE(SDOperand Op,
3606 SelectionDAG &DAG) {
Dan Gohmanf17a25c2007-07-18 16:29:46 +00003607 SDOperand V1 = Op.getOperand(0);
3608 SDOperand V2 = Op.getOperand(1);
3609 SDOperand PermMask = Op.getOperand(2);
3610
3611 // Cases that are handled by instructions that take permute immediates
3612 // (such as vsplt*) should be left as VECTOR_SHUFFLE nodes so they can be
3613 // selected by the instruction selector.
3614 if (V2.getOpcode() == ISD::UNDEF) {
3615 if (PPC::isSplatShuffleMask(PermMask.Val, 1) ||
3616 PPC::isSplatShuffleMask(PermMask.Val, 2) ||
3617 PPC::isSplatShuffleMask(PermMask.Val, 4) ||
3618 PPC::isVPKUWUMShuffleMask(PermMask.Val, true) ||
3619 PPC::isVPKUHUMShuffleMask(PermMask.Val, true) ||
3620 PPC::isVSLDOIShuffleMask(PermMask.Val, true) != -1 ||
3621 PPC::isVMRGLShuffleMask(PermMask.Val, 1, true) ||
3622 PPC::isVMRGLShuffleMask(PermMask.Val, 2, true) ||
3623 PPC::isVMRGLShuffleMask(PermMask.Val, 4, true) ||
3624 PPC::isVMRGHShuffleMask(PermMask.Val, 1, true) ||
3625 PPC::isVMRGHShuffleMask(PermMask.Val, 2, true) ||
3626 PPC::isVMRGHShuffleMask(PermMask.Val, 4, true)) {
3627 return Op;
3628 }
3629 }
3630
3631 // Altivec has a variety of "shuffle immediates" that take two vector inputs
3632 // and produce a fixed permutation. If any of these match, do not lower to
3633 // VPERM.
3634 if (PPC::isVPKUWUMShuffleMask(PermMask.Val, false) ||
3635 PPC::isVPKUHUMShuffleMask(PermMask.Val, false) ||
3636 PPC::isVSLDOIShuffleMask(PermMask.Val, false) != -1 ||
3637 PPC::isVMRGLShuffleMask(PermMask.Val, 1, false) ||
3638 PPC::isVMRGLShuffleMask(PermMask.Val, 2, false) ||
3639 PPC::isVMRGLShuffleMask(PermMask.Val, 4, false) ||
3640 PPC::isVMRGHShuffleMask(PermMask.Val, 1, false) ||
3641 PPC::isVMRGHShuffleMask(PermMask.Val, 2, false) ||
3642 PPC::isVMRGHShuffleMask(PermMask.Val, 4, false))
3643 return Op;
3644
3645 // Check to see if this is a shuffle of 4-byte values. If so, we can use our
3646 // perfect shuffle table to emit an optimal matching sequence.
3647 unsigned PFIndexes[4];
3648 bool isFourElementShuffle = true;
3649 for (unsigned i = 0; i != 4 && isFourElementShuffle; ++i) { // Element number
3650 unsigned EltNo = 8; // Start out undef.
3651 for (unsigned j = 0; j != 4; ++j) { // Intra-element byte.
3652 if (PermMask.getOperand(i*4+j).getOpcode() == ISD::UNDEF)
3653 continue; // Undef, ignore it.
3654
3655 unsigned ByteSource =
3656 cast<ConstantSDNode>(PermMask.getOperand(i*4+j))->getValue();
3657 if ((ByteSource & 3) != j) {
3658 isFourElementShuffle = false;
3659 break;
3660 }
3661
3662 if (EltNo == 8) {
3663 EltNo = ByteSource/4;
3664 } else if (EltNo != ByteSource/4) {
3665 isFourElementShuffle = false;
3666 break;
3667 }
3668 }
3669 PFIndexes[i] = EltNo;
3670 }
3671
3672 // If this shuffle can be expressed as a shuffle of 4-byte elements, use the
3673 // perfect shuffle vector to determine if it is cost effective to do this as
3674 // discrete instructions, or whether we should use a vperm.
3675 if (isFourElementShuffle) {
3676 // Compute the index in the perfect shuffle table.
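    // Each PFIndexes[i] is in [0,8] (8 meaning undef), so the four indices
    // pack into the table index as a base-9 number.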
3677 unsigned PFTableIndex =
3678 PFIndexes[0]*9*9*9+PFIndexes[1]*9*9+PFIndexes[2]*9+PFIndexes[3];
3679
3680 unsigned PFEntry = PerfectShuffleTable[PFTableIndex];
3681 unsigned Cost = (PFEntry >> 30);
3682
3683 // Determining when to avoid vperm is tricky. Many things affect the cost
3684 // of vperm, particularly how many times the perm mask needs to be computed.
3685 // For example, if the perm mask can be hoisted out of a loop or is already
3686 // used (perhaps because there are multiple permutes with the same shuffle
3687 // mask?) the vperm has a cost of 1. OTOH, hoisting the permute mask out of
3688 // the loop requires an extra register.
3689 //
3690 // As a compromise, we only emit discrete instructions if the shuffle can be
3691 // generated in 3 or fewer operations. When we have loop information
3692 // available, if this block is within a loop, we should avoid using vperm
3693 // for 3-operation perms and use a constant pool load instead.
3694 if (Cost < 3)
3695 return GeneratePerfectShuffle(PFEntry, V1, V2, DAG);
3696 }
3697
3698 // Lower this to a VPERM(V1, V2, V3) expression, where V3 is a constant
3699 // vector that will get spilled to the constant pool.
3700 if (V2.getOpcode() == ISD::UNDEF) V2 = V1;
3701
3702 // The SHUFFLE_VECTOR mask is almost exactly what we want for vperm, except
3703 // that it is in input element units, not in bytes. Convert now.
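  // (e.g. for v4i32, a mask element of 1 expands to byte indices 4,5,6,7.)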
3704 MVT::ValueType EltVT = MVT::getVectorElementType(V1.getValueType());
3705 unsigned BytesPerElement = MVT::getSizeInBits(EltVT)/8;
3706
3707 SmallVector<SDOperand, 16> ResultMask;
3708 for (unsigned i = 0, e = PermMask.getNumOperands(); i != e; ++i) {
3709 unsigned SrcElt;
3710 if (PermMask.getOperand(i).getOpcode() == ISD::UNDEF)
3711 SrcElt = 0;
3712 else
3713 SrcElt = cast<ConstantSDNode>(PermMask.getOperand(i))->getValue();
3714
3715 for (unsigned j = 0; j != BytesPerElement; ++j)
3716 ResultMask.push_back(DAG.getConstant(SrcElt*BytesPerElement+j,
3717 MVT::i8));
3718 }
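  // Illustrative example (not from the original source): for a v4i32 shuffle
  // whose mask entry selects element 5, BytesPerElement is 4, so bytes 20,
  // 21, 22, and 23 are pushed onto ResultMask, which is exactly the
  // byte-granularity mask that vperm consumes.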

  SDOperand VPermMask = DAG.getNode(ISD::BUILD_VECTOR, MVT::v16i8,
                                    &ResultMask[0], ResultMask.size());
  return DAG.getNode(PPCISD::VPERM, V1.getValueType(), V1, V2, VPermMask);
}

/// getAltivecCompareInfo - Given an intrinsic, return false if it is not an
/// altivec comparison.  If it is, return true and fill in CompareOpc/isDot
/// with information about the intrinsic.
static bool getAltivecCompareInfo(SDOperand Intrin, int &CompareOpc,
                                  bool &isDot) {
  unsigned IntrinsicID = cast<ConstantSDNode>(Intrin.getOperand(0))->getValue();
  CompareOpc = -1;
  isDot = false;
  switch (IntrinsicID) {
  default: return false;
  // Comparison predicates.
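  // (Illustrative note, not from the original source: the _p intrinsics map
  // to the record ("dot") forms of the vcmp* instructions, which also set
  // CR6; isDot reports that so callers can read the predicate out of CR6.)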
  case Intrinsic::ppc_altivec_vcmpbfp_p:  CompareOpc = 966; isDot = 1; break;
  case Intrinsic::ppc_altivec_vcmpeqfp_p: CompareOpc = 198; isDot = 1; break;
  case Intrinsic::ppc_altivec_vcmpequb_p: CompareOpc =   6; isDot = 1; break;
  case Intrinsic::ppc_altivec_vcmpequh_p: CompareOpc =  70; isDot = 1; break;
  case Intrinsic::ppc_altivec_vcmpequw_p: CompareOpc = 134; isDot = 1; break;
  case Intrinsic::ppc_altivec_vcmpgefp_p: CompareOpc = 454; isDot = 1; break;
  case Intrinsic::ppc_altivec_vcmpgtfp_p: CompareOpc = 710; isDot = 1; break;
  case Intrinsic::ppc_altivec_vcmpgtsb_p: CompareOpc = 774; isDot = 1; break;
  case Intrinsic::ppc_altivec_vcmpgtsh_p: CompareOpc = 838; isDot = 1; break;
  case Intrinsic::ppc_altivec_vcmpgtsw_p: CompareOpc = 902; isDot = 1; break;
  case Intrinsic::ppc_altivec_vcmpgtub_p: CompareOpc = 518; isDot = 1; break;
  case Intrinsic::ppc_altivec_vcmpgtuh_p: CompareOpc = 582; isDot = 1; break;
  case Intrinsic::ppc_altivec_vcmpgtuw_p: CompareOpc = 646; isDot = 1; break;

  // Normal comparisons.
  case Intrinsic::ppc_altivec_vcmpbfp:    CompareOpc = 966; isDot = 0; break;
  case Intrinsic::ppc_altivec_vcmpeqfp:   CompareOpc = 198; isDot = 0; break;
  case Intrinsic::ppc_altivec_vcmpequb:   CompareOpc =   6; isDot = 0; break;
  case Intrinsic::ppc_altivec_vcmpequh:   CompareOpc =  70; isDot = 0; break;
  case Intrinsic::ppc_altivec_vcmpequw:   CompareOpc = 134; isDot = 0; break;
  case Intrinsic::ppc_altivec_vcmpgefp:   CompareOpc = 454; isDot = 0; break;
  case Intrinsic::ppc_altivec_vcmpgtfp:   CompareOpc = 710; isDot = 0; break;
  case Intrinsic::ppc_altivec_vcmpgtsb:   CompareOpc = 774; isDot = 0; break;
  case Intrinsic::ppc_altivec_vcmpgtsh:   CompareOpc = 838; isDot = 0; break;
  case Intrinsic::ppc_altivec_vcmpgtsw:   CompareOpc = 902; isDot = 0; break;
  case Intrinsic::ppc_altivec_vcmpgtub:   CompareOpc = 518; isDot = 0; break;
  case Intrinsic::ppc_altivec_vcmpgtuh:   CompareOpc = 582; isDot = 0; break;
  case Intrinsic::ppc_altivec_vcmpgtuw:   CompareOpc = 646; isDot = 0; break;
  }
  return true;
}

/// LowerINTRINSIC_WO_CHAIN - If this is an intrinsic that we want to custom
/// lower, do it, otherwise return null.
SDOperand PPCTargetLowering::LowerINTRINSIC_WO_CHAIN(SDOperand Op,
                                                     SelectionDAG &DAG) {
  // If this is a lowered altivec predicate compare, CompareOpc is set to the
  // opcode number of the comparison.
  int CompareOpc;
  bool isDot;
  if (!getAltivecCompareInfo(Op, CompareOpc, isDot))
    return SDOperand();   // Don't custom lower most intrinsics.

  // If this is a non-dot comparison, make the VCMP node and we are done.
  if (!isDot) {
    SDOperand Tmp = DAG.getNode(PPCISD::VCMP, Op.getOperand(2).getValueType(),
                                Op.getOperand(1), Op.getOperand(2),
                                DAG.getConstant(CompareOpc, MVT::i32));
    return DAG.getNode(ISD::BIT_CONVERT, Op.getValueType(), Tmp);
  }

  // Create the PPCISD altivec 'dot' comparison node.
  SDOperand Ops[] = {
    Op.getOperand(2),   // LHS
    Op.getOperand(3),   // RHS
    DAG.getConstant(CompareOpc, MVT::i32)
  };
  std::vector<MVT::ValueType> VTs;
  VTs.push_back(Op.getOperand(2).getValueType());
  VTs.push_back(MVT::Flag);
  SDOperand CompNode = DAG.getNode(PPCISD::VCMPo, VTs, Ops, 3);

  // Now that we have the comparison, emit a copy from the CR to a GPR.
  // This is flagged to the above dot comparison.
  SDOperand Flags = DAG.getNode(PPCISD::MFCR, MVT::i32,
                                DAG.getRegister(PPC::CR6, MVT::i32),
                                CompNode.getValue(1));

  // Unpack the result based on how the target uses it.
  unsigned BitNo;   // Bit # of CR6.
  bool InvertBit;   // Invert result?
  switch (cast<ConstantSDNode>(Op.getOperand(1))->getValue()) {
  default:  // Can't happen, don't crash on invalid number though.
  case 0:   // Return the value of the EQ bit of CR6.
    BitNo = 0; InvertBit = false;
    break;
  case 1:   // Return the inverted value of the EQ bit of CR6.
    BitNo = 0; InvertBit = true;
    break;
  case 2:   // Return the value of the LT bit of CR6.
    BitNo = 2; InvertBit = false;
    break;
  case 3:   // Return the inverted value of the LT bit of CR6.
    BitNo = 2; InvertBit = true;
    break;
  }

  // Shift the bit into the low position.
  Flags = DAG.getNode(ISD::SRL, MVT::i32, Flags,
                      DAG.getConstant(8-(3-BitNo), MVT::i32));
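  // Illustrative arithmetic (not from the original source): for BitNo == 0
  // the shift amount is 8-(3-0) == 5, and for BitNo == 2 it is 8-(3-2) == 7,
  // bringing the selected CR6 bit down to bit 0 before it is masked below.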
  // Isolate the bit.
  Flags = DAG.getNode(ISD::AND, MVT::i32, Flags,
                      DAG.getConstant(1, MVT::i32));

  // If we are supposed to, toggle the bit.
  if (InvertBit)
    Flags = DAG.getNode(ISD::XOR, MVT::i32, Flags,
                        DAG.getConstant(1, MVT::i32));
  return Flags;
}

SDOperand PPCTargetLowering::LowerSCALAR_TO_VECTOR(SDOperand Op,
                                                   SelectionDAG &DAG) {
  // Create a stack slot that is 16-byte aligned.
  MachineFrameInfo *FrameInfo = DAG.getMachineFunction().getFrameInfo();
  int FrameIdx = FrameInfo->CreateStackObject(16, 16);
  MVT::ValueType PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
  SDOperand FIdx = DAG.getFrameIndex(FrameIdx, PtrVT);

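  // Illustrative note (not from the original source): SCALAR_TO_VECTOR only
  // defines element 0 of its result, and the remaining lanes may hold
  // garbage, so a scalar store followed by a full 16-byte vector load from
  // the same aligned slot is a legal lowering.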
  // Store the input value into element 0 of the stack slot.
  SDOperand Store = DAG.getStore(DAG.getEntryNode(),
                                 Op.getOperand(0), FIdx, NULL, 0);
  // Load it out.
  return DAG.getLoad(Op.getValueType(), Store, FIdx, NULL, 0);
}

SDOperand PPCTargetLowering::LowerMUL(SDOperand Op, SelectionDAG &DAG) {
  if (Op.getValueType() == MVT::v4i32) {
    SDOperand LHS = Op.getOperand(0), RHS = Op.getOperand(1);

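    // Illustrative identity (not from the original source): writing each
    // 32-bit lane as x = x_hi*2^16 + x_lo, the product modulo 2^32 is
    //   x*y = x_lo*y_lo + ((x_hi*y_lo + x_lo*y_hi) << 16).
    // vmulouh computes the x_lo*y_lo terms, and vmsumuhm applied to LHS and
    // the halfword-swapped RHS accumulates the two cross terms.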
    SDOperand Zero  = BuildSplatI( 0, 1, MVT::v4i32, DAG);
    SDOperand Neg16 = BuildSplatI(-16, 4, MVT::v4i32, DAG); // -16 wraps to +16
                                                            // as a shift amt.
    SDOperand RHSSwap =   // = vrlw RHS, 16
      BuildIntrinsicOp(Intrinsic::ppc_altivec_vrlw, RHS, Neg16, DAG);

    // Shrinkify inputs to v8i16.
    LHS = DAG.getNode(ISD::BIT_CONVERT, MVT::v8i16, LHS);
    RHS = DAG.getNode(ISD::BIT_CONVERT, MVT::v8i16, RHS);
    RHSSwap = DAG.getNode(ISD::BIT_CONVERT, MVT::v8i16, RHSSwap);

    // Low parts multiplied together, generating 32-bit results (we ignore the
    // top parts).
    SDOperand LoProd = BuildIntrinsicOp(Intrinsic::ppc_altivec_vmulouh,
                                        LHS, RHS, DAG, MVT::v4i32);

    SDOperand HiProd = BuildIntrinsicOp(Intrinsic::ppc_altivec_vmsumuhm,
                                        LHS, RHSSwap, Zero, DAG, MVT::v4i32);
    // Shift the high parts up 16 bits.
    HiProd = BuildIntrinsicOp(Intrinsic::ppc_altivec_vslw, HiProd, Neg16, DAG);
    return DAG.getNode(ISD::ADD, MVT::v4i32, LoProd, HiProd);
  } else if (Op.getValueType() == MVT::v8i16) {
    SDOperand LHS = Op.getOperand(0), RHS = Op.getOperand(1);

    SDOperand Zero = BuildSplatI(0, 1, MVT::v8i16, DAG);

    return BuildIntrinsicOp(Intrinsic::ppc_altivec_vmladduhm,
                            LHS, RHS, Zero, DAG);
  } else if (Op.getValueType() == MVT::v16i8) {
    SDOperand LHS = Op.getOperand(0), RHS = Op.getOperand(1);

    // Multiply the even 8-bit parts, producing 16-bit products.
    SDOperand EvenParts = BuildIntrinsicOp(Intrinsic::ppc_altivec_vmuleub,
                                           LHS, RHS, DAG, MVT::v8i16);
    EvenParts = DAG.getNode(ISD::BIT_CONVERT, MVT::v16i8, EvenParts);

    // Multiply the odd 8-bit parts, producing 16-bit products.
    SDOperand OddParts = BuildIntrinsicOp(Intrinsic::ppc_altivec_vmuloub,
                                          LHS, RHS, DAG, MVT::v8i16);
    OddParts = DAG.getNode(ISD::BIT_CONVERT, MVT::v16i8, OddParts);

    // Merge the results together.
    SDOperand Ops[16];
    for (unsigned i = 0; i != 8; ++i) {
      Ops[i*2  ] = DAG.getConstant(2*i+1, MVT::i8);
      Ops[i*2+1] = DAG.getConstant(2*i+1+16, MVT::i8);
    }
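    // Illustrative note (not from the original source): in big-endian lane
    // order, byte 2*i+1 is the low byte of the i-th 16-bit product in
    // EvenParts, and byte 2*i+1+16 addresses the matching byte of OddParts
    // (the second shuffle input).  Interleaving them reassembles the 16
    // truncated lane products in order.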
    return DAG.getNode(ISD::VECTOR_SHUFFLE, MVT::v16i8, EvenParts, OddParts,
                       DAG.getNode(ISD::BUILD_VECTOR, MVT::v16i8, Ops, 16));
  } else {
    assert(0 && "Unknown mul to lower!");
    abort();
  }
}

/// LowerOperation - Provide custom lowering hooks for some operations.
///
SDOperand PPCTargetLowering::LowerOperation(SDOperand Op, SelectionDAG &DAG) {
  switch (Op.getOpcode()) {
  default: assert(0 && "Wasn't expecting to be able to lower this!");
  case ISD::ConstantPool:       return LowerConstantPool(Op, DAG);
  case ISD::GlobalAddress:      return LowerGlobalAddress(Op, DAG);
  case ISD::GlobalTLSAddress:   return LowerGlobalTLSAddress(Op, DAG);
  case ISD::JumpTable:          return LowerJumpTable(Op, DAG);
  case ISD::SETCC:              return LowerSETCC(Op, DAG);
  case ISD::VASTART:
    return LowerVASTART(Op, DAG, VarArgsFrameIndex, VarArgsStackOffset,
                        VarArgsNumGPR, VarArgsNumFPR, PPCSubTarget);

  case ISD::VAARG:
    return LowerVAARG(Op, DAG, VarArgsFrameIndex, VarArgsStackOffset,
                      VarArgsNumGPR, VarArgsNumFPR, PPCSubTarget);

  case ISD::FORMAL_ARGUMENTS:
    return LowerFORMAL_ARGUMENTS(Op, DAG, VarArgsFrameIndex,
                                 VarArgsStackOffset, VarArgsNumGPR,
                                 VarArgsNumFPR, PPCSubTarget);

  case ISD::CALL:               return LowerCALL(Op, DAG, PPCSubTarget,
                                                 getTargetMachine());
  case ISD::RET:                return LowerRET(Op, DAG, getTargetMachine());
  case ISD::STACKRESTORE:       return LowerSTACKRESTORE(Op, DAG, PPCSubTarget);
  case ISD::DYNAMIC_STACKALLOC:
    return LowerDYNAMIC_STACKALLOC(Op, DAG, PPCSubTarget);

  case ISD::ATOMIC_LAS:         return LowerAtomicLAS(Op, DAG);
  case ISD::ATOMIC_LCS:         return LowerAtomicLCS(Op, DAG);
  case ISD::ATOMIC_SWAP:        return LowerAtomicSWAP(Op, DAG);

  case ISD::SELECT_CC:          return LowerSELECT_CC(Op, DAG);
  case ISD::FP_TO_SINT:         return LowerFP_TO_SINT(Op, DAG);
  case ISD::SINT_TO_FP:         return LowerSINT_TO_FP(Op, DAG);
  case ISD::FP_ROUND_INREG:     return LowerFP_ROUND_INREG(Op, DAG);
  case ISD::FLT_ROUNDS_:        return LowerFLT_ROUNDS_(Op, DAG);

  // Lower 64-bit shifts.
  case ISD::SHL_PARTS:          return LowerSHL_PARTS(Op, DAG);
  case ISD::SRL_PARTS:          return LowerSRL_PARTS(Op, DAG);
  case ISD::SRA_PARTS:          return LowerSRA_PARTS(Op, DAG);

  // Vector-related lowering.
  case ISD::BUILD_VECTOR:       return LowerBUILD_VECTOR(Op, DAG);
  case ISD::VECTOR_SHUFFLE:     return LowerVECTOR_SHUFFLE(Op, DAG);
  case ISD::INTRINSIC_WO_CHAIN: return LowerINTRINSIC_WO_CHAIN(Op, DAG);
  case ISD::SCALAR_TO_VECTOR:   return LowerSCALAR_TO_VECTOR(Op, DAG);
  case ISD::MUL:                return LowerMUL(Op, DAG);

  // Frame & Return address.
  case ISD::RETURNADDR:         return LowerRETURNADDR(Op, DAG);
  case ISD::FRAMEADDR:          return LowerFRAMEADDR(Op, DAG);
  }
  return SDOperand();
}

SDNode *PPCTargetLowering::ExpandOperationResult(SDNode *N, SelectionDAG &DAG) {
  switch (N->getOpcode()) {
  default: assert(0 && "Wasn't expecting to be able to lower this!");
  case ISD::FP_TO_SINT: return LowerFP_TO_SINT(SDOperand(N, 0), DAG).Val;
  }
}


//===----------------------------------------------------------------------===//
//  Other Lowering Code
//===----------------------------------------------------------------------===//

MachineBasicBlock *
PPCTargetLowering::EmitInstrWithCustomInserter(MachineInstr *MI,
                                               MachineBasicBlock *BB) {
  const TargetInstrInfo *TII = getTargetMachine().getInstrInfo();
  assert((MI->getOpcode() == PPC::SELECT_CC_I4 ||
          MI->getOpcode() == PPC::SELECT_CC_I8 ||
          MI->getOpcode() == PPC::SELECT_CC_F4 ||
          MI->getOpcode() == PPC::SELECT_CC_F8 ||
          MI->getOpcode() == PPC::SELECT_CC_VRRC) &&
         "Unexpected instr type to insert");

  // To "insert" a SELECT_CC instruction, we actually have to insert the
  // diamond control-flow pattern.  The incoming instruction knows the
  // destination vreg to set, the condition code register to branch on, the
  // true/false values to select between, and a branch opcode to use.
  const BasicBlock *LLVM_BB = BB->getBasicBlock();
  ilist<MachineBasicBlock>::iterator It = BB;
  ++It;

  //  thisMBB:
  //  ...
  //   TrueVal = ...
  //   cmpTY ccX, r1, r2
  //   bCC sinkMBB
  //   fallthrough --> copy0MBB
  MachineBasicBlock *thisMBB = BB;
  MachineBasicBlock *copy0MBB = new MachineBasicBlock(LLVM_BB);
  MachineBasicBlock *sinkMBB = new MachineBasicBlock(LLVM_BB);
  unsigned SelectPred = MI->getOperand(4).getImm();
  BuildMI(BB, TII->get(PPC::BCC))
    .addImm(SelectPred).addReg(MI->getOperand(1).getReg()).addMBB(sinkMBB);
  MachineFunction *F = BB->getParent();
  F->getBasicBlockList().insert(It, copy0MBB);
  F->getBasicBlockList().insert(It, sinkMBB);
  // Update machine-CFG edges by first adding all successors of the current
  // block to the new block which will contain the Phi node for the select.
  for (MachineBasicBlock::succ_iterator i = BB->succ_begin(),
       e = BB->succ_end(); i != e; ++i)
    sinkMBB->addSuccessor(*i);
  // Next, remove all successors of the current block, and add the true
  // and fallthrough blocks as its successors.
  while (!BB->succ_empty())
    BB->removeSuccessor(BB->succ_begin());
  BB->addSuccessor(copy0MBB);
  BB->addSuccessor(sinkMBB);

  //  copy0MBB:
  //   %FalseValue = ...
  //   # fallthrough to sinkMBB
  BB = copy0MBB;

  // Update machine-CFG edges.
  BB->addSuccessor(sinkMBB);

  //  sinkMBB:
  //   %Result = phi [ %FalseValue, copy0MBB ], [ %TrueValue, thisMBB ]
  //  ...
  BB = sinkMBB;
  BuildMI(BB, TII->get(PPC::PHI), MI->getOperand(0).getReg())
    .addReg(MI->getOperand(3).getReg()).addMBB(copy0MBB)
    .addReg(MI->getOperand(2).getReg()).addMBB(thisMBB);

  delete MI;   // The pseudo instruction is gone now.
  return BB;
}

//===----------------------------------------------------------------------===//
// Target Optimization Hooks
//===----------------------------------------------------------------------===//

SDOperand PPCTargetLowering::PerformDAGCombine(SDNode *N,
                                               DAGCombinerInfo &DCI) const {
  TargetMachine &TM = getTargetMachine();
  SelectionDAG &DAG = DCI.DAG;
  switch (N->getOpcode()) {
  default: break;
  case PPCISD::SHL:
    if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(N->getOperand(0))) {
      if (C->getValue() == 0)   // 0 << V -> 0.
        return N->getOperand(0);
    }
    break;
  case PPCISD::SRL:
    if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(N->getOperand(0))) {
      if (C->getValue() == 0)   // 0 >>u V -> 0.
        return N->getOperand(0);
    }
    break;
  case PPCISD::SRA:
    if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(N->getOperand(0))) {
      if (C->getValue() == 0 ||   //  0 >>s V -> 0.
          C->isAllOnesValue())    // -1 >>s V -> -1.
        return N->getOperand(0);
    }
    break;

  case ISD::SINT_TO_FP:
    if (TM.getSubtarget<PPCSubtarget>().has64BitSupport()) {
      if (N->getOperand(0).getOpcode() == ISD::FP_TO_SINT) {
        // Turn (sint_to_fp (fp_to_sint X)) -> fctidz/fcfid without load/stores.
        // We allow the src/dst to be either f32/f64, but the intermediate
        // type must be i64.
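        // (Illustrative, not from the original source: for
        //   double d = (double)(long long)x;   // x is a double
        // this emits fctidz followed by fcfid, keeping the i64 value in an
        // FP register instead of storing it to memory and reloading it.)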
        if (N->getOperand(0).getValueType() == MVT::i64 &&
            N->getOperand(0).getOperand(0).getValueType() != MVT::ppcf128) {
          SDOperand Val = N->getOperand(0).getOperand(0);
          if (Val.getValueType() == MVT::f32) {
            Val = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Val);
            DCI.AddToWorklist(Val.Val);
          }

          Val = DAG.getNode(PPCISD::FCTIDZ, MVT::f64, Val);
          DCI.AddToWorklist(Val.Val);
          Val = DAG.getNode(PPCISD::FCFID, MVT::f64, Val);
          DCI.AddToWorklist(Val.Val);
          if (N->getValueType(0) == MVT::f32) {
            Val = DAG.getNode(ISD::FP_ROUND, MVT::f32, Val,
                              DAG.getIntPtrConstant(0));
            DCI.AddToWorklist(Val.Val);
          }
          return Val;
        } else if (N->getOperand(0).getValueType() == MVT::i32) {
          // If the intermediate type is i32, we can avoid the load/store here
          // too.
        }
      }
    }
    break;
  case ISD::STORE:
    // Turn STORE (FP_TO_SINT F) -> STFIWX(FCTIWZ(F)).
Chris Lattnerdf7a4ae2008-01-18 16:54:56 +00004112 !cast<StoreSDNode>(N)->isTruncatingStore() &&
Dan Gohmanf17a25c2007-07-18 16:29:46 +00004113 N->getOperand(1).getOpcode() == ISD::FP_TO_SINT &&
Dale Johannesencbc03512007-10-23 23:20:14 +00004114 N->getOperand(1).getValueType() == MVT::i32 &&
4115 N->getOperand(1).getOperand(0).getValueType() != MVT::ppcf128) {
Dan Gohmanf17a25c2007-07-18 16:29:46 +00004116 SDOperand Val = N->getOperand(1).getOperand(0);
4117 if (Val.getValueType() == MVT::f32) {
4118 Val = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Val);
4119 DCI.AddToWorklist(Val.Val);
4120 }
4121 Val = DAG.getNode(PPCISD::FCTIWZ, MVT::f64, Val);
4122 DCI.AddToWorklist(Val.Val);
4123
4124 Val = DAG.getNode(PPCISD::STFIWX, MVT::Other, N->getOperand(0), Val,
4125 N->getOperand(2), N->getOperand(3));
4126 DCI.AddToWorklist(Val.Val);
4127 return Val;
4128 }
4129
4130 // Turn STORE (BSWAP) -> sthbrx/stwbrx.
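    // (Illustrative, not from the original source: a byte-swapped store such
    // as  *p = bswap32(x);  folds into a single stwbrx.)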
    if (N->getOperand(1).getOpcode() == ISD::BSWAP &&
        N->getOperand(1).Val->hasOneUse() &&
        (N->getOperand(1).getValueType() == MVT::i32 ||
         N->getOperand(1).getValueType() == MVT::i16)) {
      SDOperand BSwapOp = N->getOperand(1).getOperand(0);
      // Do an any-extend to 32-bits if this is a half-word input.
      if (BSwapOp.getValueType() == MVT::i16)
        BSwapOp = DAG.getNode(ISD::ANY_EXTEND, MVT::i32, BSwapOp);

      return DAG.getNode(PPCISD::STBRX, MVT::Other, N->getOperand(0), BSwapOp,
                         N->getOperand(2), N->getOperand(3),
                         DAG.getValueType(N->getOperand(1).getValueType()));
    }
    break;
  case ISD::BSWAP:
    // Turn BSWAP (LOAD) -> lhbrx/lwbrx.
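    // (Illustrative, not from the original source: for  x = bswap32(*p);
    // the load and the swap fuse into a single lwbrx.)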
    if (ISD::isNON_EXTLoad(N->getOperand(0).Val) &&
        N->getOperand(0).hasOneUse() &&
        (N->getValueType(0) == MVT::i32 || N->getValueType(0) == MVT::i16)) {
      SDOperand Load = N->getOperand(0);
      LoadSDNode *LD = cast<LoadSDNode>(Load);
      // Create the byte-swapping load.
      std::vector<MVT::ValueType> VTs;
      VTs.push_back(MVT::i32);
      VTs.push_back(MVT::Other);
      SDOperand MO = DAG.getMemOperand(LD->getMemOperand());
      SDOperand Ops[] = {
        LD->getChain(),     // Chain
        LD->getBasePtr(),   // Ptr
        MO,                 // MemOperand
        DAG.getValueType(N->getValueType(0))   // VT
      };
      SDOperand BSLoad = DAG.getNode(PPCISD::LBRX, VTs, Ops, 4);

      // If this is an i16 load, insert the truncate.
      SDOperand ResVal = BSLoad;
      if (N->getValueType(0) == MVT::i16)
        ResVal = DAG.getNode(ISD::TRUNCATE, MVT::i16, BSLoad);

      // First, combine the bswap away.  This makes the value produced by the
      // load dead.
      DCI.CombineTo(N, ResVal);

      // Next, combine the load away; we give it a bogus result value but a
      // real chain result.  The result value is dead because the bswap is
      // dead.
      DCI.CombineTo(Load.Val, ResVal, BSLoad.getValue(1));

      // Return N so it doesn't get rechecked!
      return SDOperand(N, 0);
    }

    break;
  case PPCISD::VCMP: {
    // If a VCMPo node already exists with exactly the same operands as this
    // node, use its result instead of this node (VCMPo computes both a CR6 and
    // a normal output).
    //
    if (!N->getOperand(0).hasOneUse() &&
        !N->getOperand(1).hasOneUse() &&
        !N->getOperand(2).hasOneUse()) {

      // Scan all of the users of the LHS, looking for VCMPo's that match.
      SDNode *VCMPoNode = 0;

      SDNode *LHSN = N->getOperand(0).Val;
      for (SDNode::use_iterator UI = LHSN->use_begin(), E = LHSN->use_end();
           UI != E; ++UI)
        if ((*UI).getUser()->getOpcode() == PPCISD::VCMPo &&
            (*UI).getUser()->getOperand(1) == N->getOperand(1) &&
            (*UI).getUser()->getOperand(2) == N->getOperand(2) &&
            (*UI).getUser()->getOperand(0) == N->getOperand(0)) {
          VCMPoNode = UI->getUser();
          break;
        }

      // If there is no VCMPo node, or if the flag value has a single use,
      // don't transform this.
      if (!VCMPoNode || VCMPoNode->hasNUsesOfValue(0, 1))
        break;

      // Look at the (necessarily single) use of the flag value.  If it has a
      // chain, this transformation is more complex.  Note that multiple things
      // could use the value result, which we should ignore.
      SDNode *FlagUser = 0;
      for (SDNode::use_iterator UI = VCMPoNode->use_begin();
           FlagUser == 0; ++UI) {
        assert(UI != VCMPoNode->use_end() && "Didn't find user!");
        SDNode *User = UI->getUser();
        for (unsigned i = 0, e = User->getNumOperands(); i != e; ++i) {
          if (User->getOperand(i) == SDOperand(VCMPoNode, 1)) {
            FlagUser = User;
            break;
          }
        }
      }

      // If the user is an MFCR instruction, we know this is safe.  Otherwise
      // we give up for right now.
      if (FlagUser->getOpcode() == PPCISD::MFCR)
        return SDOperand(VCMPoNode, 0);
    }
    break;
  }
  case ISD::BR_CC: {
    // If this is a branch on an altivec predicate comparison, lower this so
    // that we don't have to do an MFCR: instead, branch directly on CR6.  This
    // lowering is done pre-legalize, because the legalizer lowers the predicate
    // compare down to code that is difficult to reassemble.
    ISD::CondCode CC = cast<CondCodeSDNode>(N->getOperand(1))->get();
    SDOperand LHS = N->getOperand(2), RHS = N->getOperand(3);
    int CompareOpc;
    bool isDot;

    if (LHS.getOpcode() == ISD::INTRINSIC_WO_CHAIN &&
        isa<ConstantSDNode>(RHS) && (CC == ISD::SETEQ || CC == ISD::SETNE) &&
        getAltivecCompareInfo(LHS, CompareOpc, isDot)) {
      assert(isDot && "Can't compare against a vector result!");

      // If this is a comparison against something other than 0/1, then we know
      // that the condition is never/always true.
      unsigned Val = cast<ConstantSDNode>(RHS)->getValue();
      if (Val != 0 && Val != 1) {
        if (CC == ISD::SETEQ)   // Cond never true, remove branch.
          return N->getOperand(0);
        // Always !=, turn it into an unconditional branch.
        return DAG.getNode(ISD::BR, MVT::Other,
                           N->getOperand(0), N->getOperand(4));
      }
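      // (Illustrative, not from the original source: the _p intrinsics only
      // ever produce 0 or 1, so "pred == 2" can never be true and the branch
      // is deleted, while "pred != 2" is always true and becomes an
      // unconditional branch.)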

      bool BranchOnWhenPredTrue = (CC == ISD::SETEQ) ^ (Val == 0);
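      // (Illustrative arithmetic, not from the original source: for
      // "pred == 1" this is true ^ false, i.e. branch when the predicate is
      // true; for "pred == 0" it is true ^ true, i.e. branch when it is
      // false.)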

      // Create the PPCISD altivec 'dot' comparison node.
      std::vector<MVT::ValueType> VTs;
      SDOperand Ops[] = {
        LHS.getOperand(2),   // LHS of compare
        LHS.getOperand(3),   // RHS of compare
        DAG.getConstant(CompareOpc, MVT::i32)
      };
      VTs.push_back(LHS.getOperand(2).getValueType());
      VTs.push_back(MVT::Flag);
      SDOperand CompNode = DAG.getNode(PPCISD::VCMPo, VTs, Ops, 3);

      // Unpack the result based on how the target uses it.
      PPC::Predicate CompOpc;
      switch (cast<ConstantSDNode>(LHS.getOperand(1))->getValue()) {
      default:  // Can't happen, don't crash on invalid number though.
      case 0:   // Branch on the value of the EQ bit of CR6.
        CompOpc = BranchOnWhenPredTrue ? PPC::PRED_EQ : PPC::PRED_NE;
        break;
      case 1:   // Branch on the inverted value of the EQ bit of CR6.
        CompOpc = BranchOnWhenPredTrue ? PPC::PRED_NE : PPC::PRED_EQ;
        break;
      case 2:   // Branch on the value of the LT bit of CR6.
        CompOpc = BranchOnWhenPredTrue ? PPC::PRED_LT : PPC::PRED_GE;
        break;
      case 3:   // Branch on the inverted value of the LT bit of CR6.
        CompOpc = BranchOnWhenPredTrue ? PPC::PRED_GE : PPC::PRED_LT;
        break;
      }

      return DAG.getNode(PPCISD::COND_BRANCH, MVT::Other, N->getOperand(0),
                         DAG.getConstant(CompOpc, MVT::i32),
                         DAG.getRegister(PPC::CR6, MVT::i32),
                         N->getOperand(4), CompNode.getValue(1));
    }
    break;
  }
  }

  return SDOperand();
}

//===----------------------------------------------------------------------===//
// Inline Assembly Support
//===----------------------------------------------------------------------===//

void PPCTargetLowering::computeMaskedBitsForTargetNode(const SDOperand Op,
                                                       const APInt &Mask,
                                                       APInt &KnownZero,
                                                       APInt &KnownOne,
                                                       const SelectionDAG &DAG,
                                                       unsigned Depth) const {
  KnownZero = KnownOne = APInt(Mask.getBitWidth(), 0);
  switch (Op.getOpcode()) {
  default: break;
  case PPCISD::LBRX: {
    // lhbrx is known to have the top bits cleared out.
    if (cast<VTSDNode>(Op.getOperand(3))->getVT() == MVT::i16)
      KnownZero = 0xFFFF0000;
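    // (Illustrative, not from the original source: advertising the cleared
    // top half lets the combiner treat a zero-extension of the i16 lhbrx
    // result as free.)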
    break;
  }
  case ISD::INTRINSIC_WO_CHAIN: {
    switch (cast<ConstantSDNode>(Op.getOperand(0))->getValue()) {
    default: break;
    case Intrinsic::ppc_altivec_vcmpbfp_p:
    case Intrinsic::ppc_altivec_vcmpeqfp_p:
    case Intrinsic::ppc_altivec_vcmpequb_p:
    case Intrinsic::ppc_altivec_vcmpequh_p:
    case Intrinsic::ppc_altivec_vcmpequw_p:
    case Intrinsic::ppc_altivec_vcmpgefp_p:
    case Intrinsic::ppc_altivec_vcmpgtfp_p:
    case Intrinsic::ppc_altivec_vcmpgtsb_p:
    case Intrinsic::ppc_altivec_vcmpgtsh_p:
    case Intrinsic::ppc_altivec_vcmpgtsw_p:
    case Intrinsic::ppc_altivec_vcmpgtub_p:
    case Intrinsic::ppc_altivec_vcmpgtuh_p:
    case Intrinsic::ppc_altivec_vcmpgtuw_p:
      KnownZero = ~1U;   // All bits but the low one are known to be zero.
      break;
    }
  }
  }
}


/// getConstraintType - Given a constraint, return the type of
/// constraint it is for this target.
PPCTargetLowering::ConstraintType
PPCTargetLowering::getConstraintType(const std::string &Constraint) const {
  if (Constraint.size() == 1) {
    switch (Constraint[0]) {
    default: break;
    case 'b':
    case 'r':
    case 'f':
    case 'v':
    case 'y':
      return C_RegisterClass;
    }
  }
  return TargetLowering::getConstraintType(Constraint);
}

std::pair<unsigned, const TargetRegisterClass*>
PPCTargetLowering::getRegForInlineAsmConstraint(const std::string &Constraint,
                                                MVT::ValueType VT) const {
  if (Constraint.size() == 1) {
    // GCC RS6000 Constraint Letters
    switch (Constraint[0]) {
    case 'b':   // R1-R31
    case 'r':   // R0-R31
      if (VT == MVT::i64 && PPCSubTarget.isPPC64())
        return std::make_pair(0U, PPC::G8RCRegisterClass);
      return std::make_pair(0U, PPC::GPRCRegisterClass);
    case 'f':
      if (VT == MVT::f32)
        return std::make_pair(0U, PPC::F4RCRegisterClass);
      else if (VT == MVT::f64)
        return std::make_pair(0U, PPC::F8RCRegisterClass);
      break;
    case 'v':
      return std::make_pair(0U, PPC::VRRCRegisterClass);
    case 'y':   // crrc
      return std::make_pair(0U, PPC::CRRCRegisterClass);
    }
  }

  return TargetLowering::getRegForInlineAsmConstraint(Constraint, VT);
}


/// LowerAsmOperandForConstraint - Lower the specified operand into the Ops
/// vector.  If it is invalid, don't add anything to Ops.
void PPCTargetLowering::LowerAsmOperandForConstraint(SDOperand Op, char Letter,
                                                     std::vector<SDOperand> &Ops,
                                                     SelectionDAG &DAG) const {
  SDOperand Result(0,0);
  switch (Letter) {
  default: break;
  case 'I':
  case 'J':
  case 'K':
  case 'L':
  case 'M':
  case 'N':
  case 'O':
  case 'P': {
    ConstantSDNode *CST = dyn_cast<ConstantSDNode>(Op);
    if (!CST) return;   // Must be an immediate to match.
    unsigned Value = CST->getValue();
    switch (Letter) {
    default: assert(0 && "Unknown constraint letter!");
    case 'I':   // "I" is a signed 16-bit constant.
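      // (Illustrative, not from the original source: 42 passes the
      // (short)Value == (int)Value test and becomes a target constant;
      // 0x12345 fails it, Result stays null, and the operand falls through
      // to the generic handler at the bottom of the function.)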
      if ((short)Value == (int)Value)
        Result = DAG.getTargetConstant(Value, Op.getValueType());
      break;
    case 'J':   // "J" is a constant with only the high-order 16 bits nonzero.
    case 'L':   // "L" is a signed 16-bit constant shifted left 16 bits.
      if ((short)Value == 0)
        Result = DAG.getTargetConstant(Value, Op.getValueType());
      break;
    case 'K':   // "K" is a constant with only the low-order 16 bits nonzero.
      if ((Value >> 16) == 0)
        Result = DAG.getTargetConstant(Value, Op.getValueType());
      break;
    case 'M':   // "M" is a constant that is greater than 31.
      if (Value > 31)
        Result = DAG.getTargetConstant(Value, Op.getValueType());
      break;
    case 'N':   // "N" is a positive constant that is an exact power of two.
      if ((int)Value > 0 && isPowerOf2_32(Value))
        Result = DAG.getTargetConstant(Value, Op.getValueType());
      break;
    case 'O':   // "O" is the constant zero.
      if (Value == 0)
        Result = DAG.getTargetConstant(Value, Op.getValueType());
      break;
    case 'P':   // "P" is a constant whose negation is a signed 16-bit constant.
      if ((short)-Value == (int)-Value)
        Result = DAG.getTargetConstant(Value, Op.getValueType());
      break;
    }
    break;
  }
  }

  if (Result.Val) {
    Ops.push_back(Result);
    return;
  }

  // Handle standard constraint letters.
  TargetLowering::LowerAsmOperandForConstraint(Op, Letter, Ops, DAG);
}

// isLegalAddressingMode - Return true if the addressing mode represented
// by AM is legal for this target, for a load/store of the specified type.
bool PPCTargetLowering::isLegalAddressingMode(const AddrMode &AM,
                                              const Type *Ty) const {
  // FIXME: PPC does not allow r+i addressing modes for vectors!

  // PPC allows a sign-extended 16-bit immediate field.
  if (AM.BaseOffs <= -(1LL << 16) || AM.BaseOffs >= (1LL << 16)-1)
    return false;

  // No global is ever allowed as a base.
  if (AM.BaseGV)
    return false;

  // PPC only supports r+r:
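  // (Illustrative, not from the original source: an address like reg + 32000
  // is accepted as r+i, while base + 4*index is rejected because only scales
  // 0, 1, and 2 are considered, and 2 only as 2*r folded into r+r.)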
  switch (AM.Scale) {
  case 0:   // "r+i" or just "i", depending on HasBaseReg.
    break;
  case 1:
    if (AM.HasBaseReg && AM.BaseOffs)   // "r+r+i" is not allowed.
      return false;
    // Otherwise we have r+r or r+i.
    break;
  case 2:
    if (AM.HasBaseReg || AM.BaseOffs)   // 2*r+r or 2*r+i is not allowed.
      return false;
    // Allow 2*r as r+r.
    break;
  default:
    // No other scales are supported.
    return false;
  }

  return true;
}

/// isLegalAddressImmediate - Return true if the integer value can be used
/// as the offset of the target addressing mode for load / store of the
/// given type.
bool PPCTargetLowering::isLegalAddressImmediate(int64_t V, const Type *Ty) const {
  // PPC allows a sign-extended 16-bit immediate field.
  return (V > -(1 << 16) && V < (1 << 16)-1);
}

bool PPCTargetLowering::isLegalAddressImmediate(llvm::GlobalValue* GV) const {
  return false;
}

SDOperand PPCTargetLowering::LowerRETURNADDR(SDOperand Op, SelectionDAG &DAG) {
  // Depths > 0 not supported yet!
  if (cast<ConstantSDNode>(Op.getOperand(0))->getValue() > 0)
    return SDOperand();

  MachineFunction &MF = DAG.getMachineFunction();
  PPCFunctionInfo *FuncInfo = MF.getInfo<PPCFunctionInfo>();

  // Just load the return address off the stack.
  SDOperand RetAddrFI = getReturnAddrFrameIndex(DAG);

  // Make sure the function really does not optimize away the store of the RA
  // to the stack.
  FuncInfo->setLRStoreRequired();
  return DAG.getLoad(getPointerTy(), DAG.getEntryNode(), RetAddrFI, NULL, 0);
}

SDOperand PPCTargetLowering::LowerFRAMEADDR(SDOperand Op, SelectionDAG &DAG) {
  // Depths > 0 not supported yet!
  if (cast<ConstantSDNode>(Op.getOperand(0))->getValue() > 0)
    return SDOperand();

  MVT::ValueType PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
  bool isPPC64 = PtrVT == MVT::i64;

  MachineFunction &MF = DAG.getMachineFunction();
  MachineFrameInfo *MFI = MF.getFrameInfo();
  bool is31 = (NoFramePointerElim || MFI->hasVarSizedObjects())
              && MFI->getStackSize();

  if (isPPC64)
    return DAG.getCopyFromReg(DAG.getEntryNode(), is31 ? PPC::X31 : PPC::X1,
                              MVT::i64);
  else
    return DAG.getCopyFromReg(DAG.getEntryNode(), is31 ? PPC::R31 : PPC::R1,
                              MVT::i32);
}