Blame - llvm/lib/Target/PowerPC/PPCISelDAGToDAG.cpp - toolchain/llvm-project

2005-08-17 19:33:03 +0000

[diff] [blame]

2

//

3

// The LLVM Compiler Infrastructure

4

//

Chris Lattner

f3ebc3f

2007-12-29 20:36:04 +0000

[diff] [blame]

5

// This file is distributed under the University of Illinois Open Source

6

// License. See LICENSE.TXT for details.

Chris Lattner

2005-08-17 19:33:03 +0000

[diff] [blame]

7

//

8

//===----------------------------------------------------------------------===//

9

//

Nate Begeman

6cca84e

2005-10-16 05:39:50 +0000

[diff] [blame]

10

// This file defines a pattern matching instruction selector for PowerPC,

Chris Lattner

2005-08-17 19:33:03 +0000

[diff] [blame]

11

// converting from a legalized dag to a PPC dag.

12

//

13

//===----------------------------------------------------------------------===//

14

Chris Lattner

bfca1ab

2005-10-14 23:51:18 +0000

[diff] [blame]

15

#include "PPC.h"

Evan Cheng

1142444

2011-07-26 00:24:13 +0000

[diff] [blame]

16

#include "MCTargetDesc/PPCPredicates.h"

Hal Finkel

2014-07-18 23:29:49 +0000

[diff] [blame]

17

#include "PPCMachineFunctionInfo.h"

Chandler Carruth

2012-12-03 16:50:05 +0000

[diff] [blame]

18

#include "PPCTargetMachine.h"

Chris Lattner

2005-08-19 22:38:53 +0000

[diff] [blame]

19

#include "llvm/CodeGen/MachineFunction.h"

Chandler Carruth

2012-12-03 16:50:05 +0000

[diff] [blame]

20

#include "llvm/CodeGen/MachineInstrBuilder.h"

Chris Lattner

a10fff5

2007-12-31 04:13:23 +0000

[diff] [blame]

21

#include "llvm/CodeGen/MachineRegisterInfo.h"

Chris Lattner

2005-08-17 19:33:03 +0000

[diff] [blame]

22

#include "llvm/CodeGen/SelectionDAG.h"

23

#include "llvm/CodeGen/SelectionDAGISel.h"

Chandler Carruth

9fb823b

2013-01-02 11:36:10 +0000

[diff] [blame]

24

#include "llvm/IR/Constants.h"

25

#include "llvm/IR/Function.h"

Chandler Carruth

1fe21fc

2013-01-19 08:03:47 +0000

[diff] [blame]

26

#include "llvm/IR/GlobalAlias.h"

Chandler Carruth

9fb823b

2013-01-02 11:36:10 +0000

[diff] [blame]

27

#include "llvm/IR/GlobalValue.h"

28

#include "llvm/IR/GlobalVariable.h"

29

#include "llvm/IR/Intrinsics.h"

Justin Hibbits

2014-11-12 15:16:30 +0000

[diff] [blame]

30

#include "llvm/IR/Module.h"

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

31

#include "llvm/Support/CommandLine.h"

Chris Lattner

2005-08-17 19:33:03 +0000

[diff] [blame]

32

#include "llvm/Support/Debug.h"

Torok Edwin

fb8d6d5

2009-07-08 20:53:28 +0000

[diff] [blame]

33

#include "llvm/Support/ErrorHandling.h"

Chandler Carruth

2012-12-03 16:50:05 +0000

[diff] [blame]

34

#include "llvm/Support/MathExtras.h"

Torok Edwin

fb8d6d5

2009-07-08 20:53:28 +0000

[diff] [blame]

35

#include "llvm/Support/raw_ostream.h"

Chandler Carruth

2012-12-03 16:50:05 +0000

[diff] [blame]

36

#include "llvm/Target/TargetOptions.h"

Chris Lattner

2005-08-17 19:33:03 +0000

[diff] [blame]

37

using namespace llvm;

38

Chandler Carruth

84e68b2

2014-04-22 02:41:26 +0000

[diff] [blame]

39

#define DEBUG_TYPE "ppc-codegen"

40

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

41

// FIXME: Remove this once the bug has been fixed!

42

cl::opt<bool> ANDIGlueBug("expose-ppc-andi-glue-bug",

43

cl::desc("expose the ANDI glue bug on PPC"), cl::Hidden);

44

Benjamin Kramer

970eac4

2015-02-06 17:51:54 +0000

[diff] [blame]

45

static cl::opt<bool>

46

UseBitPermRewriter("ppc-use-bit-perm-rewriter", cl::init(true),

47

cl::desc("use aggressive ppc isel for bit permutations"),

48

cl::Hidden);

49

static cl::opt<bool> BPermRewriterNoMasking(

50

"ppc-bit-perm-rewriter-stress-rotates",

51

cl::desc("stress rotate selection in aggressive ppc isel for "

52

"bit permutations"),

53

cl::Hidden);

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

54

Krzysztof Parzyszek

2013-02-13 17:40:07 +0000

[diff] [blame]

55

namespace llvm {

56

void initializePPCDAGToDAGISelPass(PassRegistry&);

57

}

58

Chris Lattner

2005-08-17 19:33:03 +0000

[diff] [blame]

59

namespace {

Chris Lattner

2005-08-17 19:33:03 +0000

[diff] [blame]

60

//===--------------------------------------------------------------------===//

Nate Begeman

0b71e00

2005-10-18 00:28:58 +0000

[diff] [blame]

61

/// PPCDAGToDAGISel - PPC specific code to select PPC machine

Chris Lattner

2005-08-17 19:33:03 +0000

[diff] [blame]

62

/// instructions for SelectionDAG operations.

63

///

Nick Lewycky

02d5f77

2009-10-25 06:33:48 +0000

[diff] [blame]

64

class PPCDAGToDAGISel : public SelectionDAGISel {

Dan Gohman

21cea8a

2010-04-17 15:26:15 +0000

[diff] [blame]

65

const PPCTargetMachine &TM;

Eric Christopher

2014-05-22 01:07:24 +0000

[diff] [blame]

66

const PPCSubtarget *PPCSubTarget;

Eric Christopher

2015-01-30 22:02:31 +0000

[diff] [blame]

67

const PPCTargetLowering *PPCLowering;

Chris Lattner

2005-08-19 22:38:53 +0000

[diff] [blame]

68

unsigned GlobalBaseReg;

Chris Lattner

2005-08-17 19:33:03 +0000

[diff] [blame]

69

public:

Dan Gohman

56e3f63

2008-07-07 18:00:37 +0000

[diff] [blame]

70

explicit PPCDAGToDAGISel(PPCTargetMachine &tm)

Eric Christopher

2015-01-30 22:02:31 +0000

[diff] [blame]

71

: SelectionDAGISel(tm), TM(tm) {

Krzysztof Parzyszek

2013-02-13 17:40:07 +0000

[diff] [blame]

72

initializePPCDAGToDAGISelPass(*PassRegistry::getPassRegistry());

73

}

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

74

Craig Topper

2014-04-29 07:57:37 +0000

[diff] [blame]

75

bool runOnMachineFunction(MachineFunction &MF) override {

Chris Lattner

2005-08-19 22:38:53 +0000

[diff] [blame]

76

// Make sure we re-emit a set of the global base reg if necessary

77

GlobalBaseReg = 0;

Eric Christopher

2015-01-30 22:02:31 +0000

[diff] [blame]

78

PPCSubTarget = &MF.getSubtarget<PPCSubtarget>();

79

PPCLowering = PPCSubTarget->getTargetLowering();

Dan Gohman

5ea74d5

2009-07-31 18:16:33 +0000

[diff] [blame]

80

SelectionDAGISel::runOnMachineFunction(MF);

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

81

Eric Christopher

2014-05-22 01:07:24 +0000

[diff] [blame]

82

if (!PPCSubTarget->isSVR4ABI())

Bill Schmidt

38d9458

2012-10-10 20:54:15 +0000

[diff] [blame]

83

InsertVRSaveCode(MF);

84

Chris Lattner

2006-03-16 18:25:23 +0000

[diff] [blame]

85

return true;

Chris Lattner

2005-08-19 22:38:53 +0000

[diff] [blame]

86

}

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

87

Hal Finkel

2015-01-03 01:16:37 +0000

[diff] [blame]

88

void PreprocessISelDAG() override;

Craig Topper

2014-04-29 07:57:37 +0000

[diff] [blame]

89

void PostprocessISelDAG() override;

Bill Schmidt

2013-02-21 00:38:25 +0000

[diff] [blame]

90

Chris Lattner

2005-08-17 19:33:03 +0000

[diff] [blame]

91

/// getI32Imm - Return a target constant with the specified value, of type

92

/// i32.

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

93

inline SDValue getI32Imm(unsigned Imm) {

Owen Anderson

2009-08-11 20:47:22 +0000

[diff] [blame]

94

return CurDAG->getTargetConstant(Imm, MVT::i32);

Chris Lattner

2005-08-17 19:33:03 +0000

[diff] [blame]

95

}

Chris Lattner

2005-08-19 22:38:53 +0000

[diff] [blame]

96

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

97

/// getI64Imm - Return a target constant with the specified value, of type

98

/// i64.

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

99

inline SDValue getI64Imm(uint64_t Imm) {

Owen Anderson

2009-08-11 20:47:22 +0000

[diff] [blame]

100

return CurDAG->getTargetConstant(Imm, MVT::i64);

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

101

}

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

102

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

103

/// getSmallIPtrImm - Return a target constant of pointer type.

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

104

inline SDValue getSmallIPtrImm(unsigned Imm) {

Eric Christopher

2014-05-22 01:07:24 +0000

[diff] [blame]

105

return CurDAG->getTargetConstant(Imm, PPCLowering->getPointerTy());

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

106

}

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

107

Sylvestre Ledru

91ce36c

2012-09-27 10:14:43 +0000

[diff] [blame]

108

/// isRunOfOnes - Returns true iff Val consists of one contiguous run of 1s

Nate Begeman

2006-09-22 05:01:56 +0000

[diff] [blame]

109

/// with any number of 0s on either side. The 1s are allowed to wrap from

110

/// LSB to MSB, so 0x000FFF0, 0x0000FFFF, and 0xFF0000FF are all runs.

111

/// 0x0F0F0000 is not, since all 1s are not contiguous.

112

static bool isRunOfOnes(unsigned Val, unsigned &MB, unsigned &ME);

113

114

115

/// isRotateAndMask - Returns true if Mask and Shift can be folded into a

116

/// rotate and mask opcode and mask operation.

Dale Johannesen

86dcae1

2009-11-24 01:09:07 +0000

[diff] [blame]

117

static bool isRotateAndMask(SDNode *N, unsigned Mask, bool isShiftMask,

Nate Begeman

2006-09-22 05:01:56 +0000

[diff] [blame]

118

unsigned &SH, unsigned &MB, unsigned &ME);

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

119

Chris Lattner

2005-08-19 22:38:53 +0000

[diff] [blame]

120

/// getGlobalBaseReg - insert code into the entry mbb to materialize the PIC

121

/// base register. Return the virtual register that holds this value.

Evan Cheng

61413a3

2006-08-26 05:34:46 +0000

[diff] [blame]

122

SDNode *getGlobalBaseReg();

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

123

Hal Finkel

2014-12-11 22:51:06 +0000

[diff] [blame]

124

SDNode *getFrameIndex(SDNode *SN, SDNode *N, unsigned Offset = 0);

125

Chris Lattner

2005-08-17 19:33:03 +0000

[diff] [blame]

126

// Select - Convert the specified operand from a target-independent to a

127

// target-specific node if it hasn't already been changed.

Craig Topper

2014-04-29 07:57:37 +0000

[diff] [blame]

128

SDNode *Select(SDNode *N) override;

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

129

Nate Begeman

2005-08-19 00:38:14 +0000

[diff] [blame]

130

SDNode *SelectBitfieldInsert(SDNode *N);

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

131

SDNode *SelectBitPermutation(SDNode *N);

Nate Begeman

2005-08-19 00:38:14 +0000

[diff] [blame]

132

Chris Lattner

2005-08-21 18:50:37 +0000

[diff] [blame]

133

/// SelectCC - Select a comparison of the specified values with the

134

/// specified condition code, returning the CR# of the expression.

Andrew Trick

2013-05-25 02:42:55 +0000

[diff] [blame]

135

SDValue SelectCC(SDValue LHS, SDValue RHS, ISD::CondCode CC, SDLoc dl);

Chris Lattner

2005-08-21 18:50:37 +0000

[diff] [blame]

136

Nate Begeman

8e6a8af

2005-12-19 23:25:09 +0000

[diff] [blame]

137

/// SelectAddrImm - Returns true if the address N can be represented by

138

/// a base register plus a signed 16-bit displacement [r+imm].

Chris Lattner

2010-09-21 20:31:19 +0000

[diff] [blame]

139

bool SelectAddrImm(SDValue N, SDValue &Disp,

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

140

SDValue &Base) {

Eric Christopher

2014-05-22 01:07:24 +0000

[diff] [blame]

141

return PPCLowering->SelectAddressRegImm(N, Disp, Base, *CurDAG, false);

Chris Lattner

2006-11-08 02:15:41 +0000

[diff] [blame]

142

}

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

143

Chris Lattner

6f5840c

2006-11-16 00:41:37 +0000

[diff] [blame]

144

/// SelectAddrImmOffs - Return true if the operand is valid for a preinc

Ulrich Weigand

d1b99d3

2013-03-22 14:58:17 +0000

[diff] [blame]

145

/// immediate field. Note that the operand at this point is already the

146

/// result of a prior SelectAddressRegImm call.

Chris Lattner

2010-09-21 20:31:19 +0000

[diff] [blame]

147

bool SelectAddrImmOffs(SDValue N, SDValue &Out) const {

Ulrich Weigand

d1b99d3

2013-03-22 14:58:17 +0000

[diff] [blame]

148

if (N.getOpcode() == ISD::TargetConstant ||

Hal Finkel

a86b0f2

2012-06-21 20:10:48 +0000

[diff] [blame]

149

N.getOpcode() == ISD::TargetGlobalAddress) {

Hal Finkel

1cc27e4

2012-06-19 02:34:32 +0000

[diff] [blame]

Out = N;

return true;

}

return false;

}

Nate Begeman

2005-12-19 23:25:09 +0000

[diff] [blame]

157

/// SelectAddrIdx - Given the specified addressed, check to see if it can be

158

/// represented as an indexed [r+r] operation. Returns false if it can

159

/// be represented by [r+imm], which are preferred.

Chris Lattner

2010-09-21 20:31:19 +0000

[diff] [blame]

160

bool SelectAddrIdx(SDValue N, SDValue &Base, SDValue &Index) {

Eric Christopher

2014-05-22 01:07:24 +0000

[diff] [blame]

161

return PPCLowering->SelectAddressRegReg(N, Base, Index, *CurDAG);

Chris Lattner

2006-11-08 02:15:41 +0000

[diff] [blame]

162

}

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

163

Nate Begeman

8e6a8af

2005-12-19 23:25:09 +0000

[diff] [blame]

164

/// SelectAddrIdxOnly - Given the specified addressed, force it to be

165

/// represented as an indexed [r+r] operation.

Chris Lattner

2010-09-21 20:31:19 +0000

[diff] [blame]

166

bool SelectAddrIdxOnly(SDValue N, SDValue &Base, SDValue &Index) {

Eric Christopher

2014-05-22 01:07:24 +0000

[diff] [blame]

167

return PPCLowering->SelectAddressRegRegOnly(N, Base, Index, *CurDAG);

Chris Lattner

2006-11-08 02:15:41 +0000

[diff] [blame]

168

}

Chris Lattner

c5292ec

2005-08-21 22:31:09 +0000

[diff] [blame]

169

Ulrich Weigand

9d980cb

2013-05-16 17:58:02 +0000

[diff] [blame]

170

/// SelectAddrImmX4 - Returns true if the address N can be represented by

171

/// a base register plus a signed 16-bit displacement that is a multiple of 4.

172

/// Suitable for use by STD and friends.

173

bool SelectAddrImmX4(SDValue N, SDValue &Disp, SDValue &Base) {

Eric Christopher

2014-05-22 01:07:24 +0000

[diff] [blame]

174

return PPCLowering->SelectAddressRegImm(N, Disp, Base, *CurDAG, true);

Chris Lattner

2006-11-08 02:15:41 +0000

[diff] [blame]

175

}

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

176

Hal Finkel

756810f

2013-03-21 21:37:52 +0000

[diff] [blame]

177

// Select an address into a single register.

178

bool SelectAddr(SDValue N, SDValue &Base) {

Base = N;

return true;

}

Chris Lattner

2006-02-24 02:13:12 +0000

[diff] [blame]

183

/// SelectInlineAsmMemoryOperand - Implement addressing mode selection for

Dale Johannesen

4a50e68

2009-08-18 00:18:39 +0000

[diff] [blame]

184

/// inline asm expressions. It is always correct to compute the value into

185

/// a register. The case of adding a (possibly relocatable) constant to a

186

/// register can be improved, but it is wrong to substitute Reg+Reg for

187

/// Reg in an asm, because the load or store opcode would have to change.

Hal Finkel

d433838

2014-12-03 23:40:13 +0000

[diff] [blame]

188

bool SelectInlineAsmMemoryOperand(const SDValue &Op,

Daniel Sanders

60f1db0

2015-03-13 12:45:09 +0000

[diff] [blame]

189

unsigned ConstraintID,

Craig Topper

2014-04-29 07:57:37 +0000

[diff] [blame]

190

std::vector<SDValue> &OutOps) override {

Hal Finkel

d433838

2014-12-03 23:40:13 +0000

[diff] [blame]

191

Daniel Sanders

0828860

2015-03-17 11:09:13 +0000

[diff] [blame]

192

switch(ConstraintID) {

193

default:

194

errs() << "ConstraintID: " << ConstraintID << "\n";

195

llvm_unreachable("Unexpected asm memory constraint");

196

case InlineAsm::Constraint_es:

Daniel Sanders

914b947

2015-03-17 12:00:04 +0000

[diff] [blame^]

197

case InlineAsm::Constraint_i:

Daniel Sanders

0828860

2015-03-17 11:09:13 +0000

[diff] [blame]

198

case InlineAsm::Constraint_m:

199

case InlineAsm::Constraint_o:

200

case InlineAsm::Constraint_Q:

201

case InlineAsm::Constraint_Z:

202

case InlineAsm::Constraint_Zy:

203

// We need to make sure that this one operand does not end up in r0

204

// (because we might end up lowering this as 0(%op)).

205

const TargetRegisterInfo *TRI = PPCSubTarget->getRegisterInfo();

206

const TargetRegisterClass *TRC = TRI->getPointerRegClass(*MF, /*Kind=*/1);

207

SDValue RC = CurDAG->getTargetConstant(TRC->getID(), MVT::i32);

208

SDValue NewOp =

209

SDValue(CurDAG->getMachineNode(TargetOpcode::COPY_TO_REGCLASS,

210

SDLoc(Op), Op.getValueType(),

211

Op, RC), 0);

212

213

OutOps.push_back(NewOp);

214

return false;

215

}

216

return true;

Chris Lattner

a1ec1dd

2006-02-24 02:13:12 +0000

[diff] [blame]

217

}

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

218

Dan Gohman

5ea74d5

2009-07-31 18:16:33 +0000

[diff] [blame]

219

void InsertVRSaveCode(MachineFunction &MF);

Chris Lattner

2006-03-16 18:25:23 +0000

[diff] [blame]

220

Craig Topper

2014-04-29 07:57:37 +0000

[diff] [blame]

221

const char *getPassName() const override {

Chris Lattner

2005-08-17 19:33:03 +0000

[diff] [blame]

222

return "PowerPC DAG->DAG Pattern Instruction Selection";

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

223

}

224

Chris Lattner

03e08ee

2005-09-13 22:03:06 +0000

[diff] [blame]

225

// Include the pieces autogenerated from the target description.

Chris Lattner

0921e3b

2005-10-14 23:37:35 +0000

[diff] [blame]

226

#include "PPCGenDAGISel.inc"

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

227

Chris Lattner

259e6c7

2005-10-06 18:45:51 +0000

[diff] [blame]

228

private:

Dan Gohman

2010-01-05 01:24:18 +0000

[diff] [blame]

229

SDNode *SelectSETCC(SDNode *N);

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

230

231

void PeepholePPC64();

Hal Finkel

2014-12-12 23:59:36 +0000

[diff] [blame]

232

void PeepholePPC64ZExt();

Eric Christopher

02e1804

2014-05-14 00:31:15 +0000

[diff] [blame]

233

void PeepholeCROps();

Hal Finkel

2014-02-28 06:11:16 +0000

[diff] [blame]

234

Hal Finkel

2015-01-03 01:16:37 +0000

[diff] [blame]

235

SDValue combineToCMPB(SDNode *N);

Hal Finkel

200d2ad

2015-01-05 21:10:24 +0000

[diff] [blame]

236

void foldBoolExts(SDValue &Res, SDNode *&N);

Hal Finkel

2015-01-03 01:16:37 +0000

[diff] [blame]

237

Hal Finkel

2014-02-28 06:11:16 +0000

[diff] [blame]

238

bool AllUsersSelectZero(SDNode *N);

239

void SwapAllSelectUsers(SDNode *N);

Hal Finkel

2015-02-25 21:36:59 +0000

[diff] [blame]

240

241

SDNode *transferMemOperands(SDNode *N, SDNode *Result);

Chris Lattner

2005-08-17 19:33:03 +0000

[diff] [blame]

};

}

Chris Lattner

2006-03-16 18:25:23 +0000

[diff] [blame]

245

/// InsertVRSaveCode - Once the entire function has been instruction selected,

246

/// all virtual registers are created and all machine instructions are built,

247

/// check to see if we need to save/restore VRSAVE. If so, do it.

Dan Gohman

5ea74d5

2009-07-31 18:16:33 +0000

[diff] [blame]

248

void PPCDAGToDAGISel::InsertVRSaveCode(MachineFunction &Fn) {

Chris Lattner

2006-03-13 21:52:10 +0000

[diff] [blame]

249

// Check to see if this function uses vector registers, which means we have to

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

250

// save and restore the VRSAVE register and update it with the regs we use.

Chris Lattner

2006-03-13 21:52:10 +0000

[diff] [blame]

251

//

Dan Gohman

4a61882

2010-02-10 16:03:48 +0000

[diff] [blame]

252

// In this case, there will be virtual registers of vector type created

Chris Lattner

2006-03-13 21:52:10 +0000

[diff] [blame]

253

// by the scheduler. Detect them now.

Chris Lattner

2006-03-13 21:52:10 +0000

[diff] [blame]

254

bool HasVectorVReg = false;

Jakob Stoklund Olesen

4a7b48d

2011-01-08 23:11:11 +0000

[diff] [blame]

255

for (unsigned i = 0, e = RegInfo->getNumVirtRegs(); i != e; ++i) {

256

unsigned Reg = TargetRegisterInfo::index2VirtReg(i);

257

if (RegInfo->getRegClass(Reg) == &PPC::VRRCRegClass) {

Chris Lattner

2006-03-13 21:52:10 +0000

[diff] [blame]

258

HasVectorVReg = true;

259

break;

260

}

Jakob Stoklund Olesen

4a7b48d

2011-01-08 23:11:11 +0000

[diff] [blame]

261

}

Chris Lattner

2006-03-16 18:25:23 +0000

[diff] [blame]

262

if (!HasVectorVReg) return; // nothing to do.

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

263

Chris Lattner

2006-03-13 21:52:10 +0000

[diff] [blame]

264

// If we have a vector register, we want to emit code into the entry and exit

265

// blocks to save and restore the VRSAVE register. We do this here (instead

266

// of marking all vector instructions as clobbering VRSAVE) for two reasons:

267

//

268

// 1. This (trivially) reduces the load on the register allocator, by not

269

// having to represent the live range of the VRSAVE register.

270

// 2. This (more significantly) allows us to create a temporary virtual

271

// register to hold the saved VRSAVE value, allowing this temporary to be

272

// register allocated, instead of forcing it to be spilled to the stack.

Chris Lattner

2006-03-16 18:25:23 +0000

[diff] [blame]

273

274

// Create two vregs - one to hold the VRSAVE register that is live-in to the

275

// function and one for the value after having bits or'd into it.

Chris Lattner

a10fff5

2007-12-31 04:13:23 +0000

[diff] [blame]

276

unsigned InVRSAVE = RegInfo->createVirtualRegister(&PPC::GPRCRegClass);

277

unsigned UpdatedVRSAVE = RegInfo->createVirtualRegister(&PPC::GPRCRegClass);

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

278

Eric Christopher

2015-01-30 22:02:31 +0000

[diff] [blame]

279

const TargetInstrInfo &TII = *PPCSubTarget->getInstrInfo();

Chris Lattner

2006-03-16 18:25:23 +0000

[diff] [blame]

280

MachineBasicBlock &EntryBB = *Fn.begin();

Chris Lattner

6f306d7

2010-04-02 20:16:16 +0000

[diff] [blame]

281

DebugLoc dl;

Chris Lattner

2006-03-16 18:25:23 +0000

[diff] [blame]

282

// Emit the following code into the entry block:

283

// InVRSAVE = MFVRSAVE

284

// UpdatedVRSAVE = UPDATE_VRSAVE InVRSAVE

285

// MTVRSAVE UpdatedVRSAVE

286

MachineBasicBlock::iterator IP = EntryBB.begin(); // Insert Point

Dale Johannesen

2009-02-13 02:27:39 +0000

[diff] [blame]

287

BuildMI(EntryBB, IP, dl, TII.get(PPC::MFVRSAVE), InVRSAVE);

288

BuildMI(EntryBB, IP, dl, TII.get(PPC::UPDATE_VRSAVE),

Chris Lattner

a98c679

2008-01-07 01:56:04 +0000

[diff] [blame]

289

UpdatedVRSAVE).addReg(InVRSAVE);

Dale Johannesen

2009-02-13 02:27:39 +0000

[diff] [blame]

290

BuildMI(EntryBB, IP, dl, TII.get(PPC::MTVRSAVE)).addReg(UpdatedVRSAVE);

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

291

Chris Lattner

2006-03-16 18:25:23 +0000

[diff] [blame]

292

// Find all return blocks, outputting a restore in each epilog.

Chris Lattner

2006-03-16 18:25:23 +0000

[diff] [blame]

293

for (MachineFunction::iterator BB = Fn.begin(), E = Fn.end(); BB != E; ++BB) {

Evan Cheng

7f8e563

2011-12-07 07:15:52 +0000

[diff] [blame]

294

if (!BB->empty() && BB->back().isReturn()) {

Chris Lattner

2006-03-16 18:25:23 +0000

[diff] [blame]

295

IP = BB->end(); --IP;

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

296

Chris Lattner

2006-03-16 18:25:23 +0000

[diff] [blame]

297

// Skip over all terminator instructions, which are part of the return

298

// sequence.

299

MachineBasicBlock::iterator I2 = IP;

Evan Cheng

7f8e563

2011-12-07 07:15:52 +0000

[diff] [blame]

300

while (I2 != BB->begin() && (--I2)->isTerminator())

Chris Lattner

2006-03-16 18:25:23 +0000

[diff] [blame]

301

IP = I2;

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

302

Chris Lattner

2006-03-16 18:25:23 +0000

[diff] [blame]

303

// Emit: MTVRSAVE InVRSave

Dale Johannesen

2009-02-13 02:27:39 +0000

[diff] [blame]

304

BuildMI(*BB, IP, dl, TII.get(PPC::MTVRSAVE)).addReg(InVRSAVE);

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

305

}

Chris Lattner

2006-03-13 21:52:10 +0000

[diff] [blame]

306

}

Chris Lattner

259e6c7

2005-10-06 18:45:51 +0000

[diff] [blame]

307

}

Chris Lattner

8ae9525

2005-09-03 01:17:22 +0000

[diff] [blame]

308

Chris Lattner

2006-03-16 18:25:23 +0000

[diff] [blame]

309

Chris Lattner

2005-08-19 22:38:53 +0000

[diff] [blame]

310

/// getGlobalBaseReg - Output the instructions required to put the

311

/// base address to use for accessing globals into a register.

312

///

Evan Cheng

61413a3

2006-08-26 05:34:46 +0000

[diff] [blame]

313

SDNode *PPCDAGToDAGISel::getGlobalBaseReg() {

Chris Lattner

2005-08-19 22:38:53 +0000

[diff] [blame]

314

if (!GlobalBaseReg) {

Eric Christopher

2015-01-30 22:02:31 +0000

[diff] [blame]

315

const TargetInstrInfo &TII = *PPCSubTarget->getInstrInfo();

Chris Lattner

2005-08-19 22:38:53 +0000

[diff] [blame]

316

// Insert the set of GlobalBaseReg into the first MBB of the function

Dan Gohman

fca8968

2009-08-15 02:07:36 +0000

[diff] [blame]

317

MachineBasicBlock &FirstMBB = MF->front();

Chris Lattner

2005-08-19 22:38:53 +0000

[diff] [blame]

318

MachineBasicBlock::iterator MBBI = FirstMBB.begin();

Justin Hibbits

2014-11-12 15:16:30 +0000

[diff] [blame]

319

const Module *M = MF->getFunction()->getParent();

Chris Lattner

6f306d7

2010-04-02 20:16:16 +0000

[diff] [blame]

320

DebugLoc dl;

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

321

Eric Christopher

2014-05-22 01:07:24 +0000

[diff] [blame]

322

if (PPCLowering->getPointerTy() == MVT::i32) {

Justin Hibbits

2014-11-12 15:16:30 +0000

[diff] [blame]

323

if (PPCSubTarget->isTargetELF()) {

Hal Finkel

2014-07-18 23:29:49 +0000

[diff] [blame]

324

GlobalBaseReg = PPC::R30;

Justin Hibbits

2014-11-12 15:16:30 +0000

[diff] [blame]

325

if (M->getPICLevel() == PICLevel::Small) {

326

BuildMI(FirstMBB, MBBI, dl, TII.get(PPC::MoveGOTtoLR));

327

BuildMI(FirstMBB, MBBI, dl, TII.get(PPC::MFLR), GlobalBaseReg);

Justin Hibbits

98a532d

2015-01-08 15:47:19 +0000

[diff] [blame]

328

MF->getInfo<PPCFunctionInfo>()->setUsesPICBase(true);

Justin Hibbits

2014-11-12 15:16:30 +0000

[diff] [blame]

329

} else {

330

BuildMI(FirstMBB, MBBI, dl, TII.get(PPC::MovePCtoLR));

331

BuildMI(FirstMBB, MBBI, dl, TII.get(PPC::MFLR), GlobalBaseReg);

332

unsigned TempReg = RegInfo->createVirtualRegister(&PPC::GPRCRegClass);

333

BuildMI(FirstMBB, MBBI, dl,

Hal Finkel

2015-02-25 21:36:59 +0000

[diff] [blame]

334

TII.get(PPC::UpdateGBR), GlobalBaseReg)

Justin Hibbits

2014-11-12 15:16:30 +0000

[diff] [blame]

335

.addReg(TempReg, RegState::Define).addReg(GlobalBaseReg);

336

MF->getInfo<PPCFunctionInfo>()->setUsesPICBase(true);

337

}

338

} else {

Hal Finkel

2014-07-18 23:29:49 +0000

[diff] [blame]

339

GlobalBaseReg =

340

RegInfo->createVirtualRegister(&PPC::GPRC_NOR0RegClass);

Justin Hibbits

2014-11-12 15:16:30 +0000

[diff] [blame]

341

BuildMI(FirstMBB, MBBI, dl, TII.get(PPC::MovePCtoLR));

342

BuildMI(FirstMBB, MBBI, dl, TII.get(PPC::MFLR), GlobalBaseReg);

Hal Finkel

2014-07-18 23:29:49 +0000

[diff] [blame]

343

}

Chris Lattner

b542925

2006-11-14 18:43:11 +0000

[diff] [blame]

344

} else {

Hal Finkel

6daf2aa

2014-03-06 01:28:23 +0000

[diff] [blame]

345

GlobalBaseReg = RegInfo->createVirtualRegister(&PPC::G8RC_NOX0RegClass);

Cameron Zwarich

dadd733

2011-05-19 02:56:28 +0000

[diff] [blame]

346

BuildMI(FirstMBB, MBBI, dl, TII.get(PPC::MovePCtoLR8));

Dale Johannesen

2009-02-13 02:27:39 +0000

[diff] [blame]

347

BuildMI(FirstMBB, MBBI, dl, TII.get(PPC::MFLR8), GlobalBaseReg);

Chris Lattner

b542925

2006-11-14 18:43:11 +0000

[diff] [blame]

348

}

Chris Lattner

2005-08-19 22:38:53 +0000

[diff] [blame]

349

}

Gabor Greif

81d6a38

2008-08-31 15:37:04 +0000

[diff] [blame]

350

return CurDAG->getRegister(GlobalBaseReg,

Eric Christopher

2014-05-22 01:07:24 +0000

[diff] [blame]

351

PPCLowering->getPointerTy()).getNode();

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

352

}

353

354

/// isIntS16Immediate - This method tests to see if the node is either a 32-bit

355

/// or 64-bit immediate, and if the value can be accurately represented as a

356

/// sign extension from a 16-bit value. If so, this returns true and the

357

/// immediate.

358

static bool isIntS16Immediate(SDNode *N, short &Imm) {

359

if (N->getOpcode() != ISD::Constant)

360

return false;

361

Dan Gohman

2008-09-12 16:56:44 +0000

[diff] [blame]

362

Imm = (short)cast<ConstantSDNode>(N)->getZExtValue();

Owen Anderson

2009-08-11 20:47:22 +0000

[diff] [blame]

363

if (N->getValueType(0) == MVT::i32)

Dan Gohman

2008-09-12 16:56:44 +0000

[diff] [blame]

364

return Imm == (int32_t)cast<ConstantSDNode>(N)->getZExtValue();

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

365

else

Dan Gohman

2008-09-12 16:56:44 +0000

[diff] [blame]

366

return Imm == (int64_t)cast<ConstantSDNode>(N)->getZExtValue();

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

367

}

368

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

369

static bool isIntS16Immediate(SDValue Op, short &Imm) {

Gabor Greif

2008-08-28 21:40:38 +0000

[diff] [blame]

370

return isIntS16Immediate(Op.getNode(), Imm);

Chris Lattner

2005-08-19 22:38:53 +0000

[diff] [blame]

}

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

374

/// isInt32Immediate - This method tests to see if the node is a 32-bit constant

375

/// operand. If so Imm will receive the 32-bit value.

376

static bool isInt32Immediate(SDNode *N, unsigned &Imm) {

Owen Anderson

2009-08-11 20:47:22 +0000

[diff] [blame]

377

if (N->getOpcode() == ISD::Constant && N->getValueType(0) == MVT::i32) {

Dan Gohman

2008-09-12 16:56:44 +0000

[diff] [blame]

378

Imm = cast<ConstantSDNode>(N)->getZExtValue();

Nate Begeman

72d6f88

2005-08-18 05:00:13 +0000

[diff] [blame]

return true;

}

return false;

}

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

384

/// isInt64Immediate - This method tests to see if the node is a 64-bit constant

385

/// operand. If so Imm will receive the 64-bit value.

386

static bool isInt64Immediate(SDNode *N, uint64_t &Imm) {

Owen Anderson

2009-08-11 20:47:22 +0000

[diff] [blame]

387

if (N->getOpcode() == ISD::Constant && N->getValueType(0) == MVT::i64) {

Dan Gohman

2008-09-12 16:56:44 +0000

[diff] [blame]

388

Imm = cast<ConstantSDNode>(N)->getZExtValue();

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

return true;

}

return false;

}

// isInt32Immediate - This method tests to see if a constant operand.

395

// If so Imm will receive the 32 bit value.

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

396

static bool isInt32Immediate(SDValue N, unsigned &Imm) {

Gabor Greif

2008-08-28 21:40:38 +0000

[diff] [blame]

397

return isInt32Immediate(N.getNode(), Imm);

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

}

// isOpcWithIntImmediate - This method tests to see if the node is a specific

402

// opcode and that it has a immediate integer right operand.

403

// If so Imm will receive the 32 bit value.

404

static bool isOpcWithIntImmediate(SDNode *N, unsigned Opc, unsigned& Imm) {

Gabor Greif

81d6a38

2008-08-31 15:37:04 +0000

[diff] [blame]

405

return N->getOpcode() == Opc

406

&& isInt32Immediate(N->getOperand(1).getNode(), Imm);

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

407

}

408

Hal Finkel

2014-12-11 22:51:06 +0000

[diff] [blame]

409

SDNode *PPCDAGToDAGISel::getFrameIndex(SDNode *SN, SDNode *N, unsigned Offset) {

410

SDLoc dl(SN);

411

int FI = cast<FrameIndexSDNode>(N)->getIndex();

412

SDValue TFI = CurDAG->getTargetFrameIndex(FI, N->getValueType(0));

413

unsigned Opc = N->getValueType(0) == MVT::i32 ? PPC::ADDI : PPC::ADDI8;

414

if (SN->hasOneUse())

415

return CurDAG->SelectNodeTo(SN, Opc, N->getValueType(0), TFI,

416

getSmallIPtrImm(Offset));

417

return CurDAG->getMachineNode(Opc, dl, N->getValueType(0), TFI,

418

getSmallIPtrImm(Offset));

419

}

420

Nate Begeman

2006-09-22 05:01:56 +0000

[diff] [blame]

421

bool PPCDAGToDAGISel::isRunOfOnes(unsigned Val, unsigned &MB, unsigned &ME) {

Hal Finkel

ff3ea80

2013-07-11 16:31:51 +0000

[diff] [blame]

if (!Val)

return false;

Nate Begeman

2005-08-18 07:30:46 +0000

[diff] [blame]

425

if (isShiftedMask_32(Val)) {

426

// look for the first non-zero bit

Michael J. Spencer

2013-05-24 22:23:49 +0000

[diff] [blame]

427

MB = countLeadingZeros(Val);

Nate Begeman

2005-08-18 07:30:46 +0000

[diff] [blame]

428

// look for the first zero bit after the run of ones

Michael J. Spencer

2013-05-24 22:23:49 +0000

[diff] [blame]

429

ME = countLeadingZeros((Val - 1) ^ Val);

Nate Begeman

2005-08-18 07:30:46 +0000

[diff] [blame]

430

return true;

Chris Lattner

666512c

2005-08-25 04:47:18 +0000

[diff] [blame]

431

} else {

432

Val = ~Val; // invert mask

433

if (isShiftedMask_32(Val)) {

434

// effectively look for the first zero bit

Michael J. Spencer

2013-05-24 22:23:49 +0000

[diff] [blame]

435

ME = countLeadingZeros(Val) - 1;

Chris Lattner

666512c

2005-08-25 04:47:18 +0000

[diff] [blame]

436

// effectively look for the first one bit after the run of zeros

Michael J. Spencer

2013-05-24 22:23:49 +0000

[diff] [blame]

437

MB = countLeadingZeros((Val - 1) ^ Val) + 1;

Chris Lattner

666512c

2005-08-25 04:47:18 +0000

[diff] [blame]

438

return true;

439

}

Nate Begeman

2005-08-18 07:30:46 +0000

[diff] [blame]

}

// no run present

return false;

}

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

445

bool PPCDAGToDAGISel::isRotateAndMask(SDNode *N, unsigned Mask,

446

bool isShiftMask, unsigned &SH,

Nate Begeman

2006-09-22 05:01:56 +0000

[diff] [blame]

447

unsigned &MB, unsigned &ME) {

Nate Begeman

92e7750

2005-10-19 00:05:37 +0000

[diff] [blame]

448

// Don't even go down this path for i64, since different logic will be

449

// necessary for rldicl/rldicr/rldimi.

Owen Anderson

2009-08-11 20:47:22 +0000

[diff] [blame]

450

if (N->getValueType(0) != MVT::i32)

Nate Begeman

92e7750

2005-10-19 00:05:37 +0000

[diff] [blame]

451

return false;

452

Nate Begeman

2005-08-18 07:30:46 +0000

[diff] [blame]

453

unsigned Shift = 32;

454

unsigned Indeterminant = ~0; // bit mask marking indeterminant results

455

unsigned Opcode = N->getOpcode();

Chris Lattner

e413b60

2005-08-30 00:59:16 +0000

[diff] [blame]

456

if (N->getNumOperands() != 2 ||

Gabor Greif

2008-08-28 21:40:38 +0000

[diff] [blame]

457

!isInt32Immediate(N->getOperand(1).getNode(), Shift) || (Shift > 31))

Nate Begeman

2005-08-18 07:30:46 +0000

[diff] [blame]

458

return false;

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

459

Nate Begeman

2005-08-18 07:30:46 +0000

[diff] [blame]

460

if (Opcode == ISD::SHL) {

461

// apply shift left to mask if it comes first

Dale Johannesen

86dcae1

2009-11-24 01:09:07 +0000

[diff] [blame]

462

if (isShiftMask) Mask = Mask << Shift;

Nate Begeman

2005-08-18 07:30:46 +0000

[diff] [blame]

463

// determine which bits are made indeterminant by shift

464

Indeterminant = ~(0xFFFFFFFFu << Shift);

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

465

} else if (Opcode == ISD::SRL) {

Nate Begeman

2005-08-18 07:30:46 +0000

[diff] [blame]

466

// apply shift right to mask if it comes first

Dale Johannesen

86dcae1

2009-11-24 01:09:07 +0000

[diff] [blame]

467

if (isShiftMask) Mask = Mask >> Shift;

Nate Begeman

2005-08-18 07:30:46 +0000

[diff] [blame]

468

// determine which bits are made indeterminant by shift

469

Indeterminant = ~(0xFFFFFFFFu >> Shift);

470

// adjust for the left rotate

471

Shift = 32 - Shift;

Nate Begeman

2006-09-22 05:01:56 +0000

[diff] [blame]

472

} else if (Opcode == ISD::ROTL) {

473

Indeterminant = 0;

Nate Begeman

2005-08-18 07:30:46 +0000

[diff] [blame]

474

} else {

475

return false;

476

}

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

477

Nate Begeman

2005-08-18 07:30:46 +0000

[diff] [blame]

478

// if the mask doesn't intersect any Indeterminant bits

479

if (Mask && !(Mask & Indeterminant)) {

Chris Lattner

a296339

2006-05-12 16:29:37 +0000

[diff] [blame]

480

SH = Shift & 31;

Nate Begeman

2005-08-18 07:30:46 +0000

[diff] [blame]

481

// make sure the mask is still a mask (wrap arounds may not be)

482

return isRunOfOnes(Mask, MB, ME);

}

return false;

}

Nate Begeman

2005-08-19 00:38:14 +0000

[diff] [blame]

487

/// SelectBitfieldInsert - turn an or of two masked values into

488

/// the rotate left word immediate then mask insert (rlwimi) instruction.

Nate Begeman

0b71e00

2005-10-18 00:28:58 +0000

[diff] [blame]

489

SDNode *PPCDAGToDAGISel::SelectBitfieldInsert(SDNode *N) {

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

490

SDValue Op0 = N->getOperand(0);

491

SDValue Op1 = N->getOperand(1);

Andrew Trick

2013-05-25 02:42:55 +0000

[diff] [blame]

492

SDLoc dl(N);

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

493

Dan Gohman

f19609a

2008-02-27 01:23:58 +0000

[diff] [blame]

494

APInt LKZ, LKO, RKZ, RKO;

Jay Foad

a0653a3

2014-05-14 21:14:37 +0000

[diff] [blame]

495

CurDAG->computeKnownBits(Op0, LKZ, LKO);

496

CurDAG->computeKnownBits(Op1, RKZ, RKO);

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

497

Dan Gohman

f19609a

2008-02-27 01:23:58 +0000

[diff] [blame]

498

unsigned TargetMask = LKZ.getZExtValue();

499

unsigned InsertMask = RKZ.getZExtValue();

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

500

Nate Begeman

2006-05-08 17:38:32 +0000

[diff] [blame]

501

if ((TargetMask | InsertMask) == 0xFFFFFFFF) {

502

unsigned Op0Opc = Op0.getOpcode();

503

unsigned Op1Opc = Op1.getOpcode();

504

unsigned Value, SH = 0;

505

TargetMask = ~TargetMask;

506

InsertMask = ~InsertMask;

Nate Begeman

2006-05-07 00:23:38 +0000

[diff] [blame]

507

Nate Begeman

2006-05-08 17:38:32 +0000

[diff] [blame]

508

// If the LHS has a foldable shift and the RHS does not, then swap it to the

509

// RHS so that we can fold the shift into the insert.

Nate Begeman

2006-05-07 00:23:38 +0000

[diff] [blame]

510

if (Op0Opc == ISD::AND && Op1Opc == ISD::AND) {

511

if (Op0.getOperand(0).getOpcode() == ISD::SHL ||

512

Op0.getOperand(0).getOpcode() == ISD::SRL) {

513

if (Op1.getOperand(0).getOpcode() != ISD::SHL &&

514

Op1.getOperand(0).getOpcode() != ISD::SRL) {

515

std::swap(Op0, Op1);

516

std::swap(Op0Opc, Op1Opc);

Nate Begeman

2006-05-08 17:38:32 +0000

[diff] [blame]

517

std::swap(TargetMask, InsertMask);

Nate Begeman

2006-05-07 00:23:38 +0000

[diff] [blame]

518

}

Nate Begeman

2005-08-19 00:38:14 +0000

[diff] [blame]

519

}

Nate Begeman

2006-05-08 17:38:32 +0000

[diff] [blame]

520

} else if (Op0Opc == ISD::SHL || Op0Opc == ISD::SRL) {

521

if (Op1Opc == ISD::AND && Op1.getOperand(0).getOpcode() != ISD::SHL &&

522

Op1.getOperand(0).getOpcode() != ISD::SRL) {

523

std::swap(Op0, Op1);

524

std::swap(Op0Opc, Op1Opc);

525

std::swap(TargetMask, InsertMask);

526

}

Nate Begeman

2005-08-19 00:38:14 +0000

[diff] [blame]

527

}

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

528

Nate Begeman

2006-05-07 00:23:38 +0000

[diff] [blame]

529

unsigned MB, ME;

Hal Finkel

ff3ea80

2013-07-11 16:31:51 +0000

[diff] [blame]

530

if (isRunOfOnes(InsertMask, MB, ME)) {

Dale Johannesen

8495a50

2009-11-20 22:16:40 +0000

[diff] [blame]

531

SDValue Tmp1, Tmp2;

Nate Begeman

2006-05-07 00:23:38 +0000

[diff] [blame]

532

533

if ((Op1Opc == ISD::SHL || Op1Opc == ISD::SRL) &&

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

534

isInt32Immediate(Op1.getOperand(1), Value)) {

Nate Begeman

2006-05-07 00:23:38 +0000

[diff] [blame]

535

Op1 = Op1.getOperand(0);

536

SH = (Op1Opc == ISD::SHL) ? Value : 32 - Value;

537

}

538

if (Op1Opc == ISD::AND) {

Hal Finkel

d9963c7

2014-04-13 17:10:58 +0000

[diff] [blame]

539

// The AND mask might not be a constant, and we need to make sure that

540

// if we're going to fold the masking with the insert, all bits not

541

// know to be zero in the mask are known to be one.

542

APInt MKZ, MKO;

Jay Foad

a0653a3

2014-05-14 21:14:37 +0000

[diff] [blame]

543

CurDAG->computeKnownBits(Op1.getOperand(1), MKZ, MKO);

Hal Finkel

d9963c7

2014-04-13 17:10:58 +0000

[diff] [blame]

544

bool CanFoldMask = InsertMask == MKO.getZExtValue();

545

Nate Begeman

2006-05-07 00:23:38 +0000

[diff] [blame]

546

unsigned SHOpc = Op1.getOperand(0).getOpcode();

Hal Finkel

d9963c7

2014-04-13 17:10:58 +0000

[diff] [blame]

547

if ((SHOpc == ISD::SHL || SHOpc == ISD::SRL) && CanFoldMask &&

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

548

isInt32Immediate(Op1.getOperand(0).getOperand(1), Value)) {

Eric Christopher

02e1804

2014-05-14 00:31:15 +0000

[diff] [blame]

549

// Note that Value must be in range here (less than 32) because

550

// otherwise there would not be any bits set in InsertMask.

Nate Begeman

2006-05-07 00:23:38 +0000

[diff] [blame]

551

Op1 = Op1.getOperand(0).getOperand(0);

552

SH = (SHOpc == ISD::SHL) ? Value : 32 - Value;

Nate Begeman

2006-05-07 00:23:38 +0000

[diff] [blame]

553

}

554

}

Dale Johannesen

8495a50

2009-11-20 22:16:40 +0000

[diff] [blame]

555

Chris Lattner

a296339

2006-05-12 16:29:37 +0000

[diff] [blame]

556

SH &= 31;

Dale Johannesen

8495a50

2009-11-20 22:16:40 +0000

[diff] [blame]

557

SDValue Ops[] = { Op0, Op1, getI32Imm(SH), getI32Imm(MB),

Evan Cheng

2006-08-27 08:14:06 +0000

[diff] [blame]

558

getI32Imm(ME) };

Michael Liao

2013-04-19 22:22:57 +0000

[diff] [blame]

559

return CurDAG->getMachineNode(PPC::RLWIMI, dl, MVT::i32, Ops);

Nate Begeman

2005-08-19 00:38:14 +0000

[diff] [blame]

560

}

Nate Begeman

2005-08-19 00:38:14 +0000

[diff] [blame]

561

}

Craig Topper

2014-04-25 05:30:21 +0000

[diff] [blame]

562

return nullptr;

Nate Begeman

2005-08-19 00:38:14 +0000

[diff] [blame]

563

}

564

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

565

// Predict the number of instructions that would be generated by calling

566

// SelectInt64(N).

Hal Finkel

2015-01-04 12:35:03 +0000

[diff] [blame]

567

static unsigned SelectInt64CountDirect(int64_t Imm) {

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

568

// Assume no remaining bits.

569

unsigned Remainder = 0;

570

// Assume no shift required.

571

unsigned Shift = 0;

572

573

// If it can't be represented as a 32 bit value.

574

if (!isInt<32>(Imm)) {

575

Shift = countTrailingZeros<uint64_t>(Imm);

576

int64_t ImmSh = static_cast<uint64_t>(Imm) >> Shift;

577

578

// If the shifted value fits 32 bits.

579

if (isInt<32>(ImmSh)) {

580

// Go with the shifted value.

581

Imm = ImmSh;

582

} else {

583

// Still stuck with a 64 bit value.

Remainder = Imm;

Shift = 32;

Imm >>= 32;

}

}

// Intermediate operand.

591

unsigned Result = 0;

592

593

// Handle first 32 bits.

594

unsigned Lo = Imm & 0xFFFF;

595

unsigned Hi = (Imm >> 16) & 0xFFFF;

596

597

// Simple value.

598

if (isInt<16>(Imm)) {

// Just the Lo bits.

++Result;

} else if (Lo) {

// Handle the Hi bits and Lo bits.

Result += 2;

} else {

// Just the Hi bits.

++Result;

}

// If no shift, we're done.

610

if (!Shift) return Result;

611

612

// Shift for next step if the upper 32-bits were not zero.

if (Imm)

++Result;

// Add in the last bits as required.

617

if ((Hi = (Remainder >> 16) & 0xFFFF))

618

++Result;

619

if ((Lo = Remainder & 0xFFFF))

++Result;

return Result;

}

Hal Finkel

2015-01-04 15:43:55 +0000

[diff] [blame]

625

static uint64_t Rot64(uint64_t Imm, unsigned R) {

626

return (Imm << R) | (Imm >> (64 - R));

627

}

628

Hal Finkel

2015-01-04 12:35:03 +0000

[diff] [blame]

629

static unsigned SelectInt64Count(int64_t Imm) {

Hal Finkel

2015-01-04 15:43:55 +0000

[diff] [blame]

630

unsigned Count = SelectInt64CountDirect(Imm);

Hal Finkel

2015-01-05 03:41:38 +0000

[diff] [blame]

631

if (Count == 1)

632

return Count;

Hal Finkel

2015-01-04 12:35:03 +0000

[diff] [blame]

633

Hal Finkel

2015-01-04 15:43:55 +0000

[diff] [blame]

634

for (unsigned r = 1; r < 63; ++r) {

Hal Finkel

2015-01-05 03:41:38 +0000

[diff] [blame]

635

uint64_t RImm = Rot64(Imm, r);

636

unsigned RCount = SelectInt64CountDirect(RImm) + 1;

637

Count = std::min(Count, RCount);

638

639

// See comments in SelectInt64 for an explanation of the logic below.

640

unsigned LS = findLastSet(RImm);

if (LS != r-1)

continue;

uint64_t OnesMask = -(int64_t) (UINT64_C(1) << (LS+1));

645

uint64_t RImmWithOnes = RImm | OnesMask;

646

647

RCount = SelectInt64CountDirect(RImmWithOnes) + 1;

Hal Finkel

2015-01-04 15:43:55 +0000

[diff] [blame]

648

Count = std::min(Count, RCount);

649

}

Hal Finkel

2015-01-04 12:35:03 +0000

[diff] [blame]

650

Hal Finkel

2015-01-04 15:43:55 +0000

[diff] [blame]

651

return Count;

Hal Finkel

2015-01-04 12:35:03 +0000

[diff] [blame]

652

}

653

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

654

// Select a 64-bit constant. For cost-modeling purposes, SelectInt64Count

655

// (above) needs to be kept in sync with this function.

Hal Finkel

2015-01-04 12:35:03 +0000

[diff] [blame]

656

static SDNode *SelectInt64Direct(SelectionDAG *CurDAG, SDLoc dl, int64_t Imm) {

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

657

// Assume no remaining bits.

658

unsigned Remainder = 0;

659

// Assume no shift required.

660

unsigned Shift = 0;

661

662

// If it can't be represented as a 32 bit value.

663

if (!isInt<32>(Imm)) {

664

Shift = countTrailingZeros<uint64_t>(Imm);

665

int64_t ImmSh = static_cast<uint64_t>(Imm) >> Shift;

666

667

// If the shifted value fits 32 bits.

668

if (isInt<32>(ImmSh)) {

669

// Go with the shifted value.

670

Imm = ImmSh;

671

} else {

672

// Still stuck with a 64 bit value.

Remainder = Imm;

Shift = 32;

Imm >>= 32;

}

}

// Intermediate operand.

680

SDNode *Result;

681

682

// Handle first 32 bits.

683

unsigned Lo = Imm & 0xFFFF;

684

unsigned Hi = (Imm >> 16) & 0xFFFF;

685

686

auto getI32Imm = [CurDAG](unsigned Imm) {

687

return CurDAG->getTargetConstant(Imm, MVT::i32);

};

// Simple value.

if (isInt<16>(Imm)) {

692

// Just the Lo bits.

693

Result = CurDAG->getMachineNode(PPC::LI8, dl, MVT::i64, getI32Imm(Lo));

694

} else if (Lo) {

695

// Handle the Hi bits.

696

unsigned OpC = Hi ? PPC::LIS8 : PPC::LI8;

697

Result = CurDAG->getMachineNode(OpC, dl, MVT::i64, getI32Imm(Hi));

698

// And Lo bits.

699

Result = CurDAG->getMachineNode(PPC::ORI8, dl, MVT::i64,

700

SDValue(Result, 0), getI32Imm(Lo));

701

} else {

702

// Just the Hi bits.

703

Result = CurDAG->getMachineNode(PPC::LIS8, dl, MVT::i64, getI32Imm(Hi));

704

}

705

706

// If no shift, we're done.

707

if (!Shift) return Result;

708

709

// Shift for next step if the upper 32-bits were not zero.

710

if (Imm) {

711

Result = CurDAG->getMachineNode(PPC::RLDICR, dl, MVT::i64,

712

SDValue(Result, 0),

713

getI32Imm(Shift),

714

getI32Imm(63 - Shift));

715

}

716

717

// Add in the last bits as required.

718

if ((Hi = (Remainder >> 16) & 0xFFFF)) {

719

Result = CurDAG->getMachineNode(PPC::ORIS8, dl, MVT::i64,

720

SDValue(Result, 0), getI32Imm(Hi));

721

}

722

if ((Lo = Remainder & 0xFFFF)) {

723

Result = CurDAG->getMachineNode(PPC::ORI8, dl, MVT::i64,

724

SDValue(Result, 0), getI32Imm(Lo));

}

return Result;

}

Hal Finkel

2015-01-04 12:35:03 +0000

[diff] [blame]

730

static SDNode *SelectInt64(SelectionDAG *CurDAG, SDLoc dl, int64_t Imm) {

Hal Finkel

2015-01-04 15:43:55 +0000

[diff] [blame]

731

unsigned Count = SelectInt64CountDirect(Imm);

Hal Finkel

2015-01-05 03:41:38 +0000

[diff] [blame]

732

if (Count == 1)

733

return SelectInt64Direct(CurDAG, dl, Imm);

734

Hal Finkel

2015-01-04 15:43:55 +0000

[diff] [blame]

735

unsigned RMin = 0;

Hal Finkel

2015-01-04 12:35:03 +0000

[diff] [blame]

736

Hal Finkel

2015-01-05 03:41:38 +0000

[diff] [blame]

int64_t MatImm;

unsigned MaskEnd;

Hal Finkel

2015-01-04 15:43:55 +0000

[diff] [blame]

740

for (unsigned r = 1; r < 63; ++r) {

Hal Finkel

2015-01-05 03:41:38 +0000

[diff] [blame]

741

uint64_t RImm = Rot64(Imm, r);

742

unsigned RCount = SelectInt64CountDirect(RImm) + 1;

Hal Finkel

2015-01-04 15:43:55 +0000

[diff] [blame]

743

if (RCount < Count) {

744

Count = RCount;

745

RMin = r;

Hal Finkel

2015-01-05 03:41:38 +0000

[diff] [blame]

MatImm = RImm;

MaskEnd = 63;

}

// If the immediate to generate has many trailing zeros, it might be

751

// worthwhile to generate a rotated value with too many leading ones

752

// (because that's free with li/lis's sign-extension semantics), and then

753

// mask them off after rotation.

754

755

unsigned LS = findLastSet(RImm);

756

// We're adding (63-LS) higher-order ones, and we expect to mask them off

757

// after performing the inverse rotation by (64-r). So we need that:

758

// 63-LS == 64-r => LS == r-1

if (LS != r-1)

continue;

uint64_t OnesMask = -(int64_t) (UINT64_C(1) << (LS+1));

763

uint64_t RImmWithOnes = RImm | OnesMask;

764

765

RCount = SelectInt64CountDirect(RImmWithOnes) + 1;

766

if (RCount < Count) {

767

Count = RCount;

768

RMin = r;

769

MatImm = RImmWithOnes;

770

MaskEnd = LS;

Hal Finkel

2015-01-04 15:43:55 +0000

[diff] [blame]

771

}

Hal Finkel

2015-01-04 12:35:03 +0000

[diff] [blame]

772

}

773

Hal Finkel

2015-01-04 15:43:55 +0000

[diff] [blame]

774

if (!RMin)

775

return SelectInt64Direct(CurDAG, dl, Imm);

776

777

auto getI32Imm = [CurDAG](unsigned Imm) {

778

return CurDAG->getTargetConstant(Imm, MVT::i32);

779

};

780

Hal Finkel

2015-01-05 03:41:38 +0000

[diff] [blame]

781

SDValue Val = SDValue(SelectInt64Direct(CurDAG, dl, MatImm), 0);

782

return CurDAG->getMachineNode(PPC::RLDICR, dl, MVT::i64, Val,

783

getI32Imm(64 - RMin), getI32Imm(MaskEnd));

Hal Finkel

2015-01-04 12:35:03 +0000

[diff] [blame]

784

}

785

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

786

// Select a 64-bit constant.

787

static SDNode *SelectInt64(SelectionDAG *CurDAG, SDNode *N) {

SDLoc dl(N);

// Get 64 bit value.

int64_t Imm = cast<ConstantSDNode>(N)->getZExtValue();

792

return SelectInt64(CurDAG, dl, Imm);

793

}

794

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

795

namespace {

796

class BitPermutationSelector {

struct ValueBit {

SDValue V;

// The bit number in the value, using a convention where bit 0 is the

// lowest-order bit.

unsigned Idx;

enum Kind {

ConstZero,

Variable

} K;

ValueBit(SDValue V, unsigned I, Kind K = Variable)

810

: V(V), Idx(I), K(K) {}

811

ValueBit(Kind K = Variable)

812

: V(SDValue(nullptr, 0)), Idx(UINT32_MAX), K(K) {}

813

814

bool isZero() const {

815

return K == ConstZero;

816

}

817

818

bool hasValue() const {

819

return K == Variable;

820

}

821

822

SDValue getValue() const {

823

assert(hasValue() && "Cannot get the value of a constant bit");

return V;

}

unsigned getValueBitIndex() const {

828

assert(hasValue() && "Cannot get the value bit index of a constant bit");

return Idx;

}

};

// A bit group has the same underlying value and the same rotate factor.

struct BitGroup {

SDValue V;

unsigned RLAmt;

unsigned StartIdx, EndIdx;

838

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

839

// This rotation amount assumes that the lower 32 bits of the quantity are

840

// replicated in the high 32 bits by the rotation operator (which is done

841

// by rlwinm and friends in 64-bit mode).

842

bool Repl32;

843

// Did converting to Repl32 == true change the rotation factor? If it did,

844

// it decreased it by 32.

845

bool Repl32CR;

846

// Was this group coalesced after setting Repl32 to true?

847

bool Repl32Coalesced;

848

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

849

BitGroup(SDValue V, unsigned R, unsigned S, unsigned E)

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

850

: V(V), RLAmt(R), StartIdx(S), EndIdx(E), Repl32(false), Repl32CR(false),

851

Repl32Coalesced(false) {

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

852

DEBUG(dbgs() << "\tbit group for " << V.getNode() << " RLAmt = " << R <<

853

" [" << S << ", " << E << "]\n");

}

};

// Information on each (Value, RLAmt) pair (like the number of groups

858

// associated with each) used to choose the lowering method.

859

struct ValueRotInfo {

SDValue V;

unsigned RLAmt;

unsigned NumGroups;

unsigned FirstGroupStartIdx;

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

864

bool Repl32;

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

865

866

ValueRotInfo()

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

867

: RLAmt(UINT32_MAX), NumGroups(0), FirstGroupStartIdx(UINT32_MAX),

868

Repl32(false) {}

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

869

870

// For sorting (in reverse order) by NumGroups, and then by

871

// FirstGroupStartIdx.

872

bool operator < (const ValueRotInfo &Other) const {

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

873

// We need to sort so that the non-Repl32 come first because, when we're

874

// doing masking, the Repl32 bit groups might be subsumed into the 64-bit

875

// masking operation.

876

if (Repl32 < Other.Repl32)

877

return true;

878

else if (Repl32 > Other.Repl32)

879

return false;

880

else if (NumGroups > Other.NumGroups)

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

881

return true;

882

else if (NumGroups < Other.NumGroups)

883

return false;

884

else if (FirstGroupStartIdx < Other.FirstGroupStartIdx)

return true;

return false;

}

};

// Return true if something interesting was deduced, return false if we're

891

// providing only a generic representation of V (or something else likewise

892

// uninteresting for instruction selection).

893

bool getValueBits(SDValue V, SmallVector<ValueBit, 64> &Bits) {

894

switch (V.getOpcode()) {

895

default: break;

896

case ISD::ROTL:

897

if (isa<ConstantSDNode>(V.getOperand(1))) {

898

unsigned RotAmt = V.getConstantOperandVal(1);

899

900

SmallVector<ValueBit, 64> LHSBits(Bits.size());

901

getValueBits(V.getOperand(0), LHSBits);

902

903

for (unsigned i = 0; i < Bits.size(); ++i)

904

Bits[i] = LHSBits[i < RotAmt ? i + (Bits.size() - RotAmt) : i - RotAmt];

return true;

}

break;

case ISD::SHL:

if (isa<ConstantSDNode>(V.getOperand(1))) {

911

unsigned ShiftAmt = V.getConstantOperandVal(1);

912

913

SmallVector<ValueBit, 64> LHSBits(Bits.size());

914

getValueBits(V.getOperand(0), LHSBits);

915

916

for (unsigned i = ShiftAmt; i < Bits.size(); ++i)

917

Bits[i] = LHSBits[i - ShiftAmt];

918

919

for (unsigned i = 0; i < ShiftAmt; ++i)

920

Bits[i] = ValueBit(ValueBit::ConstZero);

return true;

}

break;

case ISD::SRL:

if (isa<ConstantSDNode>(V.getOperand(1))) {

927

unsigned ShiftAmt = V.getConstantOperandVal(1);

928

929

SmallVector<ValueBit, 64> LHSBits(Bits.size());

930

getValueBits(V.getOperand(0), LHSBits);

931

932

for (unsigned i = 0; i < Bits.size() - ShiftAmt; ++i)

933

Bits[i] = LHSBits[i + ShiftAmt];

934

935

for (unsigned i = Bits.size() - ShiftAmt; i < Bits.size(); ++i)

936

Bits[i] = ValueBit(ValueBit::ConstZero);

return true;

}

break;

case ISD::AND:

if (isa<ConstantSDNode>(V.getOperand(1))) {

943

uint64_t Mask = V.getConstantOperandVal(1);

944

945

SmallVector<ValueBit, 64> LHSBits(Bits.size());

946

bool LHSTrivial = getValueBits(V.getOperand(0), LHSBits);

947

948

for (unsigned i = 0; i < Bits.size(); ++i)

949

if (((Mask >> i) & 1) == 1)

950

Bits[i] = LHSBits[i];

951

else

952

Bits[i] = ValueBit(ValueBit::ConstZero);

953

954

// Mark this as interesting, only if the LHS was also interesting. This

955

// prevents the overall procedure from matching a single immediate 'and'

956

// (which is non-optimal because such an and might be folded with other

957

// things if we don't select it here).

return LHSTrivial;

}

break;

case ISD::OR: {

SmallVector<ValueBit, 64> LHSBits(Bits.size()), RHSBits(Bits.size());

963

getValueBits(V.getOperand(0), LHSBits);

964

getValueBits(V.getOperand(1), RHSBits);

965

966

bool AllDisjoint = true;

967

for (unsigned i = 0; i < Bits.size(); ++i)

968

if (LHSBits[i].isZero())

969

Bits[i] = RHSBits[i];

970

else if (RHSBits[i].isZero())

971

Bits[i] = LHSBits[i];

else {

AllDisjoint = false;

break;

}

if (!AllDisjoint)

break;

return true;

}

}

for (unsigned i = 0; i < Bits.size(); ++i)

985

Bits[i] = ValueBit(V, i);

return false;

}

// For each value (except the constant ones), compute the left-rotate amount

991

// to get it from its original to final position.

992

void computeRotationAmounts() {

993

HasZeros = false;

994

RLAmt.resize(Bits.size());

995

for (unsigned i = 0; i < Bits.size(); ++i)

996

if (Bits[i].hasValue()) {

997

unsigned VBI = Bits[i].getValueBitIndex();

if (i >= VBI)

RLAmt[i] = i - VBI;

else

RLAmt[i] = Bits.size() - (VBI - i);

1002

} else if (Bits[i].isZero()) {

1003

HasZeros = true;

1004

RLAmt[i] = UINT32_MAX;

1005

} else {

1006

llvm_unreachable("Unknown value bit type");

}

}

// Collect groups of consecutive bits with the same underlying value and

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1011

// rotation factor. If we're doing late masking, we ignore zeros, otherwise

1012

// they break up groups.

1013

void collectBitGroups(bool LateMask) {

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

1014

BitGroups.clear();

1015

1016

unsigned LastRLAmt = RLAmt[0];

1017

SDValue LastValue = Bits[0].hasValue() ? Bits[0].getValue() : SDValue();

1018

unsigned LastGroupStartIdx = 0;

1019

for (unsigned i = 1; i < Bits.size(); ++i) {

1020

unsigned ThisRLAmt = RLAmt[i];

1021

SDValue ThisValue = Bits[i].hasValue() ? Bits[i].getValue() : SDValue();

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1022

if (LateMask && !ThisValue) {

1023

ThisValue = LastValue;

1024

ThisRLAmt = LastRLAmt;

1025

// If we're doing late masking, then the first bit group always starts

1026

// at zero (even if the first bits were zero).

1027

if (BitGroups.empty())

1028

LastGroupStartIdx = 0;

1029

}

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

1030

1031

// If this bit has the same underlying value and the same rotate factor as

1032

// the last one, then they're part of the same group.

1033

if (ThisRLAmt == LastRLAmt && ThisValue == LastValue)

1034

continue;

1035

1036

if (LastValue.getNode())

1037

BitGroups.push_back(BitGroup(LastValue, LastRLAmt, LastGroupStartIdx,

1038

i-1));

1039

LastRLAmt = ThisRLAmt;

1040

LastValue = ThisValue;

1041

LastGroupStartIdx = i;

1042

}

1043

if (LastValue.getNode())

1044

BitGroups.push_back(BitGroup(LastValue, LastRLAmt, LastGroupStartIdx,

1045

Bits.size()-1));

1046

1047

if (BitGroups.empty())

1048

return;

1049

1050

// We might be able to combine the first and last groups.

1051

if (BitGroups.size() > 1) {

1052

// If the first and last groups are the same, then remove the first group

1053

// in favor of the last group, making the ending index of the last group

1054

// equal to the ending index of the to-be-removed first group.

1055

if (BitGroups[0].StartIdx == 0 &&

1056

BitGroups[BitGroups.size()-1].EndIdx == Bits.size()-1 &&

1057

BitGroups[0].V == BitGroups[BitGroups.size()-1].V &&

1058

BitGroups[0].RLAmt == BitGroups[BitGroups.size()-1].RLAmt) {

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1059

DEBUG(dbgs() << "\tcombining final bit group with inital one\n");

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

1060

BitGroups[BitGroups.size()-1].EndIdx = BitGroups[0].EndIdx;

1061

BitGroups.erase(BitGroups.begin());

}

}

}

// Take all (SDValue, RLAmt) pairs and sort them by the number of groups

1067

// associated with each. If there is a degeneracy, pick the one that occurs

1068

// first (in the final value).

1069

void collectValueRotInfo() {

1070

ValueRots.clear();

1071

1072

for (auto &BG : BitGroups) {

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1073

unsigned RLAmtKey = BG.RLAmt + (BG.Repl32 ? 64 : 0);

1074

ValueRotInfo &VRI = ValueRots[std::make_pair(BG.V, RLAmtKey)];

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

1075

VRI.V = BG.V;

1076

VRI.RLAmt = BG.RLAmt;

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1077

VRI.Repl32 = BG.Repl32;

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

1078

VRI.NumGroups += 1;

1079

VRI.FirstGroupStartIdx = std::min(VRI.FirstGroupStartIdx, BG.StartIdx);

1080

}

1081

1082

// Now that we've collected the various ValueRotInfo instances, we need to

1083

// sort them.

1084

ValueRotsVec.clear();

1085

for (auto &I : ValueRots) {

1086

ValueRotsVec.push_back(I.second);

1087

}

1088

std::sort(ValueRotsVec.begin(), ValueRotsVec.end());

1089

}

1090

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1091

// In 64-bit mode, rlwinm and friends have a rotation operator that

1092

// replicates the low-order 32 bits into the high-order 32-bits. The mask

1093

// indices of these instructions can only be in the lower 32 bits, so they

1094

// can only represent some 64-bit bit groups. However, when they can be used,

1095

// the 32-bit replication can be used to represent, as a single bit group,

1096

// otherwise separate bit groups. We'll convert to replicated-32-bit bit

1097

// groups when possible. Returns true if any of the bit groups were

1098

// converted.

1099

void assignRepl32BitGroups() {

1100

// If we have bits like this:

1101

//

1102

// Indices: 15 14 13 12 11 10 9 8 7 6 5 4 3 2 1 0

1103

// V bits: ... 7 6 5 4 3 2 1 0 31 30 29 28 27 26 25 24

1104

// Groups: | RLAmt = 8 | RLAmt = 40 |

1105

//

1106

// But, making use of a 32-bit operation that replicates the low-order 32

1107

// bits into the high-order 32 bits, this can be one bit group with a RLAmt

1108

// of 8.

1109

1110

auto IsAllLow32 = [this](BitGroup & BG) {

1111

if (BG.StartIdx <= BG.EndIdx) {

1112

for (unsigned i = BG.StartIdx; i <= BG.EndIdx; ++i) {

1113

if (!Bits[i].hasValue())

1114

continue;

1115

if (Bits[i].getValueBitIndex() >= 32)

return false;

}

} else {

for (unsigned i = BG.StartIdx; i < Bits.size(); ++i) {

1120

if (!Bits[i].hasValue())

1121

continue;

1122

if (Bits[i].getValueBitIndex() >= 32)

1123

return false;

1124

}

1125

for (unsigned i = 0; i <= BG.EndIdx; ++i) {

1126

if (!Bits[i].hasValue())

1127

continue;

1128

if (Bits[i].getValueBitIndex() >= 32)

return false;

}

}

return true;

};

for (auto &BG : BitGroups) {

1137

if (BG.StartIdx < 32 && BG.EndIdx < 32) {

1138

if (IsAllLow32(BG)) {

1139

if (BG.RLAmt >= 32) {

BG.RLAmt -= 32;

BG.Repl32CR = true;

}

BG.Repl32 = true;

DEBUG(dbgs() << "\t32-bit replicated bit group for " <<

1147

BG.V.getNode() << " RLAmt = " << BG.RLAmt <<

1148

" [" << BG.StartIdx << ", " << BG.EndIdx << "]\n");

}

}

}

// Now walk through the bit groups, consolidating where possible.

1154

for (auto I = BitGroups.begin(); I != BitGroups.end();) {

1155

// We might want to remove this bit group by merging it with the previous

1156

// group (which might be the ending group).

1157

auto IP = (I == BitGroups.begin()) ?

1158

std::prev(BitGroups.end()) : std::prev(I);

1159

if (I->Repl32 && IP->Repl32 && I->V == IP->V && I->RLAmt == IP->RLAmt &&

1160

I->StartIdx == (IP->EndIdx + 1) % 64 && I != IP) {

1161

1162

DEBUG(dbgs() << "\tcombining 32-bit replicated bit group for " <<

1163

I->V.getNode() << " RLAmt = " << I->RLAmt <<

1164

" [" << I->StartIdx << ", " << I->EndIdx <<

1165

"] with group with range [" <<

1166

IP->StartIdx << ", " << IP->EndIdx << "]\n");

1167

1168

IP->EndIdx = I->EndIdx;

1169

IP->Repl32CR = IP->Repl32CR || I->Repl32CR;

1170

IP->Repl32Coalesced = true;

1171

I = BitGroups.erase(I);

1172

continue;

1173

} else {

1174

// There is a special case worth handling: If there is a single group

1175

// covering the entire upper 32 bits, and it can be merged with both

1176

// the next and previous groups (which might be the same group), then

1177

// do so. If it is the same group (so there will be only one group in

1178

// total), then we need to reverse the order of the range so that it

1179

// covers the entire 64 bits.

1180

if (I->StartIdx == 32 && I->EndIdx == 63) {

1181

assert(std::next(I) == BitGroups.end() &&

1182

"bit group ends at index 63 but there is another?");

1183

auto IN = BitGroups.begin();

1184

1185

if (IP->Repl32 && IN->Repl32 && I->V == IP->V && I->V == IN->V &&

1186

(I->RLAmt % 32) == IP->RLAmt && (I->RLAmt % 32) == IN->RLAmt &&

1187

IP->EndIdx == 31 && IN->StartIdx == 0 && I != IP &&

1188

IsAllLow32(*I)) {

1189

1190

DEBUG(dbgs() << "\tcombining bit group for " <<

1191

I->V.getNode() << " RLAmt = " << I->RLAmt <<

1192

" [" << I->StartIdx << ", " << I->EndIdx <<

1193

"] with 32-bit replicated groups with ranges [" <<

1194

IP->StartIdx << ", " << IP->EndIdx << "] and [" <<

1195

IN->StartIdx << ", " << IN->EndIdx << "]\n");

1196

1197

if (IP == IN) {

1198

// There is only one other group; change it to cover the whole

1199

// range (backward, so that it can still be Repl32 but cover the

1200

// whole 64-bit range).

1201

IP->StartIdx = 31;

1202

IP->EndIdx = 30;

1203

IP->Repl32CR = IP->Repl32CR || I->RLAmt >= 32;

1204

IP->Repl32Coalesced = true;

1205

I = BitGroups.erase(I);

1206

} else {

1207

// There are two separate groups, one before this group and one

1208

// after us (at the beginning). We're going to remove this group,

1209

// but also the group at the very beginning.

1210

IP->EndIdx = IN->EndIdx;

1211

IP->Repl32CR = IP->Repl32CR || IN->Repl32CR || I->RLAmt >= 32;

1212

IP->Repl32Coalesced = true;

1213

I = BitGroups.erase(I);

1214

BitGroups.erase(BitGroups.begin());

1215

}

1216

1217

// This must be the last group in the vector (and we might have

1218

// just invalidated the iterator above), so break here.

break;

}

}

}

++I;

}

}

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

1228

SDValue getI32Imm(unsigned Imm) {

1229

return CurDAG->getTargetConstant(Imm, MVT::i32);

1230

}

1231

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1232

uint64_t getZerosMask() {

1233

uint64_t Mask = 0;

1234

for (unsigned i = 0; i < Bits.size(); ++i) {

1235

if (Bits[i].hasValue())

1236

continue;

Hal Finkel

2015-01-01 19:33:59 +0000

[diff] [blame]

1237

Mask |= (UINT64_C(1) << i);

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

}

return ~Mask;

}

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

1243

// Depending on the number of groups for a particular value, it might be

1244

// better to rotate, mask explicitly (using andi/andis), and then or the

1245

// result. Select this part of the result first.

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1246

void SelectAndParts32(SDLoc dl, SDValue &Res, unsigned *InstCnt) {

1247

if (BPermRewriterNoMasking)

1248

return;

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

1249

1250

for (ValueRotInfo &VRI : ValueRotsVec) {

1251

unsigned Mask = 0;

1252

for (unsigned i = 0; i < Bits.size(); ++i) {

1253

if (!Bits[i].hasValue() || Bits[i].getValue() != VRI.V)

1254

continue;

1255

if (RLAmt[i] != VRI.RLAmt)

continue;

Mask |= (1u << i);

}

// Compute the masks for andi/andis that would be necessary.

1261

unsigned ANDIMask = (Mask & UINT16_MAX), ANDISMask = Mask >> 16;

1262

assert((ANDIMask != 0 || ANDISMask != 0) &&

1263

"No set bits in mask for value bit groups");

1264

bool NeedsRotate = VRI.RLAmt != 0;

1265

1266

// We're trying to minimize the number of instructions. If we have one

1267

// group, using one of andi/andis can break even. If we have three

1268

// groups, we can use both andi and andis and break even (to use both

1269

// andi and andis we also need to or the results together). We need four

1270

// groups if we also need to rotate. To use andi/andis we need to do more

1271

// than break even because rotate-and-mask instructions tend to be easier

1272

// to schedule.

1273

1274

// FIXME: We've biased here against using andi/andis, which is right for

1275

// POWER cores, but not optimal everywhere. For example, on the A2,

1276

// andi/andis have single-cycle latency whereas the rotate-and-mask

1277

// instructions take two cycles, and it would be better to bias toward

1278

// andi/andis in break-even cases.

1279

1280

unsigned NumAndInsts = (unsigned) NeedsRotate +

1281

(unsigned) (ANDIMask != 0) +

1282

(unsigned) (ANDISMask != 0) +

1283

(unsigned) (ANDIMask != 0 && ANDISMask != 0) +

1284

(unsigned) (bool) Res;

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1285

1286

DEBUG(dbgs() << "\t\trotation groups for " << VRI.V.getNode() <<

1287

" RL: " << VRI.RLAmt << ":" <<

1288

"\n\t\t\tisel using masking: " << NumAndInsts <<

1289

" using rotates: " << VRI.NumGroups << "\n");

1290

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

1291

if (NumAndInsts >= VRI.NumGroups)

1292

continue;

1293

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1294

DEBUG(dbgs() << "\t\t\t\tusing masking\n");

1295

1296

if (InstCnt) *InstCnt += NumAndInsts;

1297

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

SDValue VRot;

if (VRI.RLAmt) {

SDValue Ops[] =

{ VRI.V, getI32Imm(VRI.RLAmt), getI32Imm(0), getI32Imm(31) };

1302

VRot = SDValue(CurDAG->getMachineNode(PPC::RLWINM, dl, MVT::i32,

Ops), 0);

} else {

VRot = VRI.V;

}

SDValue ANDIVal, ANDISVal;

1309

if (ANDIMask != 0)

1310

ANDIVal = SDValue(CurDAG->getMachineNode(PPC::ANDIo, dl, MVT::i32,

1311

VRot, getI32Imm(ANDIMask)), 0);

1312

if (ANDISMask != 0)

1313

ANDISVal = SDValue(CurDAG->getMachineNode(PPC::ANDISo, dl, MVT::i32,

1314

VRot, getI32Imm(ANDISMask)), 0);

SDValue TotalVal;

if (!ANDIVal)

TotalVal = ANDISVal;

else if (!ANDISVal)

TotalVal = ANDIVal;

else

TotalVal = SDValue(CurDAG->getMachineNode(PPC::OR, dl, MVT::i32,

1323

ANDIVal, ANDISVal), 0);

if (!Res)

Res = TotalVal;

else

Res = SDValue(CurDAG->getMachineNode(PPC::OR, dl, MVT::i32,

1329

Res, TotalVal), 0);

1330

1331

// Now, remove all groups with this underlying value and rotation

1332

// factor.

1333

for (auto I = BitGroups.begin(); I != BitGroups.end();) {

1334

if (I->V == VRI.V && I->RLAmt == VRI.RLAmt)

1335

I = BitGroups.erase(I);

else

++I;

}

}

}

// Instruction selection for the 32-bit case.

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1343

SDNode *Select32(SDNode *N, bool LateMask, unsigned *InstCnt) {

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

SDLoc dl(N);

SDValue Res;

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1347

if (InstCnt) *InstCnt = 0;

1348

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

1349

// Take care of cases that should use andi/andis first.

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1350

SelectAndParts32(dl, Res, InstCnt);

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

1351

1352

// If we've not yet selected a 'starting' instruction, and we have no zeros

1353

// to fill in, select the (Value, RLAmt) with the highest priority (largest

1354

// number of groups), and start with this rotated value.

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1355

if ((!HasZeros || LateMask) && !Res) {

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

1356

ValueRotInfo &VRI = ValueRotsVec[0];

1357

if (VRI.RLAmt) {

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1358

if (InstCnt) *InstCnt += 1;

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

1359

SDValue Ops[] =

1360

{ VRI.V, getI32Imm(VRI.RLAmt), getI32Imm(0), getI32Imm(31) };

1361

Res = SDValue(CurDAG->getMachineNode(PPC::RLWINM, dl, MVT::i32, Ops), 0);

} else {

Res = VRI.V;

}

// Now, remove all groups with this underlying value and rotation factor.

1367

for (auto I = BitGroups.begin(); I != BitGroups.end();) {

1368

if (I->V == VRI.V && I->RLAmt == VRI.RLAmt)

1369

I = BitGroups.erase(I);

else

++I;

}

}

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1375

if (InstCnt) *InstCnt += BitGroups.size();

1376

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

1377

// Insert the other groups (one at a time).

1378

for (auto &BG : BitGroups) {

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1379

if (!Res) {

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

1380

SDValue Ops[] =

1381

{ BG.V, getI32Imm(BG.RLAmt), getI32Imm(Bits.size() - BG.EndIdx - 1),

1382

getI32Imm(Bits.size() - BG.StartIdx - 1) };

1383

Res = SDValue(CurDAG->getMachineNode(PPC::RLWINM, dl, MVT::i32, Ops), 0);

1384

} else {

1385

SDValue Ops[] =

1386

{ Res, BG.V, getI32Imm(BG.RLAmt), getI32Imm(Bits.size() - BG.EndIdx - 1),

1387

getI32Imm(Bits.size() - BG.StartIdx - 1) };

1388

Res = SDValue(CurDAG->getMachineNode(PPC::RLWIMI, dl, MVT::i32, Ops), 0);

}

}

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1392

if (LateMask) {

1393

unsigned Mask = (unsigned) getZerosMask();

1394

1395

unsigned ANDIMask = (Mask & UINT16_MAX), ANDISMask = Mask >> 16;

1396

assert((ANDIMask != 0 || ANDISMask != 0) &&

1397

"No set bits in zeros mask?");

1398

1399

if (InstCnt) *InstCnt += (unsigned) (ANDIMask != 0) +

1400

(unsigned) (ANDISMask != 0) +

1401

(unsigned) (ANDIMask != 0 && ANDISMask != 0);

1402

1403

SDValue ANDIVal, ANDISVal;

1404

if (ANDIMask != 0)

1405

ANDIVal = SDValue(CurDAG->getMachineNode(PPC::ANDIo, dl, MVT::i32,

1406

Res, getI32Imm(ANDIMask)), 0);

1407

if (ANDISMask != 0)

1408

ANDISVal = SDValue(CurDAG->getMachineNode(PPC::ANDISo, dl, MVT::i32,

1409

Res, getI32Imm(ANDISMask)), 0);

if (!ANDIVal)

Res = ANDISVal;

else if (!ANDISVal)

Res = ANDIVal;

else

Res = SDValue(CurDAG->getMachineNode(PPC::OR, dl, MVT::i32,

1417

ANDIVal, ANDISVal), 0);

1418

}

1419

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

1420

return Res.getNode();

1421

}

1422

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1423

unsigned SelectRotMask64Count(unsigned RLAmt, bool Repl32,

1424

unsigned MaskStart, unsigned MaskEnd,

1425

bool IsIns) {

1426

// In the notation used by the instructions, 'start' and 'end' are reversed

1427

// because bits are counted from high to low order.

1428

unsigned InstMaskStart = 64 - MaskEnd - 1,

1429

InstMaskEnd = 64 - MaskStart - 1;

if (Repl32)

return 1;

if ((!IsIns && (InstMaskEnd == 63 || InstMaskStart == 0)) ||

1435

InstMaskEnd == 63 - RLAmt)

return 1;

return 2;

}

// For 64-bit values, not all combinations of rotates and masks are

1442

// available. Produce one if it is available.

1443

SDValue SelectRotMask64(SDValue V, SDLoc dl, unsigned RLAmt, bool Repl32,

1444

unsigned MaskStart, unsigned MaskEnd,

1445

unsigned *InstCnt = nullptr) {

1446

// In the notation used by the instructions, 'start' and 'end' are reversed

1447

// because bits are counted from high to low order.

1448

unsigned InstMaskStart = 64 - MaskEnd - 1,

1449

InstMaskEnd = 64 - MaskStart - 1;

1450

1451

if (InstCnt) *InstCnt += 1;

1452

1453

if (Repl32) {

1454

// This rotation amount assumes that the lower 32 bits of the quantity

1455

// are replicated in the high 32 bits by the rotation operator (which is

1456

// done by rlwinm and friends).

1457

assert(InstMaskStart >= 32 && "Mask cannot start out of range");

1458

assert(InstMaskEnd >= 32 && "Mask cannot end out of range");

1459

SDValue Ops[] =

1460

{ V, getI32Imm(RLAmt), getI32Imm(InstMaskStart - 32),

1461

getI32Imm(InstMaskEnd - 32) };

1462

return SDValue(CurDAG->getMachineNode(PPC::RLWINM8, dl, MVT::i64,

Ops), 0);

}

if (InstMaskEnd == 63) {

1467

SDValue Ops[] =

1468

{ V, getI32Imm(RLAmt), getI32Imm(InstMaskStart) };

1469

return SDValue(CurDAG->getMachineNode(PPC::RLDICL, dl, MVT::i64, Ops), 0);

1470

}

1471

1472

if (InstMaskStart == 0) {

1473

SDValue Ops[] =

1474

{ V, getI32Imm(RLAmt), getI32Imm(InstMaskEnd) };

1475

return SDValue(CurDAG->getMachineNode(PPC::RLDICR, dl, MVT::i64, Ops), 0);

1476

}

1477

1478

if (InstMaskEnd == 63 - RLAmt) {

1479

SDValue Ops[] =

1480

{ V, getI32Imm(RLAmt), getI32Imm(InstMaskStart) };

1481

return SDValue(CurDAG->getMachineNode(PPC::RLDIC, dl, MVT::i64, Ops), 0);

1482

}

1483

1484

// We cannot do this with a single instruction, so we'll use two. The

1485

// problem is that we're not free to choose both a rotation amount and mask

1486

// start and end independently. We can choose an arbitrary mask start and

1487

// end, but then the rotation amount is fixed. Rotation, however, can be

1488

// inverted, and so by applying an "inverse" rotation first, we can get the

1489

// desired result.

1490

if (InstCnt) *InstCnt += 1;

1491

1492

// The rotation mask for the second instruction must be MaskStart.

1493

unsigned RLAmt2 = MaskStart;

1494

// The first instruction must rotate V so that the overall rotation amount

1495

// is RLAmt.

1496

unsigned RLAmt1 = (64 + RLAmt - RLAmt2) % 64;

1497

if (RLAmt1)

1498

V = SelectRotMask64(V, dl, RLAmt1, false, 0, 63);

1499

return SelectRotMask64(V, dl, RLAmt2, false, MaskStart, MaskEnd);

1500

}

1501

1502

// For 64-bit values, not all combinations of rotates and masks are

1503

// available. Produce a rotate-mask-and-insert if one is available.

1504

SDValue SelectRotMaskIns64(SDValue Base, SDValue V, SDLoc dl, unsigned RLAmt,

1505

bool Repl32, unsigned MaskStart,

1506

unsigned MaskEnd, unsigned *InstCnt = nullptr) {

1507

// In the notation used by the instructions, 'start' and 'end' are reversed

1508

// because bits are counted from high to low order.

1509

unsigned InstMaskStart = 64 - MaskEnd - 1,

1510

InstMaskEnd = 64 - MaskStart - 1;

1511

1512

if (InstCnt) *InstCnt += 1;

1513

1514

if (Repl32) {

1515

// This rotation amount assumes that the lower 32 bits of the quantity

1516

// are replicated in the high 32 bits by the rotation operator (which is

1517

// done by rlwinm and friends).

1518

assert(InstMaskStart >= 32 && "Mask cannot start out of range");

1519

assert(InstMaskEnd >= 32 && "Mask cannot end out of range");

1520

SDValue Ops[] =

1521

{ Base, V, getI32Imm(RLAmt), getI32Imm(InstMaskStart - 32),

1522

getI32Imm(InstMaskEnd - 32) };

1523

return SDValue(CurDAG->getMachineNode(PPC::RLWIMI8, dl, MVT::i64,

Ops), 0);

}

if (InstMaskEnd == 63 - RLAmt) {

1528

SDValue Ops[] =

1529

{ Base, V, getI32Imm(RLAmt), getI32Imm(InstMaskStart) };

1530

return SDValue(CurDAG->getMachineNode(PPC::RLDIMI, dl, MVT::i64, Ops), 0);

1531

}

1532

1533

// We cannot do this with a single instruction, so we'll use two. The

1534

// problem is that we're not free to choose both a rotation amount and mask

1535

// start and end independently. We can choose an arbitrary mask start and

1536

// end, but then the rotation amount is fixed. Rotation, however, can be

1537

// inverted, and so by applying an "inverse" rotation first, we can get the

1538

// desired result.

1539

if (InstCnt) *InstCnt += 1;

1540

1541

// The rotation mask for the second instruction must be MaskStart.

1542

unsigned RLAmt2 = MaskStart;

1543

// The first instruction must rotate V so that the overall rotation amount

1544

// is RLAmt.

1545

unsigned RLAmt1 = (64 + RLAmt - RLAmt2) % 64;

1546

if (RLAmt1)

1547

V = SelectRotMask64(V, dl, RLAmt1, false, 0, 63);

1548

return SelectRotMaskIns64(Base, V, dl, RLAmt2, false, MaskStart, MaskEnd);

1549

}

1550

1551

void SelectAndParts64(SDLoc dl, SDValue &Res, unsigned *InstCnt) {

1552

if (BPermRewriterNoMasking)

1553

return;

1554

1555

// The idea here is the same as in the 32-bit version, but with additional

1556

// complications from the fact that Repl32 might be true. Because we

1557

// aggressively convert bit groups to Repl32 form (which, for small

1558

// rotation factors, involves no other change), and then coalesce, it might

1559

// be the case that a single 64-bit masking operation could handle both

1560

// some Repl32 groups and some non-Repl32 groups. If converting to Repl32

1561

// form allowed coalescing, then we must use a 32-bit rotaton in order to

1562

// completely capture the new combined bit group.

1563

1564

for (ValueRotInfo &VRI : ValueRotsVec) {

1565

uint64_t Mask = 0;

1566

1567

// We need to add to the mask all bits from the associated bit groups.

1568

// If Repl32 is false, we need to add bits from bit groups that have

1569

// Repl32 true, but are trivially convertable to Repl32 false. Such a

1570

// group is trivially convertable if it overlaps only with the lower 32

1571

// bits, and the group has not been coalesced.

1572

auto MatchingBG = [VRI](BitGroup &BG) {

if (VRI.V != BG.V)

return false;

unsigned EffRLAmt = BG.RLAmt;

1577

if (!VRI.Repl32 && BG.Repl32) {

1578

if (BG.StartIdx < 32 && BG.EndIdx < 32 && BG.StartIdx <= BG.EndIdx &&

1579

!BG.Repl32Coalesced) {

if (BG.Repl32CR)

EffRLAmt += 32;

} else {

return false;

}

} else if (VRI.Repl32 != BG.Repl32) {

return false;

}

if (VRI.RLAmt != EffRLAmt)

return false;

return true;

};

for (auto &BG : BitGroups) {

if (!MatchingBG(BG))

continue;

if (BG.StartIdx <= BG.EndIdx) {

1600

for (unsigned i = BG.StartIdx; i <= BG.EndIdx; ++i)

Hal Finkel

2015-01-01 19:33:59 +0000

[diff] [blame]

1601

Mask |= (UINT64_C(1) << i);

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1602

} else {

1603

for (unsigned i = BG.StartIdx; i < Bits.size(); ++i)

Hal Finkel

2015-01-01 19:33:59 +0000

[diff] [blame]

1604

Mask |= (UINT64_C(1) << i);

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1605

for (unsigned i = 0; i <= BG.EndIdx; ++i)

Hal Finkel

2015-01-01 19:33:59 +0000

[diff] [blame]

1606

Mask |= (UINT64_C(1) << i);

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

}

}

// We can use the 32-bit andi/andis technique if the mask does not

1611

// require any higher-order bits. This can save an instruction compared

1612

// to always using the general 64-bit technique.

1613

bool Use32BitInsts = isUInt<32>(Mask);

1614

// Compute the masks for andi/andis that would be necessary.

1615

unsigned ANDIMask = (Mask & UINT16_MAX),

1616

ANDISMask = (Mask >> 16) & UINT16_MAX;

1617

1618

bool NeedsRotate = VRI.RLAmt || (VRI.Repl32 && !isUInt<32>(Mask));

1619

1620

unsigned NumAndInsts = (unsigned) NeedsRotate +

1621

(unsigned) (bool) Res;

1622

if (Use32BitInsts)

1623

NumAndInsts += (unsigned) (ANDIMask != 0) + (unsigned) (ANDISMask != 0) +

1624

(unsigned) (ANDIMask != 0 && ANDISMask != 0);

1625

else

1626

NumAndInsts += SelectInt64Count(Mask) + /* and */ 1;

1627

1628

unsigned NumRLInsts = 0;

1629

bool FirstBG = true;

1630

for (auto &BG : BitGroups) {

if (!MatchingBG(BG))

continue;

NumRLInsts +=

SelectRotMask64Count(BG.RLAmt, BG.Repl32, BG.StartIdx, BG.EndIdx,

!FirstBG);

FirstBG = false;

}

DEBUG(dbgs() << "\t\trotation groups for " << VRI.V.getNode() <<

1640

" RL: " << VRI.RLAmt << (VRI.Repl32 ? " (32):" : ":") <<

1641

"\n\t\t\tisel using masking: " << NumAndInsts <<

1642

" using rotates: " << NumRLInsts << "\n");

1643

1644

// When we'd use andi/andis, we bias toward using the rotates (andi only

1645

// has a record form, and is cracked on POWER cores). However, when using

1646

// general 64-bit constant formation, bias toward the constant form,

1647

// because that exposes more opportunities for CSE.

1648

if (NumAndInsts > NumRLInsts)

1649

continue;

1650

if (Use32BitInsts && NumAndInsts == NumRLInsts)

1651

continue;

1652

1653

DEBUG(dbgs() << "\t\t\t\tusing masking\n");

1654

1655

if (InstCnt) *InstCnt += NumAndInsts;

1656

1657

SDValue VRot;

1658

// We actually need to generate a rotation if we have a non-zero rotation

1659

// factor or, in the Repl32 case, if we care about any of the

1660

// higher-order replicated bits. In the latter case, we generate a mask

1661

// backward so that it actually includes the entire 64 bits.

1662

if (VRI.RLAmt || (VRI.Repl32 && !isUInt<32>(Mask)))

1663

VRot = SelectRotMask64(VRI.V, dl, VRI.RLAmt, VRI.Repl32,

1664

VRI.Repl32 ? 31 : 0, VRI.Repl32 ? 30 : 63);

else

VRot = VRI.V;

SDValue TotalVal;

if (Use32BitInsts) {

assert((ANDIMask != 0 || ANDISMask != 0) &&

1671

"No set bits in mask when using 32-bit ands for 64-bit value");

1672

1673

SDValue ANDIVal, ANDISVal;

1674

if (ANDIMask != 0)

1675

ANDIVal = SDValue(CurDAG->getMachineNode(PPC::ANDIo8, dl, MVT::i64,

1676

VRot, getI32Imm(ANDIMask)), 0);

1677

if (ANDISMask != 0)

1678

ANDISVal = SDValue(CurDAG->getMachineNode(PPC::ANDISo8, dl, MVT::i64,

1679

VRot, getI32Imm(ANDISMask)), 0);

if (!ANDIVal)

TotalVal = ANDISVal;

else if (!ANDISVal)

TotalVal = ANDIVal;

else

TotalVal = SDValue(CurDAG->getMachineNode(PPC::OR8, dl, MVT::i64,

1687

ANDIVal, ANDISVal), 0);

1688

} else {

1689

TotalVal = SDValue(SelectInt64(CurDAG, dl, Mask), 0);

1690

TotalVal =

1691

SDValue(CurDAG->getMachineNode(PPC::AND8, dl, MVT::i64,

VRot, TotalVal), 0);

}

if (!Res)

Res = TotalVal;

else

Res = SDValue(CurDAG->getMachineNode(PPC::OR8, dl, MVT::i64,

1699

Res, TotalVal), 0);

1700

1701

// Now, remove all groups with this underlying value and rotation

1702

// factor.

1703

for (auto I = BitGroups.begin(); I != BitGroups.end();) {

1704

if (MatchingBG(*I))

1705

I = BitGroups.erase(I);

else

++I;

}

}

}

// Instruction selection for the 64-bit case.

1713

SDNode *Select64(SDNode *N, bool LateMask, unsigned *InstCnt) {

SDLoc dl(N);

SDValue Res;

if (InstCnt) *InstCnt = 0;

1718

1719

// Take care of cases that should use andi/andis first.

1720

SelectAndParts64(dl, Res, InstCnt);

1721

1722

// If we've not yet selected a 'starting' instruction, and we have no zeros

1723

// to fill in, select the (Value, RLAmt) with the highest priority (largest

1724

// number of groups), and start with this rotated value.

1725

if ((!HasZeros || LateMask) && !Res) {

1726

// If we have both Repl32 groups and non-Repl32 groups, the non-Repl32

1727

// groups will come first, and so the VRI representing the largest number

1728

// of groups might not be first (it might be the first Repl32 groups).

1729

unsigned MaxGroupsIdx = 0;

1730

if (!ValueRotsVec[0].Repl32) {

1731

for (unsigned i = 0, ie = ValueRotsVec.size(); i < ie; ++i)

1732

if (ValueRotsVec[i].Repl32) {

1733

if (ValueRotsVec[i].NumGroups > ValueRotsVec[0].NumGroups)

MaxGroupsIdx = i;

break;

}

}

ValueRotInfo &VRI = ValueRotsVec[MaxGroupsIdx];

1740

bool NeedsRotate = false;

1741

if (VRI.RLAmt) {

1742

NeedsRotate = true;

1743

} else if (VRI.Repl32) {

1744

for (auto &BG : BitGroups) {

1745

if (BG.V != VRI.V || BG.RLAmt != VRI.RLAmt ||

1746

BG.Repl32 != VRI.Repl32)

1747

continue;

1748

1749

// We don't need a rotate if the bit group is confined to the lower

1750

// 32 bits.

1751

if (BG.StartIdx < 32 && BG.EndIdx < 32 && BG.StartIdx < BG.EndIdx)

continue;

NeedsRotate = true;

break;

}

}

if (NeedsRotate)

Res = SelectRotMask64(VRI.V, dl, VRI.RLAmt, VRI.Repl32,

1761

VRI.Repl32 ? 31 : 0, VRI.Repl32 ? 30 : 63,

InstCnt);

else

Res = VRI.V;

// Now, remove all groups with this underlying value and rotation factor.

1767

if (Res)

1768

for (auto I = BitGroups.begin(); I != BitGroups.end();) {

1769

if (I->V == VRI.V && I->RLAmt == VRI.RLAmt && I->Repl32 == VRI.Repl32)

1770

I = BitGroups.erase(I);

else

++I;

}

}

// Because 64-bit rotates are more flexible than inserts, we might have a

1777

// preference regarding which one we do first (to save one instruction).

1778

if (!Res)

1779

for (auto I = BitGroups.begin(), IE = BitGroups.end(); I != IE; ++I) {

1780

if (SelectRotMask64Count(I->RLAmt, I->Repl32, I->StartIdx, I->EndIdx,

1781

false) <

1782

SelectRotMask64Count(I->RLAmt, I->Repl32, I->StartIdx, I->EndIdx,

1783

true)) {

1784

if (I != BitGroups.begin()) {

1785

BitGroup BG = *I;

1786

BitGroups.erase(I);

1787

BitGroups.insert(BitGroups.begin(), BG);

}

break;

}

}

// Insert the other groups (one at a time).

1795

for (auto &BG : BitGroups) {

1796

if (!Res)

1797

Res = SelectRotMask64(BG.V, dl, BG.RLAmt, BG.Repl32, BG.StartIdx,

1798

BG.EndIdx, InstCnt);

1799

else

1800

Res = SelectRotMaskIns64(Res, BG.V, dl, BG.RLAmt, BG.Repl32,

1801

BG.StartIdx, BG.EndIdx, InstCnt);

}

if (LateMask) {

uint64_t Mask = getZerosMask();

1806

1807

// We can use the 32-bit andi/andis technique if the mask does not

1808

// require any higher-order bits. This can save an instruction compared

1809

// to always using the general 64-bit technique.

1810

bool Use32BitInsts = isUInt<32>(Mask);

1811

// Compute the masks for andi/andis that would be necessary.

1812

unsigned ANDIMask = (Mask & UINT16_MAX),

1813

ANDISMask = (Mask >> 16) & UINT16_MAX;

1814

1815

if (Use32BitInsts) {

1816

assert((ANDIMask != 0 || ANDISMask != 0) &&

1817

"No set bits in mask when using 32-bit ands for 64-bit value");

1818

1819

if (InstCnt) *InstCnt += (unsigned) (ANDIMask != 0) +

1820

(unsigned) (ANDISMask != 0) +

1821

(unsigned) (ANDIMask != 0 && ANDISMask != 0);

1822

1823

SDValue ANDIVal, ANDISVal;

1824

if (ANDIMask != 0)

1825

ANDIVal = SDValue(CurDAG->getMachineNode(PPC::ANDIo8, dl, MVT::i64,

1826

Res, getI32Imm(ANDIMask)), 0);

1827

if (ANDISMask != 0)

1828

ANDISVal = SDValue(CurDAG->getMachineNode(PPC::ANDISo8, dl, MVT::i64,

1829

Res, getI32Imm(ANDISMask)), 0);

if (!ANDIVal)

Res = ANDISVal;

else if (!ANDISVal)

Res = ANDIVal;

else

Res = SDValue(CurDAG->getMachineNode(PPC::OR8, dl, MVT::i64,

1837

ANDIVal, ANDISVal), 0);

1838

} else {

1839

if (InstCnt) *InstCnt += SelectInt64Count(Mask) + /* and */ 1;

1840

1841

SDValue MaskVal = SDValue(SelectInt64(CurDAG, dl, Mask), 0);

1842

Res =

1843

SDValue(CurDAG->getMachineNode(PPC::AND8, dl, MVT::i64,

Res, MaskVal), 0);

}

}

return Res.getNode();

1849

}

1850

1851

SDNode *Select(SDNode *N, bool LateMask, unsigned *InstCnt = nullptr) {

1852

// Fill in BitGroups.

1853

collectBitGroups(LateMask);

1854

if (BitGroups.empty())

1855

return nullptr;

1856

1857

// For 64-bit values, figure out when we can use 32-bit instructions.

1858

if (Bits.size() == 64)

1859

assignRepl32BitGroups();

1860

1861

// Fill in ValueRotsVec.

1862

collectValueRotInfo();

1863

1864

if (Bits.size() == 32) {

1865

return Select32(N, LateMask, InstCnt);

1866

} else {

1867

assert(Bits.size() == 64 && "Not 64 bits here?");

1868

return Select64(N, LateMask, InstCnt);

}

return nullptr;

}

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

1874

SmallVector<ValueBit, 64> Bits;

1875

1876

bool HasZeros;

1877

SmallVector<unsigned, 64> RLAmt;

1878

1879

SmallVector<BitGroup, 16> BitGroups;

1880

1881

DenseMap<std::pair<SDValue, unsigned>, ValueRotInfo> ValueRots;

1882

SmallVector<ValueRotInfo, 16> ValueRotsVec;

1883

1884

SelectionDAG *CurDAG;

1885

1886

public:

1887

BitPermutationSelector(SelectionDAG *DAG)

1888

: CurDAG(DAG) {}

1889

1890

// Here we try to match complex bit permutations into a set of

1891

// rotate-and-shift/shift/and/or instructions, using a set of heuristics

1892

// known to produce optimial code for common cases (like i32 byte swapping).

1893

SDNode *Select(SDNode *N) {

1894

Bits.resize(N->getValueType(0).getSizeInBits());

1895

if (!getValueBits(SDValue(N, 0), Bits))

1896

return nullptr;

1897

1898

DEBUG(dbgs() << "Considering bit-permutation-based instruction"

1899

" selection for: ");

1900

DEBUG(N->dump(CurDAG));

1901

1902

// Fill it RLAmt and set HasZeros.

1903

computeRotationAmounts();

1904

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1905

if (!HasZeros)

1906

return Select(N, false);

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

1907

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1908

// We currently have two techniques for handling results with zeros: early

1909

// masking (the default) and late masking. Late masking is sometimes more

1910

// efficient, but because the structure of the bit groups is different, it

1911

// is hard to tell without generating both and comparing the results. With

1912

// late masking, we ignore zeros in the resulting value when inserting each

1913

// set of bit groups, and then mask in the zeros at the end. With early

1914

// masking, we only insert the non-zero parts of the result at every step.

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

1915

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1916

unsigned InstCnt, InstCntLateMask;

1917

DEBUG(dbgs() << "\tEarly masking:\n");

1918

SDNode *RN = Select(N, false, &InstCnt);

1919

DEBUG(dbgs() << "\t\tisel would use " << InstCnt << " instructions\n");

1920

1921

DEBUG(dbgs() << "\tLate masking:\n");

1922

SDNode *RNLM = Select(N, true, &InstCntLateMask);

1923

DEBUG(dbgs() << "\t\tisel would use " << InstCntLateMask <<

1924

" instructions\n");

1925

1926

if (InstCnt <= InstCntLateMask) {

1927

DEBUG(dbgs() << "\tUsing early-masking for isel\n");

1928

return RN;

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

1929

}

1930

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1931

DEBUG(dbgs() << "\tUsing late-masking for isel\n");

1932

return RNLM;

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

1933

}

1934

};

1935

} // anonymous namespace

1936

1937

SDNode *PPCDAGToDAGISel::SelectBitPermutation(SDNode *N) {

1938

if (N->getValueType(0) != MVT::i32 &&

1939

N->getValueType(0) != MVT::i64)

1940

return nullptr;

1941

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

1942

if (!UseBitPermRewriter)

1943

return nullptr;

1944

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

1945

switch (N->getOpcode()) {

default: break;

case ISD::ROTL:

case ISD::SHL:

case ISD::SRL:

case ISD::AND:

case ISD::OR: {

BitPermutationSelector BPS(CurDAG);

1953

return BPS.Select(N);

}

}

return nullptr;

}

Chris Lattner

2005-08-21 18:50:37 +0000

[diff] [blame]

1960

/// SelectCC - Select a comparison of the specified values with the specified

1961

/// condition code, returning the CR# of the expression.

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

1962

SDValue PPCDAGToDAGISel::SelectCC(SDValue LHS, SDValue RHS,

Andrew Trick

2013-05-25 02:42:55 +0000

[diff] [blame]

1963

ISD::CondCode CC, SDLoc dl) {

Chris Lattner

2005-08-21 18:50:37 +0000

[diff] [blame]

1964

// Always select the LHS.

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

1965

unsigned Opc;

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

1966

Owen Anderson

2009-08-11 20:47:22 +0000

[diff] [blame]

1967

if (LHS.getValueType() == MVT::i32) {

Chris Lattner

9a40cca

2006-06-27 00:10:13 +0000

[diff] [blame]

1968

unsigned Imm;

Chris Lattner

2006-09-20 04:25:47 +0000

[diff] [blame]

1969

if (CC == ISD::SETEQ || CC == ISD::SETNE) {

1970

if (isInt32Immediate(RHS, Imm)) {

1971

// SETEQ/SETNE comparison with 16-bit immediate, fold it.

Benjamin Kramer

2010-03-29 21:13:41 +0000

[diff] [blame]

1972

if (isUInt<16>(Imm))

Dan Gohman

2009-09-25 18:54:59 +0000

[diff] [blame]

1973

return SDValue(CurDAG->getMachineNode(PPC::CMPLWI, dl, MVT::i32, LHS,

1974

getI32Imm(Imm & 0xFFFF)), 0);

Chris Lattner

2006-09-20 04:25:47 +0000

[diff] [blame]

1975

// If this is a 16-bit signed immediate, fold it.

Benjamin Kramer

2010-03-29 21:13:41 +0000

[diff] [blame]

1976

if (isInt<16>((int)Imm))

Dan Gohman

2009-09-25 18:54:59 +0000

[diff] [blame]

1977

return SDValue(CurDAG->getMachineNode(PPC::CMPWI, dl, MVT::i32, LHS,

1978

getI32Imm(Imm & 0xFFFF)), 0);

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

1979

Chris Lattner

2006-09-20 04:25:47 +0000

[diff] [blame]

1980

// For non-equality comparisons, the default code would materialize the

1981

// constant, then compare against it, like this:

1982

// lis r2, 4660

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

1983

// ori r2, r2, 22136

Chris Lattner

2006-09-20 04:25:47 +0000

[diff] [blame]

1984

// cmpw cr0, r3, r2

1985

// Since we are just comparing for equality, we can emit this instead:

1986

// xoris r0,r3,0x1234

1987

// cmplwi cr0,r0,0x5678

1988

// beq cr0,L6

Dan Gohman

2009-09-25 18:54:59 +0000

[diff] [blame]

1989

SDValue Xor(CurDAG->getMachineNode(PPC::XORIS, dl, MVT::i32, LHS,

1990

getI32Imm(Imm >> 16)), 0);

1991

return SDValue(CurDAG->getMachineNode(PPC::CMPLWI, dl, MVT::i32, Xor,

1992

getI32Imm(Imm & 0xFFFF)), 0);

Chris Lattner

2006-09-20 04:25:47 +0000

[diff] [blame]

1993

}

1994

Opc = PPC::CMPLW;

1995

} else if (ISD::isUnsignedIntSetCC(CC)) {

Benjamin Kramer

2010-03-29 21:13:41 +0000

[diff] [blame]

1996

if (isInt32Immediate(RHS, Imm) && isUInt<16>(Imm))

Dan Gohman

2009-09-25 18:54:59 +0000

[diff] [blame]

1997

return SDValue(CurDAG->getMachineNode(PPC::CMPLWI, dl, MVT::i32, LHS,

1998

getI32Imm(Imm & 0xFFFF)), 0);

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

Opc = PPC::CMPLW;

} else {

short SImm;

if (isIntS16Immediate(RHS, SImm))

Dan Gohman

2009-09-25 18:54:59 +0000

[diff] [blame]

2003

return SDValue(CurDAG->getMachineNode(PPC::CMPWI, dl, MVT::i32, LHS,

2004

getI32Imm((int)SImm & 0xFFFF)),

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

2005

0);

2006

Opc = PPC::CMPW;

2007

}

Owen Anderson

2009-08-11 20:47:22 +0000

[diff] [blame]

2008

} else if (LHS.getValueType() == MVT::i64) {

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

2009

uint64_t Imm;

Chris Lattner

2006-09-20 04:33:27 +0000

[diff] [blame]

2010

if (CC == ISD::SETEQ || CC == ISD::SETNE) {

Gabor Greif

2008-08-28 21:40:38 +0000

[diff] [blame]

2011

if (isInt64Immediate(RHS.getNode(), Imm)) {

Chris Lattner

2006-09-20 04:33:27 +0000

[diff] [blame]

2012

// SETEQ/SETNE comparison with 16-bit immediate, fold it.

Benjamin Kramer

2010-03-29 21:13:41 +0000

[diff] [blame]

2013

if (isUInt<16>(Imm))

Dan Gohman

2009-09-25 18:54:59 +0000

[diff] [blame]

2014

return SDValue(CurDAG->getMachineNode(PPC::CMPLDI, dl, MVT::i64, LHS,

2015

getI32Imm(Imm & 0xFFFF)), 0);

Chris Lattner

2006-09-20 04:33:27 +0000

[diff] [blame]

2016

// If this is a 16-bit signed immediate, fold it.

Benjamin Kramer

2010-03-29 21:13:41 +0000

[diff] [blame]

2017

if (isInt<16>(Imm))

Dan Gohman

2009-09-25 18:54:59 +0000

[diff] [blame]

2018

return SDValue(CurDAG->getMachineNode(PPC::CMPDI, dl, MVT::i64, LHS,

2019

getI32Imm(Imm & 0xFFFF)), 0);

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2020

Chris Lattner

2006-09-20 04:33:27 +0000

[diff] [blame]

2021

// For non-equality comparisons, the default code would materialize the

2022

// constant, then compare against it, like this:

2023

// lis r2, 4660

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2024

// ori r2, r2, 22136

Chris Lattner

2006-09-20 04:33:27 +0000

[diff] [blame]

2025

// cmpd cr0, r3, r2

2026

// Since we are just comparing for equality, we can emit this instead:

2027

// xoris r0,r3,0x1234

2028

// cmpldi cr0,r0,0x5678

2029

// beq cr0,L6

Benjamin Kramer

2010-03-29 21:13:41 +0000

[diff] [blame]

2030

if (isUInt<32>(Imm)) {

Dan Gohman

2009-09-25 18:54:59 +0000

[diff] [blame]

2031

SDValue Xor(CurDAG->getMachineNode(PPC::XORIS8, dl, MVT::i64, LHS,

2032

getI64Imm(Imm >> 16)), 0);

2033

return SDValue(CurDAG->getMachineNode(PPC::CMPLDI, dl, MVT::i64, Xor,

2034

getI64Imm(Imm & 0xFFFF)), 0);

Chris Lattner

2006-09-20 04:33:27 +0000

[diff] [blame]

}

}

Opc = PPC::CMPLD;

} else if (ISD::isUnsignedIntSetCC(CC)) {

Benjamin Kramer

2010-03-29 21:13:41 +0000

[diff] [blame]

2039

if (isInt64Immediate(RHS.getNode(), Imm) && isUInt<16>(Imm))

Dan Gohman

2009-09-25 18:54:59 +0000

[diff] [blame]

2040

return SDValue(CurDAG->getMachineNode(PPC::CMPLDI, dl, MVT::i64, LHS,

2041

getI64Imm(Imm & 0xFFFF)), 0);

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

Opc = PPC::CMPLD;

} else {

short SImm;

if (isIntS16Immediate(RHS, SImm))

Dan Gohman

2009-09-25 18:54:59 +0000

[diff] [blame]

2046

return SDValue(CurDAG->getMachineNode(PPC::CMPDI, dl, MVT::i64, LHS,

2047

getI64Imm(SImm & 0xFFFF)),

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

2048

0);

2049

Opc = PPC::CMPD;

2050

}

Owen Anderson

2009-08-11 20:47:22 +0000

[diff] [blame]

2051

} else if (LHS.getValueType() == MVT::f32) {

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

2052

Opc = PPC::FCMPUS;

Chris Lattner

2005-08-21 18:50:37 +0000

[diff] [blame]

2053

} else {

Owen Anderson

2009-08-11 20:47:22 +0000

[diff] [blame]

2054

assert(LHS.getValueType() == MVT::f64 && "Unknown vt!");

Eric Christopher

2014-05-22 01:07:24 +0000

[diff] [blame]

2055

Opc = PPCSubTarget->hasVSX() ? PPC::XSCMPUDP : PPC::FCMPUD;

Chris Lattner

2005-08-21 18:50:37 +0000

[diff] [blame]

2056

}

Dan Gohman

2009-09-25 18:54:59 +0000

[diff] [blame]

2057

return SDValue(CurDAG->getMachineNode(Opc, dl, MVT::i32, LHS, RHS), 0);

Chris Lattner

2005-08-21 18:50:37 +0000

[diff] [blame]

2058

}

2059

Chris Lattner

2006-11-17 22:10:59 +0000

[diff] [blame]

2060

static PPC::Predicate getPredicateForSetCC(ISD::CondCode CC) {

Chris Lattner

2005-08-21 18:50:37 +0000

[diff] [blame]

2061

switch (CC) {

Chris Lattner

630bbce

2006-05-25 16:54:16 +0000

[diff] [blame]

2062

case ISD::SETUEQ:

Dale Johannesen

2008-11-07 22:54:33 +0000

[diff] [blame]

2063

case ISD::SETONE:

2064

case ISD::SETOLE:

2065

case ISD::SETOGE:

Torok Edwin

2009-07-14 16:55:14 +0000

[diff] [blame]

2066

llvm_unreachable("Should be lowered by legalize!");

2067

default: llvm_unreachable("Unknown condition!");

Dale Johannesen

2008-11-07 22:54:33 +0000

[diff] [blame]

2068

case ISD::SETOEQ:

Chris Lattner

2006-11-17 22:10:59 +0000

[diff] [blame]

2069

case ISD::SETEQ: return PPC::PRED_EQ;

Chris Lattner

630bbce

2006-05-25 16:54:16 +0000

[diff] [blame]

2070

case ISD::SETUNE:

Chris Lattner

2006-11-17 22:10:59 +0000

[diff] [blame]

2071

case ISD::SETNE: return PPC::PRED_NE;

Dale Johannesen

2008-11-07 22:54:33 +0000

[diff] [blame]

2072

case ISD::SETOLT:

Chris Lattner

2006-11-17 22:10:59 +0000

[diff] [blame]

2073

case ISD::SETLT: return PPC::PRED_LT;

Chris Lattner

2005-08-21 18:50:37 +0000

[diff] [blame]

2074

case ISD::SETULE:

Chris Lattner

2006-11-17 22:10:59 +0000

[diff] [blame]

2075

case ISD::SETLE: return PPC::PRED_LE;

Dale Johannesen

2008-11-07 22:54:33 +0000

[diff] [blame]

2076

case ISD::SETOGT:

Chris Lattner

2006-11-17 22:10:59 +0000

[diff] [blame]

2077

case ISD::SETGT: return PPC::PRED_GT;

Chris Lattner

2005-08-21 18:50:37 +0000

[diff] [blame]

2078

case ISD::SETUGE:

Chris Lattner

2006-11-17 22:10:59 +0000

[diff] [blame]

2079

case ISD::SETGE: return PPC::PRED_GE;

Chris Lattner

2006-11-17 22:10:59 +0000

[diff] [blame]

2080

case ISD::SETO: return PPC::PRED_NU;

2081

case ISD::SETUO: return PPC::PRED_UN;

Dale Johannesen

2008-11-07 22:54:33 +0000

[diff] [blame]

2082

// These two are invalid for floating point. Assume we have int.

2083

case ISD::SETULT: return PPC::PRED_LT;

2084

case ISD::SETUGT: return PPC::PRED_GT;

Chris Lattner

2005-08-21 18:50:37 +0000

[diff] [blame]

2085

}

Chris Lattner

2005-08-21 18:50:37 +0000

[diff] [blame]

2086

}

2087

Chris Lattner

2005-08-25 20:08:18 +0000

[diff] [blame]

2088

/// getCRIdxForSetCC - Return the index of the condition register field

2089

/// associated with the SetCC condition, and whether or not the field is

2090

/// treated as inverted. That is, lt = 0; ge = 0 inverted.

Ulrich Weigand

2013-07-03 15:13:30 +0000

[diff] [blame]

2091

static unsigned getCRIdxForSetCC(ISD::CondCode CC, bool &Invert) {

Chris Lattner

2008-01-08 06:46:30 +0000

[diff] [blame]

2092

Invert = false;

Chris Lattner

2005-08-25 20:08:18 +0000

[diff] [blame]

2093

switch (CC) {

Torok Edwin

2009-07-14 16:55:14 +0000

[diff] [blame]

2094

default: llvm_unreachable("Unknown condition!");

Chris Lattner

2008-01-08 06:46:30 +0000

[diff] [blame]

2095

case ISD::SETOLT:

2096

case ISD::SETLT: return 0; // Bit #0 = SETOLT

2097

case ISD::SETOGT:

2098

case ISD::SETGT: return 1; // Bit #1 = SETOGT

2099

case ISD::SETOEQ:

2100

case ISD::SETEQ: return 2; // Bit #2 = SETOEQ

2101

case ISD::SETUO: return 3; // Bit #3 = SETUO

Chris Lattner

2005-08-25 20:08:18 +0000

[diff] [blame]

2102

case ISD::SETUGE:

Chris Lattner

2008-01-08 06:46:30 +0000

[diff] [blame]

2103

case ISD::SETGE: Invert = true; return 0; // !Bit #0 = SETUGE

Chris Lattner

2005-08-25 20:08:18 +0000

[diff] [blame]

2104

case ISD::SETULE:

Chris Lattner

2008-01-08 06:46:30 +0000

[diff] [blame]

2105

case ISD::SETLE: Invert = true; return 1; // !Bit #1 = SETULE

Chris Lattner

1fbb0d3

2006-05-25 18:06:16 +0000

[diff] [blame]

2106

case ISD::SETUNE:

Chris Lattner

2008-01-08 06:46:30 +0000

[diff] [blame]

2107

case ISD::SETNE: Invert = true; return 2; // !Bit #2 = SETUNE

2108

case ISD::SETO: Invert = true; return 3; // !Bit #3 = SETO

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2109

case ISD::SETUEQ:

2110

case ISD::SETOGE:

2111

case ISD::SETOLE:

Dale Johannesen

2008-11-07 22:54:33 +0000

[diff] [blame]

2112

case ISD::SETONE:

Torok Edwin

2009-07-14 16:55:14 +0000

[diff] [blame]

2113

llvm_unreachable("Invalid branch code: should be expanded by legalize");

Dale Johannesen

2008-11-07 22:54:33 +0000

[diff] [blame]

2114

// These are invalid for floating point. Assume integer.

2115

case ISD::SETULT: return 0;

2116

case ISD::SETUGT: return 1;

Chris Lattner

2005-08-25 20:08:18 +0000

[diff] [blame]

2117

}

Chris Lattner

2005-08-25 20:08:18 +0000

[diff] [blame]

2118

}

Chris Lattner

c5292ec

2005-08-21 22:31:09 +0000

[diff] [blame]

2119

Adhemerval Zanella

2012-10-30 13:50:19 +0000

[diff] [blame]

2120

// getVCmpInst: return the vector compare instruction for the specified

2121

// vector type and condition code. Since this is for altivec specific code,

Kit Barton

2015-03-03 19:55:45 +0000

[diff] [blame]

2122

// only support the altivec types (v16i8, v8i16, v4i32, v2i64, and v4f32).

Ulrich Weigand

2014-08-04 13:13:57 +0000

[diff] [blame]

2123

static unsigned int getVCmpInst(MVT VecVT, ISD::CondCode CC,

2124

bool HasVSX, bool &Swap, bool &Negate) {

2125

Swap = false;

2126

Negate = false;

Adhemerval Zanella

2012-10-30 13:50:19 +0000

[diff] [blame]

2127

Ulrich Weigand

2014-08-04 13:13:57 +0000

[diff] [blame]

2128

if (VecVT.isFloatingPoint()) {

2129

/* Handle some cases by swapping input operands. */

2130

switch (CC) {

2131

case ISD::SETLE: CC = ISD::SETGE; Swap = true; break;

2132

case ISD::SETLT: CC = ISD::SETGT; Swap = true; break;

2133

case ISD::SETOLE: CC = ISD::SETOGE; Swap = true; break;

2134

case ISD::SETOLT: CC = ISD::SETOGT; Swap = true; break;

2135

case ISD::SETUGE: CC = ISD::SETULE; Swap = true; break;

2136

case ISD::SETUGT: CC = ISD::SETULT; Swap = true; break;

2137

default: break;

2138

}

2139

/* Handle some cases by negating the result. */

2140

switch (CC) {

2141

case ISD::SETNE: CC = ISD::SETEQ; Negate = true; break;

2142

case ISD::SETUNE: CC = ISD::SETOEQ; Negate = true; break;

2143

case ISD::SETULE: CC = ISD::SETOGT; Negate = true; break;

2144

case ISD::SETULT: CC = ISD::SETOGE; Negate = true; break;

2145

default: break;

2146

}

2147

/* We have instructions implementing the remaining cases. */

switch (CC) {

case ISD::SETEQ:

case ISD::SETOEQ:

if (VecVT == MVT::v4f32)

2152

return HasVSX ? PPC::XVCMPEQSP : PPC::VCMPEQFP;

2153

else if (VecVT == MVT::v2f64)

2154

return PPC::XVCMPEQDP;

break;

case ISD::SETGT:

case ISD::SETOGT:

if (VecVT == MVT::v4f32)

2159

return HasVSX ? PPC::XVCMPGTSP : PPC::VCMPGTFP;

2160

else if (VecVT == MVT::v2f64)

2161

return PPC::XVCMPGTDP;

break;

case ISD::SETGE:

case ISD::SETOGE:

if (VecVT == MVT::v4f32)

2166

return HasVSX ? PPC::XVCMPGESP : PPC::VCMPGEFP;

2167

else if (VecVT == MVT::v2f64)

2168

return PPC::XVCMPGEDP;

break;

default:

break;

}

llvm_unreachable("Invalid floating-point vector compare condition");

2174

} else {

2175

/* Handle some cases by swapping input operands. */

2176

switch (CC) {

2177

case ISD::SETGE: CC = ISD::SETLE; Swap = true; break;

2178

case ISD::SETLT: CC = ISD::SETGT; Swap = true; break;

2179

case ISD::SETUGE: CC = ISD::SETULE; Swap = true; break;

2180

case ISD::SETULT: CC = ISD::SETUGT; Swap = true; break;

2181

default: break;

2182

}

2183

/* Handle some cases by negating the result. */

2184

switch (CC) {

2185

case ISD::SETNE: CC = ISD::SETEQ; Negate = true; break;

2186

case ISD::SETUNE: CC = ISD::SETUEQ; Negate = true; break;

2187

case ISD::SETLE: CC = ISD::SETGT; Negate = true; break;

2188

case ISD::SETULE: CC = ISD::SETUGT; Negate = true; break;

2189

default: break;

2190

}

2191

/* We have instructions implementing the remaining cases. */

switch (CC) {

case ISD::SETEQ:

case ISD::SETUEQ:

if (VecVT == MVT::v16i8)

2196

return PPC::VCMPEQUB;

2197

else if (VecVT == MVT::v8i16)

2198

return PPC::VCMPEQUH;

2199

else if (VecVT == MVT::v4i32)

2200

return PPC::VCMPEQUW;

Kit Barton

2015-03-03 19:55:45 +0000

[diff] [blame]

2201

else if (VecVT == MVT::v2i64)

2202

return PPC::VCMPEQUD;

Ulrich Weigand

2014-08-04 13:13:57 +0000

[diff] [blame]

2203

break;

2204

case ISD::SETGT:

2205

if (VecVT == MVT::v16i8)

2206

return PPC::VCMPGTSB;

2207

else if (VecVT == MVT::v8i16)

2208

return PPC::VCMPGTSH;

2209

else if (VecVT == MVT::v4i32)

2210

return PPC::VCMPGTSW;

Kit Barton

2015-03-03 19:55:45 +0000

[diff] [blame]

2211

else if (VecVT == MVT::v2i64)

2212

return PPC::VCMPGTSD;

Ulrich Weigand

2014-08-04 13:13:57 +0000

[diff] [blame]

2213

break;

2214

case ISD::SETUGT:

2215

if (VecVT == MVT::v16i8)

2216

return PPC::VCMPGTUB;

2217

else if (VecVT == MVT::v8i16)

2218

return PPC::VCMPGTUH;

2219

else if (VecVT == MVT::v4i32)

2220

return PPC::VCMPGTUW;

Kit Barton

2015-03-03 19:55:45 +0000

[diff] [blame]

2221

else if (VecVT == MVT::v2i64)

2222

return PPC::VCMPGTUD;

Ulrich Weigand

2014-08-04 13:13:57 +0000

[diff] [blame]

break;

default:

break;

}

llvm_unreachable("Invalid integer vector compare condition");

Adhemerval Zanella

2012-10-30 13:50:19 +0000

[diff] [blame]

}

}

Dan Gohman

2010-01-05 01:24:18 +0000

[diff] [blame]

2231

SDNode *PPCDAGToDAGISel::SelectSETCC(SDNode *N) {

Andrew Trick

2013-05-25 02:42:55 +0000

[diff] [blame]

2232

SDLoc dl(N);

Chris Lattner

2005-10-06 19:03:35 +0000

[diff] [blame]

2233

unsigned Imm;

2234

ISD::CondCode CC = cast<CondCodeSDNode>(N->getOperand(2))->get();

Roman Divacky

2011-06-20 15:28:39 +0000

[diff] [blame]

2235

EVT PtrVT = CurDAG->getTargetLoweringInfo().getPointerTy();

2236

bool isPPC64 = (PtrVT == MVT::i64);

2237

Eric Christopher

2014-05-22 01:07:24 +0000

[diff] [blame]

2238

if (!PPCSubTarget->useCRBits() &&

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

2239

isInt32Immediate(N->getOperand(1), Imm)) {

Chris Lattner

2005-10-06 19:03:35 +0000

[diff] [blame]

2240

// We can codegen setcc op, imm very efficiently compared to a brcond.

2241

// Check for those cases here.

2242

// setcc op, 0

2243

if (Imm == 0) {

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2244

SDValue Op = N->getOperand(0);

Chris Lattner

2005-10-06 19:03:35 +0000

[diff] [blame]

2245

switch (CC) {

Chris Lattner

2005-10-21 21:17:10 +0000

[diff] [blame]

2246

default: break;

Evan Cheng

2006-08-27 08:14:06 +0000

[diff] [blame]

2247

case ISD::SETEQ: {

Dan Gohman

2009-09-25 18:54:59 +0000

[diff] [blame]

2248

Op = SDValue(CurDAG->getMachineNode(PPC::CNTLZW, dl, MVT::i32, Op), 0);

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2249

SDValue Ops[] = { Op, getI32Imm(27), getI32Imm(5), getI32Imm(31) };

Craig Topper

2014-04-27 19:21:11 +0000

[diff] [blame]

2250

return CurDAG->SelectNodeTo(N, PPC::RLWINM, MVT::i32, Ops);

Evan Cheng

2006-08-27 08:14:06 +0000

[diff] [blame]

2251

}

Chris Lattner

2005-10-21 21:17:10 +0000

[diff] [blame]

2252

case ISD::SETNE: {

Roman Divacky

2011-06-20 15:28:39 +0000

[diff] [blame]

2253

if (isPPC64) break;

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2254

SDValue AD =

Chris Lattner

3e5fbd7

2010-12-21 02:38:05 +0000

[diff] [blame]

2255

SDValue(CurDAG->getMachineNode(PPC::ADDIC, dl, MVT::i32, MVT::Glue,

Dan Gohman

2009-09-25 18:54:59 +0000

[diff] [blame]

2256

Op, getI32Imm(~0U)), 0);

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2257

return CurDAG->SelectNodeTo(N, PPC::SUBFE, MVT::i32, AD, Op,

Evan Cheng

34b70ee

2006-08-26 08:00:10 +0000

[diff] [blame]

2258

AD.getValue(1));

Chris Lattner

2005-10-06 19:03:35 +0000

[diff] [blame]

2259

}

Evan Cheng

2006-08-27 08:14:06 +0000

[diff] [blame]

2260

case ISD::SETLT: {

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2261

SDValue Ops[] = { Op, getI32Imm(1), getI32Imm(31), getI32Imm(31) };

Craig Topper

2014-04-27 19:21:11 +0000

[diff] [blame]

2262

return CurDAG->SelectNodeTo(N, PPC::RLWINM, MVT::i32, Ops);

Evan Cheng

2006-08-27 08:14:06 +0000

[diff] [blame]

2263

}

Chris Lattner

2005-10-21 21:17:10 +0000

[diff] [blame]

2264

case ISD::SETGT: {

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2265

SDValue T =

Dan Gohman

2009-09-25 18:54:59 +0000

[diff] [blame]

2266

SDValue(CurDAG->getMachineNode(PPC::NEG, dl, MVT::i32, Op), 0);

2267

T = SDValue(CurDAG->getMachineNode(PPC::ANDC, dl, MVT::i32, T, Op), 0);

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2268

SDValue Ops[] = { T, getI32Imm(1), getI32Imm(31), getI32Imm(31) };

Craig Topper

2014-04-27 19:21:11 +0000

[diff] [blame]

2269

return CurDAG->SelectNodeTo(N, PPC::RLWINM, MVT::i32, Ops);

Chris Lattner

2005-10-21 21:17:10 +0000

[diff] [blame]

2270

}

2271

}

Chris Lattner

2005-10-06 19:03:35 +0000

[diff] [blame]

2272

} else if (Imm == ~0U) { // setcc op, -1

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2273

SDValue Op = N->getOperand(0);

Chris Lattner

2005-10-06 19:03:35 +0000

[diff] [blame]

2274

switch (CC) {

Chris Lattner

2005-10-21 21:17:10 +0000

[diff] [blame]

2275

default: break;

2276

case ISD::SETEQ:

Roman Divacky

2011-06-20 15:28:39 +0000

[diff] [blame]

2277

if (isPPC64) break;

Chris Lattner

3e5fbd7

2010-12-21 02:38:05 +0000

[diff] [blame]

2278

Op = SDValue(CurDAG->getMachineNode(PPC::ADDIC, dl, MVT::i32, MVT::Glue,

Dan Gohman

2009-09-25 18:54:59 +0000

[diff] [blame]

2279

Op, getI32Imm(1)), 0);

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2280

return CurDAG->SelectNodeTo(N, PPC::ADDZE, MVT::i32,

2281

SDValue(CurDAG->getMachineNode(PPC::LI, dl,

Dan Gohman

2009-09-25 18:54:59 +0000

[diff] [blame]

2282

MVT::i32,

2283

getI32Imm(0)), 0),

Dale Johannesen

f08a47b

2009-02-04 23:02:30 +0000

[diff] [blame]

2284

Op.getValue(1));

Chris Lattner

2005-10-21 21:17:10 +0000

[diff] [blame]

2285

case ISD::SETNE: {

Roman Divacky

2011-06-20 15:28:39 +0000

[diff] [blame]

2286

if (isPPC64) break;

Dan Gohman

2009-09-25 18:54:59 +0000

[diff] [blame]

2287

Op = SDValue(CurDAG->getMachineNode(PPC::NOR, dl, MVT::i32, Op, Op), 0);

Chris Lattner

3e5fbd7

2010-12-21 02:38:05 +0000

[diff] [blame]

2288

SDNode *AD = CurDAG->getMachineNode(PPC::ADDIC, dl, MVT::i32, MVT::Glue,

Dan Gohman

2009-09-25 18:54:59 +0000

[diff] [blame]

2289

Op, getI32Imm(~0U));

Owen Anderson

2009-08-11 20:47:22 +0000

[diff] [blame]

2290

return CurDAG->SelectNodeTo(N, PPC::SUBFE, MVT::i32, SDValue(AD, 0),

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2291

Op, SDValue(AD, 1));

Chris Lattner

2005-10-06 19:03:35 +0000

[diff] [blame]

2292

}

Chris Lattner

2005-10-21 21:17:10 +0000

[diff] [blame]

2293

case ISD::SETLT: {

Dan Gohman

2009-09-25 18:54:59 +0000

[diff] [blame]

2294

SDValue AD = SDValue(CurDAG->getMachineNode(PPC::ADDI, dl, MVT::i32, Op,

2295

getI32Imm(1)), 0);

2296

SDValue AN = SDValue(CurDAG->getMachineNode(PPC::AND, dl, MVT::i32, AD,

2297

Op), 0);

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2298

SDValue Ops[] = { AN, getI32Imm(1), getI32Imm(31), getI32Imm(31) };

Craig Topper

2014-04-27 19:21:11 +0000

[diff] [blame]

2299

return CurDAG->SelectNodeTo(N, PPC::RLWINM, MVT::i32, Ops);

Chris Lattner

2005-10-21 21:17:10 +0000

[diff] [blame]

2300

}

Evan Cheng

2006-08-27 08:14:06 +0000

[diff] [blame]

2301

case ISD::SETGT: {

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2302

SDValue Ops[] = { Op, getI32Imm(1), getI32Imm(31), getI32Imm(31) };

Michael Liao

2013-04-19 22:22:57 +0000

[diff] [blame]

2303

Op = SDValue(CurDAG->getMachineNode(PPC::RLWINM, dl, MVT::i32, Ops),

Dale Johannesen

f08a47b

2009-02-04 23:02:30 +0000

[diff] [blame]

2304

0);

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2305

return CurDAG->SelectNodeTo(N, PPC::XORI, MVT::i32, Op,

Evan Cheng

34b70ee

2006-08-26 08:00:10 +0000

[diff] [blame]

2306

getI32Imm(1));

Chris Lattner

2005-10-21 21:17:10 +0000

[diff] [blame]

2307

}

Evan Cheng

2006-08-27 08:14:06 +0000

[diff] [blame]

2308

}

Chris Lattner

2005-10-06 19:03:35 +0000

[diff] [blame]

2309

}

2310

}

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2311

Adhemerval Zanella

2012-10-08 18:59:53 +0000

[diff] [blame]

2312

SDValue LHS = N->getOperand(0);

2313

SDValue RHS = N->getOperand(1);

2314

Adhemerval Zanella

2012-10-30 13:50:19 +0000

[diff] [blame]

2315

// Altivec Vector compare instructions do not set any CR register by default and

2316

// vector compare operations return the same type as the operands.

Adhemerval Zanella

2012-10-08 18:59:53 +0000

[diff] [blame]

2317

if (LHS.getValueType().isVector()) {

Hal Finkel

2015-02-25 01:06:45 +0000

[diff] [blame]

2318

if (PPCSubTarget->hasQPX())

2319

return nullptr;

2320

Adhemerval Zanella

2012-10-30 13:50:19 +0000

[diff] [blame]

2321

EVT VecVT = LHS.getValueType();

Ulrich Weigand

2014-08-04 13:13:57 +0000

[diff] [blame]

2322

bool Swap, Negate;

2323

unsigned int VCmpInst = getVCmpInst(VecVT.getSimpleVT(), CC,

2324

PPCSubTarget->hasVSX(), Swap, Negate);

2325

if (Swap)

2326

std::swap(LHS, RHS);

Adhemerval Zanella

2012-10-30 13:50:19 +0000

[diff] [blame]

2327

Ulrich Weigand

2014-08-04 13:13:57 +0000

[diff] [blame]

2328

if (Negate) {

2329

SDValue VCmp(CurDAG->getMachineNode(VCmpInst, dl, VecVT, LHS, RHS), 0);

2330

return CurDAG->SelectNodeTo(N, PPCSubTarget->hasVSX() ? PPC::XXLNOR :

2331

PPC::VNOR,

2332

VecVT, VCmp, VCmp);

Adhemerval Zanella

2012-10-30 13:50:19 +0000

[diff] [blame]

2333

}

Ulrich Weigand

2014-08-04 13:13:57 +0000

[diff] [blame]

2334

2335

return CurDAG->SelectNodeTo(N, VCmpInst, VecVT, LHS, RHS);

Adhemerval Zanella

2012-10-08 18:59:53 +0000

[diff] [blame]

2336

}

2337

Eric Christopher

2014-05-22 01:07:24 +0000

[diff] [blame]

2338

if (PPCSubTarget->useCRBits())

Craig Topper

2014-04-25 05:30:21 +0000

[diff] [blame]

2339

return nullptr;

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

2340

Chris Lattner

2005-10-06 19:03:35 +0000

[diff] [blame]

2341

bool Inv;

Ulrich Weigand

2013-07-03 15:13:30 +0000

[diff] [blame]

2342

unsigned Idx = getCRIdxForSetCC(CC, Inv);

Adhemerval Zanella

2012-10-08 18:59:53 +0000

[diff] [blame]

2343

SDValue CCReg = SelectCC(LHS, RHS, CC, dl);

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2344

SDValue IntCR;

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2345

Chris Lattner

2005-10-06 19:03:35 +0000

[diff] [blame]

2346

// Force the ccreg into CR7.

Owen Anderson

2009-08-11 20:47:22 +0000

[diff] [blame]

2347

SDValue CR7Reg = CurDAG->getRegister(PPC::CR7, MVT::i32);

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2348

Craig Topper

2014-04-25 05:30:21 +0000

[diff] [blame]

2349

SDValue InFlag(nullptr, 0); // Null incoming flag value.

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2350

CCReg = CurDAG->getCopyToReg(CurDAG->getEntryNode(), dl, CR7Reg, CCReg,

Chris Lattner

bd09910

2005-12-01 03:50:19 +0000

[diff] [blame]

2351

InFlag).getValue(1);

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2352

Ulrich Weigand

d5ebc62

2013-07-03 17:05:42 +0000

[diff] [blame]

2353

IntCR = SDValue(CurDAG->getMachineNode(PPC::MFOCRF, dl, MVT::i32, CR7Reg,

2354

CCReg), 0);

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2355

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2356

SDValue Ops[] = { IntCR, getI32Imm((32-(3-Idx)) & 31),

Evan Cheng

2006-08-27 08:14:06 +0000

[diff] [blame]

2357

getI32Imm(31), getI32Imm(31) };

Ulrich Weigand

2013-07-03 15:13:30 +0000

[diff] [blame]

2358

if (!Inv)

Craig Topper

2014-04-27 19:21:11 +0000

[diff] [blame]

2359

return CurDAG->SelectNodeTo(N, PPC::RLWINM, MVT::i32, Ops);

Chris Lattner

2008-01-08 06:46:30 +0000

[diff] [blame]

2360

2361

// Get the specified bit.

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2362

SDValue Tmp =

Michael Liao

2013-04-19 22:22:57 +0000

[diff] [blame]

2363

SDValue(CurDAG->getMachineNode(PPC::RLWINM, dl, MVT::i32, Ops), 0);

Ulrich Weigand

2013-07-03 15:13:30 +0000

[diff] [blame]

2364

return CurDAG->SelectNodeTo(N, PPC::XORI, MVT::i32, Tmp, getI32Imm(1));

Chris Lattner

2005-10-06 19:03:35 +0000

[diff] [blame]

2365

}

Chris Lattner

502a369

2005-10-06 18:56:10 +0000

[diff] [blame]

2366

Hal Finkel

2015-02-25 21:36:59 +0000

[diff] [blame]

2367

SDNode *PPCDAGToDAGISel::transferMemOperands(SDNode *N, SDNode *Result) {

2368

// Transfer memoperands.

2369

MachineSDNode::mmo_iterator MemOp = MF->allocateMemRefsArray(1);

2370

MemOp[0] = cast<MemSDNode>(N)->getMemOperand();

2371

cast<MachineSDNode>(Result)->setMemRefs(MemOp, MemOp + 1);

return Result;

}

Chris Lattner

2005-10-06 19:07:45 +0000

[diff] [blame]

2375

Chris Lattner

2005-08-17 19:33:03 +0000

[diff] [blame]

2376

// Select - Convert the specified operand from a target-independent to a

2377

// target-specific node if it hasn't already been changed.

Dan Gohman

2010-01-05 01:24:18 +0000

[diff] [blame]

2378

SDNode *PPCDAGToDAGISel::Select(SDNode *N) {

Andrew Trick

2013-05-25 02:42:55 +0000

[diff] [blame]

2379

SDLoc dl(N);

Tim Northover

31d093c

2013-09-22 08:21:56 +0000

[diff] [blame]

2380

if (N->isMachineOpcode()) {

2381

N->setNodeId(-1);

Craig Topper

2014-04-25 05:30:21 +0000

[diff] [blame]

2382

return nullptr; // Already selected.

Tim Northover

31d093c

2013-09-22 08:21:56 +0000

[diff] [blame]

2383

}

Chris Lattner

08c319f

2005-09-29 00:59:32 +0000

[diff] [blame]

2384

Hal Finkel

51b3fd1

2014-09-02 06:23:54 +0000

[diff] [blame]

2385

// In case any misguided DAG-level optimizations form an ADD with a

2386

// TargetConstant operand, crash here instead of miscompiling (by selecting

2387

// an r+r add instead of some kind of r+i add).

2388

if (N->getOpcode() == ISD::ADD &&

2389

N->getOperand(1).getOpcode() == ISD::TargetConstant)

2390

llvm_unreachable("Invalid ADD with TargetConstant operand");

2391

Hal Finkel

2014-12-16 05:51:41 +0000

[diff] [blame]

2392

// Try matching complex bit permutations before doing anything else.

2393

if (SDNode *NN = SelectBitPermutation(N))

2394

return NN;

2395

Chris Lattner

2005-08-17 19:33:03 +0000

[diff] [blame]

2396

switch (N->getOpcode()) {

Chris Lattner

498915d

2005-09-07 23:45:15 +0000

[diff] [blame]

2397

default: break;

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2398

Jim Laskey

095e6f3

2006-12-12 13:23:43 +0000

[diff] [blame]

2399

case ISD::Constant: {

Hal Finkel

2015-01-01 02:53:29 +0000

[diff] [blame]

2400

if (N->getValueType(0) == MVT::i64)

2401

return SelectInt64(CurDAG, N);

Jim Laskey

095e6f3

2006-12-12 13:23:43 +0000

[diff] [blame]

2402

break;

2403

}

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2404

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

2405

case ISD::SETCC: {

2406

SDNode *SN = SelectSETCC(N);

if (SN)

return SN;

break;

}

Evan Cheng

6dc90ca

2006-02-09 00:37:58 +0000

[diff] [blame]

2411

case PPCISD::GlobalBaseReg:

Evan Cheng

61413a3

2006-08-26 05:34:46 +0000

[diff] [blame]

2412

return getGlobalBaseReg();

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2413

Hal Finkel

2014-12-11 22:51:06 +0000

[diff] [blame]

2414

case ISD::FrameIndex:

2415

return getFrameIndex(N, N);

Chris Lattner

6961fc7

2006-03-26 10:06:40 +0000

[diff] [blame]

2416

Ulrich Weigand

d5ebc62

2013-07-03 17:05:42 +0000

[diff] [blame]

2417

case PPCISD::MFOCRF: {

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2418

SDValue InFlag = N->getOperand(1);

Ulrich Weigand

d5ebc62

2013-07-03 17:05:42 +0000

[diff] [blame]

2419

return CurDAG->getMachineNode(PPC::MFOCRF, dl, MVT::i32,

2420

N->getOperand(0), InFlag);

Chris Lattner

6961fc7

2006-03-26 10:06:40 +0000

[diff] [blame]

2421

}

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2422

Hal Finkel

bbdee93

2014-12-02 22:01:00 +0000

[diff] [blame]

2423

case PPCISD::READ_TIME_BASE: {

2424

return CurDAG->getMachineNode(PPC::ReadTB, dl, MVT::i32, MVT::i32,

2425

MVT::Other, N->getOperand(0));

2426

}

2427

Hal Finkel

13d104b

2014-12-11 18:37:52 +0000

[diff] [blame]

2428

case PPCISD::SRA_ADDZE: {

2429

SDValue N0 = N->getOperand(0);

2430

SDValue ShiftAmt =

2431

CurDAG->getTargetConstant(*cast<ConstantSDNode>(N->getOperand(1))->

2432

getConstantIntValue(), N->getValueType(0));

2433

if (N->getValueType(0) == MVT::i64) {

2434

SDNode *Op =

2435

CurDAG->getMachineNode(PPC::SRADI, dl, MVT::i64, MVT::Glue,

2436

N0, ShiftAmt);

2437

return CurDAG->SelectNodeTo(N, PPC::ADDZE8, MVT::i64,

2438

SDValue(Op, 0), SDValue(Op, 1));

2439

} else {

2440

assert(N->getValueType(0) == MVT::i32 &&

2441

"Expecting i64 or i32 in PPCISD::SRA_ADDZE");

2442

SDNode *Op =

2443

CurDAG->getMachineNode(PPC::SRAWI, dl, MVT::i32, MVT::Glue,

2444

N0, ShiftAmt);

2445

return CurDAG->SelectNodeTo(N, PPC::ADDZE, MVT::i32,

2446

SDValue(Op, 0), SDValue(Op, 1));

Chris Lattner

dc66457

2005-08-25 17:50:06 +0000

[diff] [blame]

2447

}

Chris Lattner

6e184f2

2005-08-25 22:04:30 +0000

[diff] [blame]

2448

}

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2449

Chris Lattner

2006-11-10 02:08:47 +0000

[diff] [blame]

2450

case ISD::LOAD: {

2451

// Handle preincrement loads.

Dan Gohman

2010-01-05 01:24:18 +0000

[diff] [blame]

2452

LoadSDNode *LD = cast<LoadSDNode>(N);

Owen Anderson

53aa7a9

2009-08-10 22:56:29 +0000

[diff] [blame]

2453

EVT LoadedVT = LD->getMemoryVT();

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2454

Chris Lattner

2006-11-10 02:08:47 +0000

[diff] [blame]

2455

// Normal loads are handled by code generated from the .td file.

2456

if (LD->getAddressingMode() != ISD::PRE_INC)

2457

break;

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2458

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2459

SDValue Offset = LD->getOffset();

Ulrich Weigand

d1b99d3

2013-03-22 14:58:17 +0000

[diff] [blame]

2460

if (Offset.getOpcode() == ISD::TargetConstant ||

Chris Lattner

c5102bf

2006-11-11 04:53:30 +0000

[diff] [blame]

2461

Offset.getOpcode() == ISD::TargetGlobalAddress) {

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2462

Chris Lattner

2006-11-15 19:55:13 +0000

[diff] [blame]

2463

unsigned Opcode;

2464

bool isSExt = LD->getExtensionType() == ISD::SEXTLOAD;

Owen Anderson

2009-08-11 20:47:22 +0000

[diff] [blame]

2465

if (LD->getValueType(0) != MVT::i64) {

Chris Lattner

2006-11-15 19:55:13 +0000

[diff] [blame]

2466

// Handle PPC32 integer and normal FP loads.

Owen Anderson

2009-08-11 20:47:22 +0000

[diff] [blame]

2467

assert((!isSExt || LoadedVT == MVT::i16) && "Invalid sext update load");

2468

switch (LoadedVT.getSimpleVT().SimpleTy) {

Torok Edwin

2009-07-14 16:55:14 +0000

[diff] [blame]

2469

default: llvm_unreachable("Invalid PPC load type!");

Owen Anderson

2009-08-11 20:47:22 +0000

[diff] [blame]

2470

case MVT::f64: Opcode = PPC::LFDU; break;

2471

case MVT::f32: Opcode = PPC::LFSU; break;

2472

case MVT::i32: Opcode = PPC::LWZU; break;

2473

case MVT::i16: Opcode = isSExt ? PPC::LHAU : PPC::LHZU; break;

2474

case MVT::i1:

2475

case MVT::i8: Opcode = PPC::LBZU; break;

Chris Lattner

2006-11-15 19:55:13 +0000

[diff] [blame]

2476

}

2477

} else {

Owen Anderson

2009-08-11 20:47:22 +0000

[diff] [blame]

2478

assert(LD->getValueType(0) == MVT::i64 && "Unknown load result type!");

2479

assert((!isSExt || LoadedVT == MVT::i16) && "Invalid sext update load");

2480

switch (LoadedVT.getSimpleVT().SimpleTy) {

Torok Edwin

2009-07-14 16:55:14 +0000

[diff] [blame]

2481

default: llvm_unreachable("Invalid PPC load type!");

Owen Anderson

2009-08-11 20:47:22 +0000

[diff] [blame]

2482

case MVT::i64: Opcode = PPC::LDU; break;

2483

case MVT::i32: Opcode = PPC::LWZU8; break;

2484

case MVT::i16: Opcode = isSExt ? PPC::LHAU8 : PPC::LHZU8; break;

2485

case MVT::i1:

2486

case MVT::i8: Opcode = PPC::LBZU8; break;

Chris Lattner

2006-11-15 19:55:13 +0000

[diff] [blame]

2487

}

2488

}

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2489

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2490

SDValue Chain = LD->getChain();

2491

SDValue Base = LD->getBasePtr();

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2492

SDValue Ops[] = { Offset, Base, Chain };

Hal Finkel

2015-02-25 21:36:59 +0000

[diff] [blame]

2493

return transferMemOperands(N, CurDAG->getMachineNode(Opcode, dl,

2494

LD->getValueType(0),

2495

PPCLowering->getPointerTy(),

2496

MVT::Other, Ops));

Chris Lattner

2006-11-10 02:08:47 +0000

[diff] [blame]

2497

} else {

Hal Finkel

ca542be

2012-06-20 15:43:03 +0000

[diff] [blame]

2498

unsigned Opcode;

2499

bool isSExt = LD->getExtensionType() == ISD::SEXTLOAD;

2500

if (LD->getValueType(0) != MVT::i64) {

2501

// Handle PPC32 integer and normal FP loads.

2502

assert((!isSExt || LoadedVT == MVT::i16) && "Invalid sext update load");

2503

switch (LoadedVT.getSimpleVT().SimpleTy) {

2504

default: llvm_unreachable("Invalid PPC load type!");

Hal Finkel

2015-02-25 01:06:45 +0000

[diff] [blame]

2505

case MVT::v4f64: Opcode = PPC::QVLFDUX; break; // QPX

2506

case MVT::v4f32: Opcode = PPC::QVLFSUX; break; // QPX

Hal Finkel

ca542be

2012-06-20 15:43:03 +0000

[diff] [blame]

2507

case MVT::f64: Opcode = PPC::LFDUX; break;

2508

case MVT::f32: Opcode = PPC::LFSUX; break;

2509

case MVT::i32: Opcode = PPC::LWZUX; break;

2510

case MVT::i16: Opcode = isSExt ? PPC::LHAUX : PPC::LHZUX; break;

2511

case MVT::i1:

2512

case MVT::i8: Opcode = PPC::LBZUX; break;

2513

}

2514

} else {

2515

assert(LD->getValueType(0) == MVT::i64 && "Unknown load result type!");

2516

assert((!isSExt || LoadedVT == MVT::i16 || LoadedVT == MVT::i32) &&

2517

"Invalid sext update load");

2518

switch (LoadedVT.getSimpleVT().SimpleTy) {

2519

default: llvm_unreachable("Invalid PPC load type!");

2520

case MVT::i64: Opcode = PPC::LDUX; break;

2521

case MVT::i32: Opcode = isSExt ? PPC::LWAUX : PPC::LWZUX8; break;

2522

case MVT::i16: Opcode = isSExt ? PPC::LHAUX8 : PPC::LHZUX8; break;

2523

case MVT::i1:

2524

case MVT::i8: Opcode = PPC::LBZUX8; break;

}

}

SDValue Chain = LD->getChain();

2529

SDValue Base = LD->getBasePtr();

Ulrich Weigand

e90b022

2013-03-22 14:58:48 +0000

[diff] [blame]

2530

SDValue Ops[] = { Base, Offset, Chain };

Hal Finkel

2015-02-25 21:36:59 +0000

[diff] [blame]

2531

return transferMemOperands(N, CurDAG->getMachineNode(Opcode, dl,

2532

LD->getValueType(0),

2533

PPCLowering->getPointerTy(),

2534

MVT::Other, Ops));

Chris Lattner

2006-11-10 02:08:47 +0000

[diff] [blame]

2535

}

2536

}

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2537

Nate Begeman

2005-08-18 07:30:46 +0000

[diff] [blame]

2538

case ISD::AND: {

Nate Begeman

2006-09-22 05:01:56 +0000

[diff] [blame]

2539

unsigned Imm, Imm2, SH, MB, ME;

Hal Finkel

e39526a

2012-08-28 02:10:15 +0000

[diff] [blame]

2540

uint64_t Imm64;

Nate Begeman

2006-09-22 05:01:56 +0000

[diff] [blame]

2541

Nate Begeman

2005-08-18 07:30:46 +0000

[diff] [blame]

2542

// If this is an and of a value rotated between 0 and 31 bits and then and'd

2543

// with a mask, emit rlwinm

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

2544

if (isInt32Immediate(N->getOperand(1), Imm) &&

Gabor Greif

2008-08-28 21:40:38 +0000

[diff] [blame]

2545

isRotateAndMask(N->getOperand(0).getNode(), Imm, false, SH, MB, ME)) {

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2546

SDValue Val = N->getOperand(0).getOperand(0);

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2547

SDValue Ops[] = { Val, getI32Imm(SH), getI32Imm(MB), getI32Imm(ME) };

Craig Topper

2014-04-27 19:21:11 +0000

[diff] [blame]

2548

return CurDAG->SelectNodeTo(N, PPC::RLWINM, MVT::i32, Ops);

Nate Begeman

2005-08-18 07:30:46 +0000

[diff] [blame]

2549

}

Nate Begeman

2006-09-22 05:01:56 +0000

[diff] [blame]

2550

// If this is just a masked value where the input is not handled above, and

2551

// is not a rotate-left (handled by a pattern in the .td file), emit rlwinm

2552

if (isInt32Immediate(N->getOperand(1), Imm) &&

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2553

isRunOfOnes(Imm, MB, ME) &&

Nate Begeman

2006-09-22 05:01:56 +0000

[diff] [blame]

2554

N->getOperand(0).getOpcode() != ISD::ROTL) {

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2555

SDValue Val = N->getOperand(0);

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2556

SDValue Ops[] = { Val, getI32Imm(0), getI32Imm(MB), getI32Imm(ME) };

Craig Topper

2014-04-27 19:21:11 +0000

[diff] [blame]

2557

return CurDAG->SelectNodeTo(N, PPC::RLWINM, MVT::i32, Ops);

Nate Begeman

2006-09-22 05:01:56 +0000

[diff] [blame]

2558

}

Hal Finkel

e39526a

2012-08-28 02:10:15 +0000

[diff] [blame]

2559

// If this is a 64-bit zero-extension mask, emit rldicl.

2560

if (isInt64Immediate(N->getOperand(1).getNode(), Imm64) &&

2561

isMask_64(Imm64)) {

2562

SDValue Val = N->getOperand(0);

Benjamin Kramer

5f6a907

2015-02-12 15:35:40 +0000

[diff] [blame]

2563

MB = 64 - countTrailingOnes(Imm64);

Hal Finkel

22498fa

2013-11-20 01:10:15 +0000

[diff] [blame]

2564

SH = 0;

2565

2566

// If the operand is a logical right shift, we can fold it into this

2567

// instruction: rldicl(rldicl(x, 64-n, n), 0, mb) -> rldicl(x, 64-n, mb)

2568

// for n <= mb. The right shift is really a left rotate followed by a

2569

// mask, and this mask is a more-restrictive sub-mask of the mask implied

2570

// by the shift.

2571

if (Val.getOpcode() == ISD::SRL &&

2572

isInt32Immediate(Val.getOperand(1).getNode(), Imm) && Imm <= MB) {

2573

assert(Imm < 64 && "Illegal shift amount");

2574

Val = Val.getOperand(0);

SH = 64 - Imm;

}

SDValue Ops[] = { Val, getI32Imm(SH), getI32Imm(MB) };

Craig Topper

2014-04-27 19:21:11 +0000

[diff] [blame]

2579

return CurDAG->SelectNodeTo(N, PPC::RLDICL, MVT::i64, Ops);

Hal Finkel

e39526a

2012-08-28 02:10:15 +0000

[diff] [blame]

2580

}

Nate Begeman

2006-09-22 05:01:56 +0000

[diff] [blame]

2581

// AND X, 0 -> 0, not "rlwinm 32".

2582

if (isInt32Immediate(N->getOperand(1), Imm) && (Imm == 0)) {

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2583

ReplaceUses(SDValue(N, 0), N->getOperand(1));

Craig Topper

2014-04-25 05:30:21 +0000

[diff] [blame]

2584

return nullptr;

Nate Begeman

2006-09-22 05:01:56 +0000

[diff] [blame]

2585

}

Nate Begeman

2005-12-24 01:00:15 +0000

[diff] [blame]

2586

// ISD::OR doesn't get all the bitfield insertion fun.

2587

// (and (or x, c1), c2) where isRunOfOnes(~(c1^c2)) is a bitfield insert

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2588

if (isInt32Immediate(N->getOperand(1), Imm) &&

Nate Begeman

2005-12-24 01:00:15 +0000

[diff] [blame]

2589

N->getOperand(0).getOpcode() == ISD::OR &&

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

2590

isInt32Immediate(N->getOperand(0).getOperand(1), Imm2)) {

Chris Lattner

20c88df

2006-01-05 18:32:49 +0000

[diff] [blame]

2591

unsigned MB, ME;

Nate Begeman

2005-12-24 01:00:15 +0000

[diff] [blame]

2592

Imm = ~(Imm^Imm2);

2593

if (isRunOfOnes(Imm, MB, ME)) {

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2594

SDValue Ops[] = { N->getOperand(0).getOperand(0),

Evan Cheng

2006-08-27 08:14:06 +0000

[diff] [blame]

2595

N->getOperand(0).getOperand(1),

2596

getI32Imm(0), getI32Imm(MB),getI32Imm(ME) };

Michael Liao

2013-04-19 22:22:57 +0000

[diff] [blame]

2597

return CurDAG->getMachineNode(PPC::RLWIMI, dl, MVT::i32, Ops);

Nate Begeman

2005-12-24 01:00:15 +0000

[diff] [blame]

2598

}

2599

}

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2600

Chris Lattner

1de5706

2005-09-29 23:33:31 +0000

[diff] [blame]

2601

// Other cases are autogenerated.

2602

break;

Nate Begeman

2005-08-18 07:30:46 +0000

[diff] [blame]

2603

}

Hal Finkel

2014-12-11 22:51:06 +0000

[diff] [blame]

2604

case ISD::OR: {

Owen Anderson

2009-08-11 20:47:22 +0000

[diff] [blame]

2605

if (N->getValueType(0) == MVT::i32)

Chris Lattner

bc485fd

2006-08-15 23:48:22 +0000

[diff] [blame]

2606

if (SDNode *I = SelectBitfieldInsert(N))

2607

return I;

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2608

Hal Finkel

2014-12-11 22:51:06 +0000

[diff] [blame]

2609

short Imm;

2610

if (N->getOperand(0)->getOpcode() == ISD::FrameIndex &&

2611

isIntS16Immediate(N->getOperand(1), Imm)) {

2612

APInt LHSKnownZero, LHSKnownOne;

2613

CurDAG->computeKnownBits(N->getOperand(0), LHSKnownZero, LHSKnownOne);

2614

2615

// If this is equivalent to an add, then we can fold it with the

2616

// FrameIndex calculation.

2617

if ((LHSKnownZero.getZExtValue()|~(uint64_t)Imm) == ~0ULL)

2618

return getFrameIndex(N, N->getOperand(0).getNode(), (int)Imm);

2619

}

2620

Chris Lattner

1de5706

2005-09-29 23:33:31 +0000

[diff] [blame]

2621

// Other cases are autogenerated.

2622

break;

Hal Finkel

2014-12-11 22:51:06 +0000

[diff] [blame]

}

case ISD::ADD: {

short Imm;

if (N->getOperand(0)->getOpcode() == ISD::FrameIndex &&

2627

isIntS16Immediate(N->getOperand(1), Imm))

2628

return getFrameIndex(N, N->getOperand(0).getNode(), (int)Imm);

2629

2630

break;

2631

}

Nate Begeman

33acb2c

2005-08-18 23:38:00 +0000

[diff] [blame]

2632

case ISD::SHL: {

2633

unsigned Imm, SH, MB, ME;

Gabor Greif

2008-08-28 21:40:38 +0000

[diff] [blame]

2634

if (isOpcWithIntImmediate(N->getOperand(0).getNode(), ISD::AND, Imm) &&

Nate Begeman

9f3c26c

2005-10-19 18:42:01 +0000

[diff] [blame]

2635

isRotateAndMask(N, Imm, true, SH, MB, ME)) {

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2636

SDValue Ops[] = { N->getOperand(0).getOperand(0),

Evan Cheng

2006-08-27 08:14:06 +0000

[diff] [blame]

2637

getI32Imm(SH), getI32Imm(MB), getI32Imm(ME) };

Craig Topper

2014-04-27 19:21:11 +0000

[diff] [blame]

2638

return CurDAG->SelectNodeTo(N, PPC::RLWINM, MVT::i32, Ops);

Nate Begeman

9eaa6ba

2005-10-19 01:12:32 +0000

[diff] [blame]

2639

}

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2640

Nate Begeman

9f3c26c

2005-10-19 18:42:01 +0000

[diff] [blame]

2641

// Other cases are autogenerated.

2642

break;

Nate Begeman

33acb2c

2005-08-18 23:38:00 +0000

[diff] [blame]

2643

}

2644

case ISD::SRL: {

2645

unsigned Imm, SH, MB, ME;

Gabor Greif

2008-08-28 21:40:38 +0000

[diff] [blame]

2646

if (isOpcWithIntImmediate(N->getOperand(0).getNode(), ISD::AND, Imm) &&

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2647

isRotateAndMask(N, Imm, true, SH, MB, ME)) {

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2648

SDValue Ops[] = { N->getOperand(0).getOperand(0),

Evan Cheng

2006-08-27 08:14:06 +0000

[diff] [blame]

2649

getI32Imm(SH), getI32Imm(MB), getI32Imm(ME) };

Craig Topper

2014-04-27 19:21:11 +0000

[diff] [blame]

2650

return CurDAG->SelectNodeTo(N, PPC::RLWINM, MVT::i32, Ops);

Nate Begeman

9eaa6ba

2005-10-19 01:12:32 +0000

[diff] [blame]

2651

}

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2652

Nate Begeman

9f3c26c

2005-10-19 18:42:01 +0000

[diff] [blame]

2653

// Other cases are autogenerated.

2654

break;

Nate Begeman

33acb2c

2005-08-18 23:38:00 +0000

[diff] [blame]

2655

}

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

2656

// FIXME: Remove this once the ANDI glue bug is fixed:

2657

case PPCISD::ANDIo_1_EQ_BIT:

2658

case PPCISD::ANDIo_1_GT_BIT: {

if (!ANDIGlueBug)

break;

EVT InVT = N->getOperand(0).getValueType();

2663

assert((InVT == MVT::i64 || InVT == MVT::i32) &&

2664

"Invalid input type for ANDIo_1_EQ_BIT");

2665

2666

unsigned Opcode = (InVT == MVT::i64) ? PPC::ANDIo8 : PPC::ANDIo;

2667

SDValue AndI(CurDAG->getMachineNode(Opcode, dl, InVT, MVT::Glue,

2668

N->getOperand(0),

2669

CurDAG->getTargetConstant(1, InVT)), 0);

2670

SDValue CR0Reg = CurDAG->getRegister(PPC::CR0, MVT::i32);

2671

SDValue SRIdxVal =

2672

CurDAG->getTargetConstant(N->getOpcode() == PPCISD::ANDIo_1_EQ_BIT ?

2673

PPC::sub_eq : PPC::sub_gt, MVT::i32);

2674

2675

return CurDAG->SelectNodeTo(N, TargetOpcode::EXTRACT_SUBREG, MVT::i1,

2676

CR0Reg, SRIdxVal,

2677

SDValue(AndI.getNode(), 1) /* glue */);

2678

}

Chris Lattner

bec817c

2005-08-26 18:46:49 +0000

[diff] [blame]

2679

case ISD::SELECT_CC: {

2680

ISD::CondCode CC = cast<CondCodeSDNode>(N->getOperand(4))->get();

Roman Divacky

2011-06-20 15:28:39 +0000

[diff] [blame]

2681

EVT PtrVT = CurDAG->getTargetLoweringInfo().getPointerTy();

2682

bool isPPC64 = (PtrVT == MVT::i64);

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

2683

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

2684

// If this is a select of i1 operands, we'll pattern match it.

Eric Christopher

2014-05-22 01:07:24 +0000

[diff] [blame]

2685

if (PPCSubTarget->useCRBits() &&

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

2686

N->getOperand(0).getValueType() == MVT::i1)

2687

break;

2688

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

2689

// Handle the setcc cases here. select_cc lhs, 0, 1, 0, cc

Roman Divacky

2011-06-20 15:28:39 +0000

[diff] [blame]

2690

if (!isPPC64)

2691

if (ConstantSDNode *N1C = dyn_cast<ConstantSDNode>(N->getOperand(1)))

2692

if (ConstantSDNode *N2C = dyn_cast<ConstantSDNode>(N->getOperand(2)))

2693

if (ConstantSDNode *N3C = dyn_cast<ConstantSDNode>(N->getOperand(3)))

2694

if (N1C->isNullValue() && N3C->isNullValue() &&

2695

N2C->getZExtValue() == 1ULL && CC == ISD::SETNE &&

2696

// FIXME: Implement this optzn for PPC64.

2697

N->getValueType(0) == MVT::i32) {

2698

SDNode *Tmp =

2699

CurDAG->getMachineNode(PPC::ADDIC, dl, MVT::i32, MVT::Glue,

2700

N->getOperand(0), getI32Imm(~0U));

2701

return CurDAG->SelectNodeTo(N, PPC::SUBFE, MVT::i32,

2702

SDValue(Tmp, 0), N->getOperand(0),

2703

SDValue(Tmp, 1));

2704

}

Chris Lattner

9b577f1

2005-08-26 21:23:58 +0000

[diff] [blame]

2705

Dale Johannesen

ab8e442

2009-02-06 19:16:40 +0000

[diff] [blame]

2706

SDValue CCReg = SelectCC(N->getOperand(0), N->getOperand(1), CC, dl);

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

2707

2708

if (N->getValueType(0) == MVT::i1) {

2709

// An i1 select is: (c & t) | (!c & f).

2710

bool Inv;

2711

unsigned Idx = getCRIdxForSetCC(CC, Inv);

unsigned SRI;

switch (Idx) {

default: llvm_unreachable("Invalid CC index");

2716

case 0: SRI = PPC::sub_lt; break;

2717

case 1: SRI = PPC::sub_gt; break;

2718

case 2: SRI = PPC::sub_eq; break;

2719

case 3: SRI = PPC::sub_un; break;

2720

}

2721

2722

SDValue CCBit = CurDAG->getTargetExtractSubreg(SRI, dl, MVT::i1, CCReg);

2723

2724

SDValue NotCCBit(CurDAG->getMachineNode(PPC::CRNOR, dl, MVT::i1,

2725

CCBit, CCBit), 0);

2726

SDValue C = Inv ? NotCCBit : CCBit,

2727

NotC = Inv ? CCBit : NotCCBit;

2728

2729

SDValue CAndT(CurDAG->getMachineNode(PPC::CRAND, dl, MVT::i1,

2730

C, N->getOperand(2)), 0);

2731

SDValue NotCAndF(CurDAG->getMachineNode(PPC::CRAND, dl, MVT::i1,

2732

NotC, N->getOperand(3)), 0);

2733

2734

return CurDAG->SelectNodeTo(N, PPC::CROR, MVT::i1, CAndT, NotCAndF);

2735

}

2736

Chris Lattner

2006-11-17 22:10:59 +0000

[diff] [blame]

2737

unsigned BROpc = getPredicateForSetCC(CC);

Chris Lattner

9b577f1

2005-08-26 21:23:58 +0000

[diff] [blame]

2738

Chris Lattner

d3eee1a

2005-10-01 01:35:02 +0000

[diff] [blame]

2739

unsigned SelectCCOp;

Owen Anderson

2009-08-11 20:47:22 +0000

[diff] [blame]

2740

if (N->getValueType(0) == MVT::i32)

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

2741

SelectCCOp = PPC::SELECT_CC_I4;

Owen Anderson

2009-08-11 20:47:22 +0000

[diff] [blame]

2742

else if (N->getValueType(0) == MVT::i64)

Chris Lattner

2006-06-27 00:04:13 +0000

[diff] [blame]

2743

SelectCCOp = PPC::SELECT_CC_I8;

Owen Anderson

2009-08-11 20:47:22 +0000

[diff] [blame]

2744

else if (N->getValueType(0) == MVT::f32)

Chris Lattner

d3eee1a

2005-10-01 01:35:02 +0000

[diff] [blame]

2745

SelectCCOp = PPC::SELECT_CC_F4;

Owen Anderson

2009-08-11 20:47:22 +0000

[diff] [blame]

2746

else if (N->getValueType(0) == MVT::f64)

Bill Schmidt

9c54bbd

2014-10-22 16:58:20 +0000

[diff] [blame]

2747

if (PPCSubTarget->hasVSX())

2748

SelectCCOp = PPC::SELECT_CC_VSFRC;

2749

else

2750

SelectCCOp = PPC::SELECT_CC_F8;

Hal Finkel

2015-02-25 01:06:45 +0000

[diff] [blame]

2751

else if (PPCSubTarget->hasQPX() && N->getValueType(0) == MVT::v4f64)

2752

SelectCCOp = PPC::SELECT_CC_QFRC;

2753

else if (PPCSubTarget->hasQPX() && N->getValueType(0) == MVT::v4f32)

2754

SelectCCOp = PPC::SELECT_CC_QSRC;

2755

else if (PPCSubTarget->hasQPX() && N->getValueType(0) == MVT::v4i1)

2756

SelectCCOp = PPC::SELECT_CC_QBRC;

Bill Schmidt

2014-10-22 13:13:40 +0000

[diff] [blame]

2757

else if (N->getValueType(0) == MVT::v2f64 ||

2758

N->getValueType(0) == MVT::v2i64)

2759

SelectCCOp = PPC::SELECT_CC_VSRC;

Chris Lattner

0a3d1bb

2006-04-08 22:45:08 +0000

[diff] [blame]

2760

else

2761

SelectCCOp = PPC::SELECT_CC_VRRC;

2762

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2763

SDValue Ops[] = { CCReg, N->getOperand(2), N->getOperand(3),

Evan Cheng

2006-08-27 08:14:06 +0000

[diff] [blame]

2764

getI32Imm(BROpc) };

Craig Topper

2014-04-27 19:21:11 +0000

[diff] [blame]

2765

return CurDAG->SelectNodeTo(N, SelectCCOp, N->getValueType(0), Ops);

Chris Lattner

bec817c

2005-08-26 18:46:49 +0000

[diff] [blame]

2766

}

Hal Finkel

732f0f7

2014-03-26 12:49:28 +0000

[diff] [blame]

2767

case ISD::VSELECT:

Eric Christopher

2014-05-22 01:07:24 +0000

[diff] [blame]

2768

if (PPCSubTarget->hasVSX()) {

Hal Finkel

732f0f7

2014-03-26 12:49:28 +0000

[diff] [blame]

2769

SDValue Ops[] = { N->getOperand(2), N->getOperand(1), N->getOperand(0) };

Craig Topper

2014-04-27 19:21:11 +0000

[diff] [blame]

2770

return CurDAG->SelectNodeTo(N, PPC::XXSEL, N->getValueType(0), Ops);

Hal Finkel

732f0f7

2014-03-26 12:49:28 +0000

[diff] [blame]

2771

}

2772

2773

break;

Hal Finkel

2014-03-26 22:58:37 +0000

[diff] [blame]

2774

case ISD::VECTOR_SHUFFLE:

Eric Christopher

2014-05-22 01:07:24 +0000

[diff] [blame]

2775

if (PPCSubTarget->hasVSX() && (N->getValueType(0) == MVT::v2f64 ||

Hal Finkel

2014-03-26 22:58:37 +0000

[diff] [blame]

2776

N->getValueType(0) == MVT::v2i64)) {

2777

ShuffleVectorSDNode *SVN = cast<ShuffleVectorSDNode>(N);

2778

2779

SDValue Op1 = N->getOperand(SVN->getMaskElt(0) < 2 ? 0 : 1),

2780

Op2 = N->getOperand(SVN->getMaskElt(1) < 2 ? 0 : 1);

2781

unsigned DM[2];

2782

2783

for (int i = 0; i < 2; ++i)

2784

if (SVN->getMaskElt(i) <= 0 || SVN->getMaskElt(i) == 2)

DM[i] = 0;

else

DM[i] = 1;

Bill Schmidt

2014-12-09 16:52:29 +0000

[diff] [blame]

2789

// For little endian, we must swap the input operands and adjust

2790

// the mask elements (reverse and invert them).

2791

if (PPCSubTarget->isLittleEndian()) {

2792

std::swap(Op1, Op2);

2793

unsigned tmp = DM[0];

DM[0] = 1 - DM[1];

DM[1] = 1 - tmp;

}

Hal Finkel

2014-03-28 20:24:55 +0000

[diff] [blame]

2798

SDValue DMV = CurDAG->getTargetConstant(DM[1] | (DM[0] << 1), MVT::i32);

Hal Finkel

2014-03-26 22:58:37 +0000

[diff] [blame]

2799

2800

if (Op1 == Op2 && DM[0] == 0 && DM[1] == 0 &&

2801

Op1.getOpcode() == ISD::SCALAR_TO_VECTOR &&

2802

isa<LoadSDNode>(Op1.getOperand(0))) {

2803

LoadSDNode *LD = cast<LoadSDNode>(Op1.getOperand(0));

2804

SDValue Base, Offset;

2805

2806

if (LD->isUnindexed() &&

2807

SelectAddrIdxOnly(LD->getBasePtr(), Base, Offset)) {

2808

SDValue Chain = LD->getChain();

2809

SDValue Ops[] = { Base, Offset, Chain };

2810

return CurDAG->SelectNodeTo(N, PPC::LXVDSX,

Craig Topper

2014-04-27 19:21:11 +0000

[diff] [blame]

2811

N->getValueType(0), Ops);

Hal Finkel

2014-03-26 22:58:37 +0000

[diff] [blame]

}

}

SDValue Ops[] = { Op1, Op2, DMV };

Craig Topper

2014-04-27 19:21:11 +0000

[diff] [blame]

2816

return CurDAG->SelectNodeTo(N, PPC::XXPERMDI, N->getValueType(0), Ops);

Hal Finkel

2014-03-26 22:58:37 +0000

[diff] [blame]

2817

}

2818

2819

break;

Hal Finkel

25c1992

2013-05-15 21:37:41 +0000

[diff] [blame]

2820

case PPCISD::BDNZ:

2821

case PPCISD::BDZ: {

Eric Christopher

2014-05-22 01:07:24 +0000

[diff] [blame]

2822

bool IsPPC64 = PPCSubTarget->isPPC64();

Hal Finkel

25c1992

2013-05-15 21:37:41 +0000

[diff] [blame]

2823

SDValue Ops[] = { N->getOperand(1), N->getOperand(0) };

2824

return CurDAG->SelectNodeTo(N, N->getOpcode() == PPCISD::BDNZ ?

2825

(IsPPC64 ? PPC::BDNZ8 : PPC::BDNZ) :

2826

(IsPPC64 ? PPC::BDZ8 : PPC::BDZ),

Craig Topper

2014-04-27 19:21:11 +0000

[diff] [blame]

2827

MVT::Other, Ops);

Hal Finkel

25c1992

2013-05-15 21:37:41 +0000

[diff] [blame]

2828

}

Chris Lattner

2006-11-17 22:37:34 +0000

[diff] [blame]

2829

case PPCISD::COND_BRANCH: {

Dan Gohman

7a638a8

2008-11-05 17:16:24 +0000

[diff] [blame]

2830

// Op #0 is the Chain.

Chris Lattner

2006-11-17 22:37:34 +0000

[diff] [blame]

2831

// Op #1 is the PPC::PRED_* number.

2832

// Op #2 is the CR#

2833

// Op #3 is the Dest MBB

Dan Gohman

f14b77e

2008-11-05 04:14:16 +0000

[diff] [blame]

2834

// Op #4 is the Flag.

Evan Cheng

58d1eac

2007-06-29 01:25:06 +0000

[diff] [blame]

2835

// Prevent PPC::PRED_* from being selected into LI.

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2836

SDValue Pred =

Dan Gohman

2008-09-12 16:56:44 +0000

[diff] [blame]

2837

getI32Imm(cast<ConstantSDNode>(N->getOperand(1))->getZExtValue());

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2838

SDValue Ops[] = { Pred, N->getOperand(2), N->getOperand(3),

Chris Lattner

2006-11-17 22:37:34 +0000

[diff] [blame]

2839

N->getOperand(0), N->getOperand(4) };

Craig Topper

2014-04-27 19:21:11 +0000

[diff] [blame]

2840

return CurDAG->SelectNodeTo(N, PPC::BCC, MVT::Other, Ops);

Chris Lattner

2006-11-17 22:37:34 +0000

[diff] [blame]

2841

}

Nate Begeman

bb01d4f

2006-03-17 01:40:33 +0000

[diff] [blame]

2842

case ISD::BR_CC: {

Chris Lattner

2005-08-21 18:50:37 +0000

[diff] [blame]

2843

ISD::CondCode CC = cast<CondCodeSDNode>(N->getOperand(1))->get();

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

2844

unsigned PCC = getPredicateForSetCC(CC);

2845

2846

if (N->getOperand(2).getValueType() == MVT::i1) {

unsigned Opc;

bool Swap;

switch (PCC) {

default: llvm_unreachable("Unexpected Boolean-operand predicate");

2851

case PPC::PRED_LT: Opc = PPC::CRANDC; Swap = true; break;

2852

case PPC::PRED_LE: Opc = PPC::CRORC; Swap = true; break;

2853

case PPC::PRED_EQ: Opc = PPC::CREQV; Swap = false; break;

2854

case PPC::PRED_GE: Opc = PPC::CRORC; Swap = false; break;

2855

case PPC::PRED_GT: Opc = PPC::CRANDC; Swap = false; break;

2856

case PPC::PRED_NE: Opc = PPC::CRXOR; Swap = false; break;

2857

}

2858

2859

SDValue BitComp(CurDAG->getMachineNode(Opc, dl, MVT::i1,

2860

N->getOperand(Swap ? 3 : 2),

2861

N->getOperand(Swap ? 2 : 3)), 0);

2862

return CurDAG->SelectNodeTo(N, PPC::BC, MVT::Other,

2863

BitComp, N->getOperand(4), N->getOperand(0));

2864

}

2865

Dale Johannesen

ab8e442

2009-02-06 19:16:40 +0000

[diff] [blame]

2866

SDValue CondCode = SelectCC(N->getOperand(2), N->getOperand(3), CC, dl);

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

2867

SDValue Ops[] = { getI32Imm(PCC), CondCode,

Evan Cheng

2006-08-27 08:14:06 +0000

[diff] [blame]

2868

N->getOperand(4), N->getOperand(0) };

Craig Topper

2014-04-27 19:21:11 +0000

[diff] [blame]

2869

return CurDAG->SelectNodeTo(N, PPC::BCC, MVT::Other, Ops);

Chris Lattner

2005-08-21 18:50:37 +0000

[diff] [blame]

2870

}

Nate Begeman

4ca2ea5

2006-04-22 18:53:45 +0000

[diff] [blame]

2871

case ISD::BRIND: {

Chris Lattner

b055c87

2006-06-10 01:15:02 +0000

[diff] [blame]

2872

// FIXME: Should custom lower this.

Dan Gohman

2008-07-27 21:46:04 +0000

[diff] [blame]

2873

SDValue Chain = N->getOperand(0);

2874

SDValue Target = N->getOperand(1);

Owen Anderson

2009-08-11 20:47:22 +0000

[diff] [blame]

2875

unsigned Opc = Target.getValueType() == MVT::i32 ? PPC::MTCTR : PPC::MTCTR8;

Roman Divacky

a4a59ae

2011-06-03 15:47:49 +0000

[diff] [blame]

2876

unsigned Reg = Target.getValueType() == MVT::i32 ? PPC::BCTR : PPC::BCTR8;

Hal Finkel

528ff4b

2011-12-08 04:36:44 +0000

[diff] [blame]

2877

Chain = SDValue(CurDAG->getMachineNode(Opc, dl, MVT::Glue, Target,

Dan Gohman

2009-09-25 18:54:59 +0000

[diff] [blame]

2878

Chain), 0);

Roman Divacky

a4a59ae

2011-06-03 15:47:49 +0000

[diff] [blame]

2879

return CurDAG->SelectNodeTo(N, Reg, MVT::Other, Chain);

Nate Begeman

4ca2ea5

2006-04-22 18:53:45 +0000

[diff] [blame]

2880

}

Bill Schmidt

2012-11-27 17:35:46 +0000

[diff] [blame]

2881

case PPCISD::TOC_ENTRY: {

Justin Hibbits

2014-11-12 15:16:30 +0000

[diff] [blame]

2882

assert ((PPCSubTarget->isPPC64() || PPCSubTarget->isSVR4ABI()) &&

2883

"Only supported for 64-bit ABI and 32-bit SVR4");

Hal Finkel

2014-07-18 23:29:49 +0000

[diff] [blame]

2884

if (PPCSubTarget->isSVR4ABI() && !PPCSubTarget->isPPC64()) {

2885

SDValue GA = N->getOperand(0);

Hal Finkel

2015-02-25 21:36:59 +0000

[diff] [blame]

2886

return transferMemOperands(N, CurDAG->getMachineNode(PPC::LWZtoc, dl,

2887

MVT::i32, GA, N->getOperand(1)));

Justin Hibbits

3476db4

2014-08-28 04:40:55 +0000

[diff] [blame]

2888

}

Bill Schmidt

2012-11-27 17:35:46 +0000

[diff] [blame]

2889

Bill Schmidt

2791778

2013-02-21 17:12:27 +0000

[diff] [blame]

2890

// For medium and large code model, we generate two instructions as

2891

// described below. Otherwise we allow SelectCodeCommon to handle this,

Ulrich Weigand

c8c2ea2

2014-10-31 10:33:14 +0000

[diff] [blame]

2892

// selecting one of LDtoc, LDtocJTI, LDtocCPT, and LDtocBA.

Bill Schmidt

2791778

2013-02-21 17:12:27 +0000

[diff] [blame]

2893

CodeModel::Model CModel = TM.getCodeModel();

2894

if (CModel != CodeModel::Medium && CModel != CodeModel::Large)

Bill Schmidt

2012-11-27 17:35:46 +0000

[diff] [blame]

2895

break;

2896

Bill Schmidt

5d82f09

2014-06-16 21:36:02 +0000

[diff] [blame]

2897

// The first source operand is a TargetGlobalAddress or a TargetJumpTable.

2898

// If it is an externally defined symbol, a symbol with common linkage,

2899

// a non-local function address, or a jump table address, or if we are

2900

// generating code for large code model, we generate:

Bill Schmidt

2012-11-27 17:35:46 +0000

[diff] [blame]

2901

// LDtocL(<ga:@sym>, ADDIStocHA(%X2, <ga:@sym>))

2902

// Otherwise we generate:

2903

// ADDItocL(ADDIStocHA(%X2, <ga:@sym>), <ga:@sym>)

2904

SDValue GA = N->getOperand(0);

2905

SDValue TOCbase = N->getOperand(1);

2906

SDNode *Tmp = CurDAG->getMachineNode(PPC::ADDIStocHA, dl, MVT::i64,

Hal Finkel

2015-02-25 21:36:59 +0000

[diff] [blame]

2907

TOCbase, GA);

Bill Schmidt

2012-11-27 17:35:46 +0000

[diff] [blame]

2908

Ulrich Weigand

c8c2ea2

2014-10-31 10:33:14 +0000

[diff] [blame]

2909

if (isa<JumpTableSDNode>(GA) || isa<BlockAddressSDNode>(GA) ||

2910

CModel == CodeModel::Large)

Hal Finkel

2015-02-25 21:36:59 +0000

[diff] [blame]

2911

return transferMemOperands(N, CurDAG->getMachineNode(PPC::LDtocL, dl,

2912

MVT::i64, GA, SDValue(Tmp, 0)));

Bill Schmidt

2012-11-27 17:35:46 +0000

[diff] [blame]

2913

2914

if (GlobalAddressSDNode *G = dyn_cast<GlobalAddressSDNode>(GA)) {

2915

const GlobalValue *GValue = G->getGlobal();

Bill Schmidt

5d82f09

2014-06-16 21:36:02 +0000

[diff] [blame]

2916

if ((GValue->getType()->getElementType()->isFunctionTy() &&

2917

(GValue->isDeclaration() || GValue->isWeakForLinker())) ||

Rafael Espindola

0490286

2014-05-29 15:41:38 +0000

[diff] [blame]

2918

GValue->isDeclaration() || GValue->hasCommonLinkage() ||

2919

GValue->hasAvailableExternallyLinkage())

Hal Finkel

2015-02-25 21:36:59 +0000

[diff] [blame]

2920

return transferMemOperands(N, CurDAG->getMachineNode(PPC::LDtocL, dl,

2921

MVT::i64, GA, SDValue(Tmp, 0)));

Bill Schmidt

2012-11-27 17:35:46 +0000

[diff] [blame]

2922

}

2923

2924

return CurDAG->getMachineNode(PPC::ADDItocL, dl, MVT::i64,

2925

SDValue(Tmp, 0), GA);

2926

}

Hal Finkel

7c8ae53

2014-07-25 17:47:22 +0000

[diff] [blame]

2927

case PPCISD::PPC32_PICGOT: {

2928

// Generate a PIC-safe GOT reference.

2929

assert(!PPCSubTarget->isPPC64() && PPCSubTarget->isSVR4ABI() &&

2930

"PPCISD::PPC32_PICGOT is only supported for 32-bit SVR4");

2931

return CurDAG->SelectNodeTo(N, PPC::PPC32PICGOT, PPCLowering->getPointerTy(), MVT::i32);

2932

}

Bill Schmidt

2013-02-20 15:50:31 +0000

[diff] [blame]

2933

case PPCISD::VADD_SPLAT: {

Bill Schmidt

2013-02-20 20:41:42 +0000

[diff] [blame]

2934

// This expands into one of three sequences, depending on whether

2935

// the first operand is odd or even, positive or negative.

Bill Schmidt

2013-02-20 15:50:31 +0000

[diff] [blame]

2936

assert(isa<ConstantSDNode>(N->getOperand(0)) &&

2937

isa<ConstantSDNode>(N->getOperand(1)) &&

2938

"Invalid operand on VADD_SPLAT!");

Bill Schmidt

2013-02-20 20:41:42 +0000

[diff] [blame]

2939

2940

int Elt = N->getConstantOperandVal(0);

Bill Schmidt

2013-02-20 15:50:31 +0000

[diff] [blame]

2941

int EltSize = N->getConstantOperandVal(1);

Bill Schmidt

2013-02-20 20:41:42 +0000

[diff] [blame]

2942

unsigned Opc1, Opc2, Opc3;

Bill Schmidt

2013-02-20 15:50:31 +0000

[diff] [blame]

2943

EVT VT;

Bill Schmidt

2013-02-20 20:41:42 +0000

[diff] [blame]

2944

Bill Schmidt

2013-02-20 15:50:31 +0000

[diff] [blame]

2945

if (EltSize == 1) {

2946

Opc1 = PPC::VSPLTISB;

2947

Opc2 = PPC::VADDUBM;

Bill Schmidt

2013-02-20 20:41:42 +0000

[diff] [blame]

2948

Opc3 = PPC::VSUBUBM;

Bill Schmidt

2013-02-20 15:50:31 +0000

[diff] [blame]

2949

VT = MVT::v16i8;

2950

} else if (EltSize == 2) {

2951

Opc1 = PPC::VSPLTISH;

2952

Opc2 = PPC::VADDUHM;

Bill Schmidt

2013-02-20 20:41:42 +0000

[diff] [blame]

2953

Opc3 = PPC::VSUBUHM;

Bill Schmidt

2013-02-20 15:50:31 +0000

[diff] [blame]

2954

VT = MVT::v8i16;

2955

} else {

2956

assert(EltSize == 4 && "Invalid element size on VADD_SPLAT!");

2957

Opc1 = PPC::VSPLTISW;

2958

Opc2 = PPC::VADDUWM;

Bill Schmidt

2013-02-20 20:41:42 +0000

[diff] [blame]

2959

Opc3 = PPC::VSUBUWM;

Bill Schmidt

2013-02-20 15:50:31 +0000

[diff] [blame]

2960

VT = MVT::v4i32;

2961

}

Bill Schmidt

2013-02-20 20:41:42 +0000

[diff] [blame]

2962

2963

if ((Elt & 1) == 0) {

2964

// Elt is even, in the range [-32,-18] + [16,30].

2965

//

2966

// Convert: VADD_SPLAT elt, size

2967

// Into: tmp = VSPLTIS[BHW] elt

2968

// VADDU[BHW]M tmp, tmp

2969

// Where: [BHW] = B for size = 1, H for size = 2, W for size = 4

2970

SDValue EltVal = getI32Imm(Elt >> 1);

2971

SDNode *Tmp = CurDAG->getMachineNode(Opc1, dl, VT, EltVal);

2972

SDValue TmpVal = SDValue(Tmp, 0);

2973

return CurDAG->getMachineNode(Opc2, dl, VT, TmpVal, TmpVal);

2974

2975

} else if (Elt > 0) {

2976

// Elt is odd and positive, in the range [17,31].

2977

//

2978

// Convert: VADD_SPLAT elt, size

2979

// Into: tmp1 = VSPLTIS[BHW] elt-16

2980

// tmp2 = VSPLTIS[BHW] -16

2981

// VSUBU[BHW]M tmp1, tmp2

2982

SDValue EltVal = getI32Imm(Elt - 16);

2983

SDNode *Tmp1 = CurDAG->getMachineNode(Opc1, dl, VT, EltVal);

2984

EltVal = getI32Imm(-16);

2985

SDNode *Tmp2 = CurDAG->getMachineNode(Opc1, dl, VT, EltVal);

2986

return CurDAG->getMachineNode(Opc3, dl, VT, SDValue(Tmp1, 0),

SDValue(Tmp2, 0));

} else {

// Elt is odd and negative, in the range [-31,-17].

2991

//

2992

// Convert: VADD_SPLAT elt, size

2993

// Into: tmp1 = VSPLTIS[BHW] elt+16

2994

// tmp2 = VSPLTIS[BHW] -16

2995

// VADDU[BHW]M tmp1, tmp2

2996

SDValue EltVal = getI32Imm(Elt + 16);

2997

SDNode *Tmp1 = CurDAG->getMachineNode(Opc1, dl, VT, EltVal);

2998

EltVal = getI32Imm(-16);

2999

SDNode *Tmp2 = CurDAG->getMachineNode(Opc1, dl, VT, EltVal);

3000

return CurDAG->getMachineNode(Opc2, dl, VT, SDValue(Tmp1, 0),

3001

SDValue(Tmp2, 0));

3002

}

Bill Schmidt

2013-02-20 15:50:31 +0000

[diff] [blame]

3003

}

Chris Lattner

2005-08-17 19:33:03 +0000

[diff] [blame]

3004

}

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

3005

Dan Gohman

2010-01-05 01:24:18 +0000

[diff] [blame]

3006

return SelectCode(N);

Chris Lattner

2005-08-17 19:33:03 +0000

[diff] [blame]

3007

}

3008

Hal Finkel

2015-01-03 01:16:37 +0000

[diff] [blame]

3009

// If the target supports the cmpb instruction, do the idiom recognition here.

3010

// We don't do this as a DAG combine because we don't want to do it as nodes

3011

// are being combined (because we might miss part of the eventual idiom). We

3012

// don't want to do it during instruction selection because we want to reuse

3013

// the logic for lowering the masking operations already part of the

3014

// instruction selector.

3015

SDValue PPCDAGToDAGISel::combineToCMPB(SDNode *N) {

3016

SDLoc dl(N);

3017

3018

assert(N->getOpcode() == ISD::OR &&

3019

"Only OR nodes are supported for CMPB");

3020

3021

SDValue Res;

3022

if (!PPCSubTarget->hasCMPB())

3023

return Res;

3024

3025

if (N->getValueType(0) != MVT::i32 &&

3026

N->getValueType(0) != MVT::i64)

3027

return Res;

3028

3029

EVT VT = N->getValueType(0);

3030

3031

SDValue RHS, LHS;

3032

bool BytesFound[8] = { 0, 0, 0, 0, 0, 0, 0, 0 };

3033

uint64_t Mask = 0, Alt = 0;

3034

3035

auto IsByteSelectCC = [this](SDValue O, unsigned &b,

3036

uint64_t &Mask, uint64_t &Alt,

3037

SDValue &LHS, SDValue &RHS) {

3038

if (O.getOpcode() != ISD::SELECT_CC)

3039

return false;

3040

ISD::CondCode CC = cast<CondCodeSDNode>(O.getOperand(4))->get();

3041

3042

if (!isa<ConstantSDNode>(O.getOperand(2)) ||

3043

!isa<ConstantSDNode>(O.getOperand(3)))

3044

return false;

3045

3046

uint64_t PM = O.getConstantOperandVal(2);

3047

uint64_t PAlt = O.getConstantOperandVal(3);

3048

for (b = 0; b < 8; ++b) {

3049

uint64_t Mask = UINT64_C(0xFF) << (8*b);

3050

if (PM && (PM & Mask) == PM && (PAlt & Mask) == PAlt)

break;

}

if (b == 8)

return false;

Mask |= PM;

Alt |= PAlt;

if (!isa<ConstantSDNode>(O.getOperand(1)) ||

3060

O.getConstantOperandVal(1) != 0) {

3061

SDValue Op0 = O.getOperand(0), Op1 = O.getOperand(1);

3062

if (Op0.getOpcode() == ISD::TRUNCATE)

3063

Op0 = Op0.getOperand(0);

3064

if (Op1.getOpcode() == ISD::TRUNCATE)

3065

Op1 = Op1.getOperand(0);

3066

3067

if (Op0.getOpcode() == ISD::SRL && Op1.getOpcode() == ISD::SRL &&

3068

Op0.getOperand(1) == Op1.getOperand(1) && CC == ISD::SETEQ &&

3069

isa<ConstantSDNode>(Op0.getOperand(1))) {

3070

3071

unsigned Bits = Op0.getValueType().getSizeInBits();

3072

if (b != Bits/8-1)

3073

return false;

3074

if (Op0.getConstantOperandVal(1) != Bits-8)

3075

return false;

3076

3077

LHS = Op0.getOperand(0);

3078

RHS = Op1.getOperand(0);

return true;

}

// When we have small integers (i16 to be specific), the form present

3083

// post-legalization uses SETULT in the SELECT_CC for the

3084

// higher-order byte, depending on the fact that the

3085

// even-higher-order bytes are known to all be zero, for example:

3086

// select_cc (xor $lhs, $rhs), 256, 65280, 0, setult

3087

// (so when the second byte is the same, because all higher-order

3088

// bits from bytes 3 and 4 are known to be zero, the result of the

3089

// xor can be at most 255)

3090

if (Op0.getOpcode() == ISD::XOR && CC == ISD::SETULT &&

3091

isa<ConstantSDNode>(O.getOperand(1))) {

3092

3093

uint64_t ULim = O.getConstantOperandVal(1);

3094

if (ULim != (UINT64_C(1) << b*8))

3095

return false;

3096

3097

// Now we need to make sure that the upper bytes are known to be

3098

// zero.

3099

unsigned Bits = Op0.getValueType().getSizeInBits();

3100

if (!CurDAG->MaskedValueIsZero(Op0,

3101

APInt::getHighBitsSet(Bits, Bits - (b+1)*8)))

3102

return false;

3103

3104

LHS = Op0.getOperand(0);

3105

RHS = Op0.getOperand(1);

return true;

}

return false;

}

if (CC != ISD::SETEQ)

3113

return false;

3114

3115

SDValue Op = O.getOperand(0);

3116

if (Op.getOpcode() == ISD::AND) {

3117

if (!isa<ConstantSDNode>(Op.getOperand(1)))

3118

return false;

3119

if (Op.getConstantOperandVal(1) != (UINT64_C(0xFF) << (8*b)))

3120

return false;

3121

3122

SDValue XOR = Op.getOperand(0);

3123

if (XOR.getOpcode() == ISD::TRUNCATE)

3124

XOR = XOR.getOperand(0);

3125

if (XOR.getOpcode() != ISD::XOR)

3126

return false;

3127

3128

LHS = XOR.getOperand(0);

3129

RHS = XOR.getOperand(1);

3130

return true;

3131

} else if (Op.getOpcode() == ISD::SRL) {

3132

if (!isa<ConstantSDNode>(Op.getOperand(1)))

3133

return false;

3134

unsigned Bits = Op.getValueType().getSizeInBits();

3135

if (b != Bits/8-1)

3136

return false;

3137

if (Op.getConstantOperandVal(1) != Bits-8)

3138

return false;

3139

3140

SDValue XOR = Op.getOperand(0);

3141

if (XOR.getOpcode() == ISD::TRUNCATE)

3142

XOR = XOR.getOperand(0);

3143

if (XOR.getOpcode() != ISD::XOR)

3144

return false;

3145

3146

LHS = XOR.getOperand(0);

3147

RHS = XOR.getOperand(1);

return true;

}

return false;

};

SmallVector<SDValue, 8> Queue(1, SDValue(N, 0));

3155

while (!Queue.empty()) {

3156

SDValue V = Queue.pop_back_val();

3157

3158

for (const SDValue &O : V.getNode()->ops()) {

3159

unsigned b;

3160

uint64_t M = 0, A = 0;

3161

SDValue OLHS, ORHS;

3162

if (O.getOpcode() == ISD::OR) {

3163

Queue.push_back(O);

3164

} else if (IsByteSelectCC(O, b, M, A, OLHS, ORHS)) {

if (!LHS) {

LHS = OLHS;

RHS = ORHS;

BytesFound[b] = true;

3169

Mask |= M;

3170

Alt |= A;

3171

} else if ((LHS == ORHS && RHS == OLHS) ||

3172

(RHS == ORHS && LHS == OLHS)) {

3173

BytesFound[b] = true;

Mask |= M;

Alt |= A;

} else {

return Res;

}

} else {

return Res;

}

}

}

unsigned LastB = 0, BCnt = 0;

3186

for (unsigned i = 0; i < 8; ++i)

3187

if (BytesFound[LastB]) {

++BCnt;

LastB = i;

}

if (!LastB || BCnt < 2)

3193

return Res;

3194

3195

// Because we'll be zero-extending the output anyway if don't have a specific

3196

// value for each input byte (via the Mask), we can 'anyext' the inputs.

3197

if (LHS.getValueType() != VT) {

3198

LHS = CurDAG->getAnyExtOrTrunc(LHS, dl, VT);

3199

RHS = CurDAG->getAnyExtOrTrunc(RHS, dl, VT);

3200

}

3201

3202

Res = CurDAG->getNode(PPCISD::CMPB, dl, VT, LHS, RHS);

3203

3204

bool NonTrivialMask = ((int64_t) Mask) != INT64_C(-1);

3205

if (NonTrivialMask && !Alt) {

3206

// Res = Mask & CMPB

3207

Res = CurDAG->getNode(ISD::AND, dl, VT, Res, CurDAG->getConstant(Mask, VT));

3208

} else if (Alt) {

3209

// Res = (CMPB & Mask) | (~CMPB & Alt)

3210

// Which, as suggested here:

3211

// https://graphics.stanford.edu/~seander/bithacks.html#MaskedMerge

3212

// can be written as:

3213

// Res = Alt ^ ((Alt ^ Mask) & CMPB)

3214

// useful because the (Alt ^ Mask) can be pre-computed.

3215

Res = CurDAG->getNode(ISD::AND, dl, VT, Res,

3216

CurDAG->getConstant(Mask ^ Alt, VT));

3217

Res = CurDAG->getNode(ISD::XOR, dl, VT, Res, CurDAG->getConstant(Alt, VT));

}

return Res;

}

Hal Finkel

2015-01-05 21:10:24 +0000

[diff] [blame]

3223

// When CR bit registers are enabled, an extension of an i1 variable to a i32

3224

// or i64 value is lowered in terms of a SELECT_I[48] operation, and thus

3225

// involves constant materialization of a 0 or a 1 or both. If the result of

3226

// the extension is then operated upon by some operator that can be constant

3227

// folded with a constant 0 or 1, and that constant can be materialized using

3228

// only one instruction (like a zero or one), then we should fold in those

3229

// operations with the select.

3230

void PPCDAGToDAGISel::foldBoolExts(SDValue &Res, SDNode *&N) {

3231

if (!PPCSubTarget->useCRBits())

3232

return;

3233

3234

if (N->getOpcode() != ISD::ZERO_EXTEND &&

3235

N->getOpcode() != ISD::SIGN_EXTEND &&

3236

N->getOpcode() != ISD::ANY_EXTEND)

3237

return;

3238

3239

if (N->getOperand(0).getValueType() != MVT::i1)

return;

if (!N->hasOneUse())

return;

SDLoc dl(N);

EVT VT = N->getValueType(0);

3247

SDValue Cond = N->getOperand(0);

3248

SDValue ConstTrue =

3249

CurDAG->getConstant(N->getOpcode() == ISD::SIGN_EXTEND ? -1 : 1, VT);

3250

SDValue ConstFalse = CurDAG->getConstant(0, VT);

3251

3252

do {

3253

SDNode *User = *N->use_begin();

3254

if (User->getNumOperands() != 2)

3255

break;

3256

3257

auto TryFold = [this, N, User](SDValue Val) {

3258

SDValue UserO0 = User->getOperand(0), UserO1 = User->getOperand(1);

3259

SDValue O0 = UserO0.getNode() == N ? Val : UserO0;

3260

SDValue O1 = UserO1.getNode() == N ? Val : UserO1;

3261

3262

return CurDAG->FoldConstantArithmetic(User->getOpcode(),

3263

User->getValueType(0),

3264

O0.getNode(), O1.getNode());

3265

};

3266

3267

SDValue TrueRes = TryFold(ConstTrue);

3268

if (!TrueRes)

3269

break;

3270

SDValue FalseRes = TryFold(ConstFalse);

if (!FalseRes)

break;

// For us to materialize these using one instruction, we must be able to

3275

// represent them as signed 16-bit integers.

3276

uint64_t True = cast<ConstantSDNode>(TrueRes)->getZExtValue(),

3277

False = cast<ConstantSDNode>(FalseRes)->getZExtValue();

3278

if (!isInt<16>(True) || !isInt<16>(False))

3279

break;

3280

3281

// We can replace User with a new SELECT node, and try again to see if we

3282

// can fold the select with its user.

3283

Res = CurDAG->getSelect(dl, User->getValueType(0), Cond, TrueRes, FalseRes);

3284

N = User;

3285

ConstTrue = TrueRes;

3286

ConstFalse = FalseRes;

3287

} while (N->hasOneUse());

3288

}

3289

Hal Finkel

2015-01-03 01:16:37 +0000

[diff] [blame]

3290

void PPCDAGToDAGISel::PreprocessISelDAG() {

3291

SelectionDAG::allnodes_iterator Position(CurDAG->getRoot().getNode());

3292

++Position;

3293

3294

bool MadeChange = false;

3295

while (Position != CurDAG->allnodes_begin()) {

3296

SDNode *N = --Position;

if (N->use_empty())

continue;

SDValue Res;

switch (N->getOpcode()) {

3302

default: break;

3303

case ISD::OR:

3304

Res = combineToCMPB(N);

break;

}

Hal Finkel

2015-01-05 21:10:24 +0000

[diff] [blame]

3308

if (!Res)

3309

foldBoolExts(Res, N);

3310

Hal Finkel

2015-01-03 01:16:37 +0000

[diff] [blame]

3311

if (Res) {

3312

DEBUG(dbgs() << "PPC DAG preprocessing replacing:\nOld: ");

3313

DEBUG(N->dump(CurDAG));

3314

DEBUG(dbgs() << "\nNew: ");

3315

DEBUG(Res.getNode()->dump(CurDAG));

3316

DEBUG(dbgs() << "\n");

3317

3318

CurDAG->ReplaceAllUsesOfValueWith(SDValue(N, 0), Res);

MadeChange = true;

}

}

if (MadeChange)

CurDAG->RemoveDeadNodes();

3325

}

3326

Hal Finkel

860fa90

2014-01-02 22:09:39 +0000

[diff] [blame]

3327

/// PostprocessISelDAG - Perform some late peephole optimizations

Bill Schmidt

2013-02-21 00:38:25 +0000

[diff] [blame]

3328

/// on the DAG representation.

3329

void PPCDAGToDAGISel::PostprocessISelDAG() {

3330

3331

// Skip peepholes at -O0.

3332

if (TM.getOptLevel() == CodeGenOpt::None)

3333

return;

3334

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

3335

PeepholePPC64();

Eric Christopher

02e1804

2014-05-14 00:31:15 +0000

[diff] [blame]

3336

PeepholeCROps();

Hal Finkel

2014-12-12 23:59:36 +0000

[diff] [blame]

3337

PeepholePPC64ZExt();

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

3338

}

3339

Hal Finkel

2014-02-28 06:11:16 +0000

[diff] [blame]

3340

// Check if all users of this node will become isel where the second operand

3341

// is the constant zero. If this is so, and if we can negate the condition,

3342

// then we can flip the true and false operands. This will allow the zero to

3343

// be folded with the isel so that we don't need to materialize a register

3344

// containing zero.

3345

bool PPCDAGToDAGISel::AllUsersSelectZero(SDNode *N) {

3346

// If we're not using isel, then this does not matter.

Eric Christopher

2014-05-22 01:07:24 +0000

[diff] [blame]

3347

if (!PPCSubTarget->hasISEL())

Hal Finkel

2014-02-28 06:11:16 +0000

[diff] [blame]

3348

return false;

3349

3350

for (SDNode::use_iterator UI = N->use_begin(), UE = N->use_end();

3351

UI != UE; ++UI) {

3352

SDNode *User = *UI;

3353

if (!User->isMachineOpcode())

3354

return false;

3355

if (User->getMachineOpcode() != PPC::SELECT_I4 &&

3356

User->getMachineOpcode() != PPC::SELECT_I8)

3357

return false;

3358

3359

SDNode *Op2 = User->getOperand(2).getNode();

3360

if (!Op2->isMachineOpcode())

3361

return false;

3362

3363

if (Op2->getMachineOpcode() != PPC::LI &&

3364

Op2->getMachineOpcode() != PPC::LI8)

3365

return false;

3366

3367

ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op2->getOperand(0));

if (!C)

return false;

if (!C->isNullValue())

return false;

}

return true;

}

void PPCDAGToDAGISel::SwapAllSelectUsers(SDNode *N) {

3379

SmallVector<SDNode *, 4> ToReplace;

3380

for (SDNode::use_iterator UI = N->use_begin(), UE = N->use_end();

3381

UI != UE; ++UI) {

3382

SDNode *User = *UI;

3383

assert((User->getMachineOpcode() == PPC::SELECT_I4 ||

3384

User->getMachineOpcode() == PPC::SELECT_I8) &&

3385

"Must have all select users");

3386

ToReplace.push_back(User);

3387

}

3388

3389

for (SmallVector<SDNode *, 4>::iterator UI = ToReplace.begin(),

3390

UE = ToReplace.end(); UI != UE; ++UI) {

3391

SDNode *User = *UI;

3392

SDNode *ResNode =

3393

CurDAG->getMachineNode(User->getMachineOpcode(), SDLoc(User),

3394

User->getValueType(0), User->getOperand(0),

3395

User->getOperand(2),

3396

User->getOperand(1));

3397

3398

DEBUG(dbgs() << "CR Peephole replacing:\nOld: ");

3399

DEBUG(User->dump(CurDAG));

3400

DEBUG(dbgs() << "\nNew: ");

3401

DEBUG(ResNode->dump(CurDAG));

3402

DEBUG(dbgs() << "\n");

3403

3404

ReplaceUses(User, ResNode);

}

}

Eric Christopher

2014-05-14 00:31:15 +0000

[diff] [blame]

3408

void PPCDAGToDAGISel::PeepholeCROps() {

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

bool IsModified;

do {

IsModified = false;

for (SelectionDAG::allnodes_iterator I = CurDAG->allnodes_begin(),

3413

E = CurDAG->allnodes_end(); I != E; ++I) {

3414

MachineSDNode *MachineNode = dyn_cast<MachineSDNode>(I);

3415

if (!MachineNode || MachineNode->use_empty())

3416

continue;

3417

SDNode *ResNode = MachineNode;

3418

3419

bool Op1Set = false, Op1Unset = false,

3420

Op1Not = false,

3421

Op2Set = false, Op2Unset = false,

3422

Op2Not = false;

3423

3424

unsigned Opcode = MachineNode->getMachineOpcode();

switch (Opcode) {

default: break;

case PPC::CRAND:

case PPC::CRNAND:

case PPC::CROR:

case PPC::CRXOR:

case PPC::CRNOR:

case PPC::CREQV:

case PPC::CRANDC:

case PPC::CRORC: {

SDValue Op = MachineNode->getOperand(1);

3436

if (Op.isMachineOpcode()) {

3437

if (Op.getMachineOpcode() == PPC::CRSET)

3438

Op2Set = true;

3439

else if (Op.getMachineOpcode() == PPC::CRUNSET)

3440

Op2Unset = true;

3441

else if (Op.getMachineOpcode() == PPC::CRNOR &&

3442

Op.getOperand(0) == Op.getOperand(1))

Op2Not = true;

}

} // fallthrough

case PPC::BC:

case PPC::BCn:

case PPC::SELECT_I4:

case PPC::SELECT_I8:

case PPC::SELECT_F4:

case PPC::SELECT_F8:

Hal Finkel

2015-02-25 01:06:45 +0000

[diff] [blame]

3452

case PPC::SELECT_QFRC:

3453

case PPC::SELECT_QSRC:

3454

case PPC::SELECT_QBRC:

Bill Schmidt

2014-10-22 13:13:40 +0000

[diff] [blame]

3455

case PPC::SELECT_VRRC:

Bill Schmidt

9c54bbd

2014-10-22 16:58:20 +0000

[diff] [blame]

3456

case PPC::SELECT_VSFRC:

Bill Schmidt

2014-10-22 13:13:40 +0000

[diff] [blame]

3457

case PPC::SELECT_VSRC: {

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

3458

SDValue Op = MachineNode->getOperand(0);

3459

if (Op.isMachineOpcode()) {

3460

if (Op.getMachineOpcode() == PPC::CRSET)

3461

Op1Set = true;

3462

else if (Op.getMachineOpcode() == PPC::CRUNSET)

3463

Op1Unset = true;

3464

else if (Op.getMachineOpcode() == PPC::CRNOR &&

3465

Op.getOperand(0) == Op.getOperand(1))

Op1Not = true;

}

}

break;

}

Hal Finkel

2014-02-28 06:11:16 +0000

[diff] [blame]

3472

bool SelectSwap = false;

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

switch (Opcode) {

default: break;

case PPC::CRAND:

if (MachineNode->getOperand(0) == MachineNode->getOperand(1))

3477

// x & x = x

3478

ResNode = MachineNode->getOperand(0).getNode();

3479

else if (Op1Set)

3480

// 1 & y = y

3481

ResNode = MachineNode->getOperand(1).getNode();

3482

else if (Op2Set)

3483

// x & 1 = x

3484

ResNode = MachineNode->getOperand(0).getNode();

3485

else if (Op1Unset || Op2Unset)

3486

// x & 0 = 0 & y = 0

3487

ResNode = CurDAG->getMachineNode(PPC::CRUNSET, SDLoc(MachineNode),

3488

MVT::i1);

3489

else if (Op1Not)

3490

// ~x & y = andc(y, x)

3491

ResNode = CurDAG->getMachineNode(PPC::CRANDC, SDLoc(MachineNode),

3492

MVT::i1, MachineNode->getOperand(1),

3493

MachineNode->getOperand(0).

3494

getOperand(0));

3495

else if (Op2Not)

3496

// x & ~y = andc(x, y)

3497

ResNode = CurDAG->getMachineNode(PPC::CRANDC, SDLoc(MachineNode),

3498

MVT::i1, MachineNode->getOperand(0),

3499

MachineNode->getOperand(1).

3500

getOperand(0));

Hal Finkel

2014-02-28 06:11:16 +0000

[diff] [blame]

3501

else if (AllUsersSelectZero(MachineNode))

3502

ResNode = CurDAG->getMachineNode(PPC::CRNAND, SDLoc(MachineNode),

3503

MVT::i1, MachineNode->getOperand(0),

3504

MachineNode->getOperand(1)),

3505

SelectSwap = true;

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

3506

break;

3507

case PPC::CRNAND:

3508

if (MachineNode->getOperand(0) == MachineNode->getOperand(1))

3509

// nand(x, x) -> nor(x, x)

3510

ResNode = CurDAG->getMachineNode(PPC::CRNOR, SDLoc(MachineNode),

3511

MVT::i1, MachineNode->getOperand(0),

3512

MachineNode->getOperand(0));

3513

else if (Op1Set)

3514

// nand(1, y) -> nor(y, y)

3515

ResNode = CurDAG->getMachineNode(PPC::CRNOR, SDLoc(MachineNode),

3516

MVT::i1, MachineNode->getOperand(1),

3517

MachineNode->getOperand(1));

3518

else if (Op2Set)

3519

// nand(x, 1) -> nor(x, x)

3520

ResNode = CurDAG->getMachineNode(PPC::CRNOR, SDLoc(MachineNode),

3521

MVT::i1, MachineNode->getOperand(0),

3522

MachineNode->getOperand(0));

3523

else if (Op1Unset || Op2Unset)

3524

// nand(x, 0) = nand(0, y) = 1

3525

ResNode = CurDAG->getMachineNode(PPC::CRSET, SDLoc(MachineNode),

3526

MVT::i1);

3527

else if (Op1Not)

3528

// nand(~x, y) = ~(~x & y) = x | ~y = orc(x, y)

3529

ResNode = CurDAG->getMachineNode(PPC::CRORC, SDLoc(MachineNode),

3530

MVT::i1, MachineNode->getOperand(0).

3531

getOperand(0),

3532

MachineNode->getOperand(1));

3533

else if (Op2Not)

3534

// nand(x, ~y) = ~x | y = orc(y, x)

3535

ResNode = CurDAG->getMachineNode(PPC::CRORC, SDLoc(MachineNode),

3536

MVT::i1, MachineNode->getOperand(1).

3537

getOperand(0),

3538

MachineNode->getOperand(0));

Hal Finkel

2014-02-28 06:11:16 +0000

[diff] [blame]

3539

else if (AllUsersSelectZero(MachineNode))

3540

ResNode = CurDAG->getMachineNode(PPC::CRAND, SDLoc(MachineNode),

3541

MVT::i1, MachineNode->getOperand(0),

3542

MachineNode->getOperand(1)),

3543

SelectSwap = true;

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

3544

break;

3545

case PPC::CROR:

3546

if (MachineNode->getOperand(0) == MachineNode->getOperand(1))

3547

// x | x = x

3548

ResNode = MachineNode->getOperand(0).getNode();

3549

else if (Op1Set || Op2Set)

3550

// x | 1 = 1 | y = 1

3551

ResNode = CurDAG->getMachineNode(PPC::CRSET, SDLoc(MachineNode),

MVT::i1);

else if (Op1Unset)

// 0 | y = y

ResNode = MachineNode->getOperand(1).getNode();

3556

else if (Op2Unset)

3557

// x | 0 = x

3558

ResNode = MachineNode->getOperand(0).getNode();

3559

else if (Op1Not)

3560

// ~x | y = orc(y, x)

3561

ResNode = CurDAG->getMachineNode(PPC::CRORC, SDLoc(MachineNode),

3562

MVT::i1, MachineNode->getOperand(1),

3563

MachineNode->getOperand(0).

3564

getOperand(0));

3565

else if (Op2Not)

3566

// x | ~y = orc(x, y)

3567

ResNode = CurDAG->getMachineNode(PPC::CRORC, SDLoc(MachineNode),

3568

MVT::i1, MachineNode->getOperand(0),

3569

MachineNode->getOperand(1).

3570

getOperand(0));

Hal Finkel

2014-02-28 06:11:16 +0000

[diff] [blame]

3571

else if (AllUsersSelectZero(MachineNode))

3572

ResNode = CurDAG->getMachineNode(PPC::CRNOR, SDLoc(MachineNode),

3573

MVT::i1, MachineNode->getOperand(0),

3574

MachineNode->getOperand(1)),

3575

SelectSwap = true;

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

3576

break;

3577

case PPC::CRXOR:

3578

if (MachineNode->getOperand(0) == MachineNode->getOperand(1))

3579

// xor(x, x) = 0

3580

ResNode = CurDAG->getMachineNode(PPC::CRUNSET, SDLoc(MachineNode),

3581

MVT::i1);

3582

else if (Op1Set)

3583

// xor(1, y) -> nor(y, y)

3584

ResNode = CurDAG->getMachineNode(PPC::CRNOR, SDLoc(MachineNode),

3585

MVT::i1, MachineNode->getOperand(1),

3586

MachineNode->getOperand(1));

3587

else if (Op2Set)

3588

// xor(x, 1) -> nor(x, x)

3589

ResNode = CurDAG->getMachineNode(PPC::CRNOR, SDLoc(MachineNode),

3590

MVT::i1, MachineNode->getOperand(0),

3591

MachineNode->getOperand(0));

3592

else if (Op1Unset)

3593

// xor(0, y) = y

3594

ResNode = MachineNode->getOperand(1).getNode();

3595

else if (Op2Unset)

3596

// xor(x, 0) = x

3597

ResNode = MachineNode->getOperand(0).getNode();

3598

else if (Op1Not)

3599

// xor(~x, y) = eqv(x, y)

3600

ResNode = CurDAG->getMachineNode(PPC::CREQV, SDLoc(MachineNode),

3601

MVT::i1, MachineNode->getOperand(0).

3602

getOperand(0),

3603

MachineNode->getOperand(1));

3604

else if (Op2Not)

3605

// xor(x, ~y) = eqv(x, y)

3606

ResNode = CurDAG->getMachineNode(PPC::CREQV, SDLoc(MachineNode),

3607

MVT::i1, MachineNode->getOperand(0),

3608

MachineNode->getOperand(1).

3609

getOperand(0));

Hal Finkel

2014-02-28 06:11:16 +0000

[diff] [blame]

3610

else if (AllUsersSelectZero(MachineNode))

3611

ResNode = CurDAG->getMachineNode(PPC::CREQV, SDLoc(MachineNode),

3612

MVT::i1, MachineNode->getOperand(0),

3613

MachineNode->getOperand(1)),

3614

SelectSwap = true;

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

3615

break;

3616

case PPC::CRNOR:

3617

if (Op1Set || Op2Set)

3618

// nor(1, y) -> 0

3619

ResNode = CurDAG->getMachineNode(PPC::CRUNSET, SDLoc(MachineNode),

3620

MVT::i1);

3621

else if (Op1Unset)

3622

// nor(0, y) = ~y -> nor(y, y)

3623

ResNode = CurDAG->getMachineNode(PPC::CRNOR, SDLoc(MachineNode),

3624

MVT::i1, MachineNode->getOperand(1),

3625

MachineNode->getOperand(1));

3626

else if (Op2Unset)

3627

// nor(x, 0) = ~x

3628

ResNode = CurDAG->getMachineNode(PPC::CRNOR, SDLoc(MachineNode),

3629

MVT::i1, MachineNode->getOperand(0),

3630

MachineNode->getOperand(0));

3631

else if (Op1Not)

3632

// nor(~x, y) = andc(x, y)

3633

ResNode = CurDAG->getMachineNode(PPC::CRANDC, SDLoc(MachineNode),

3634

MVT::i1, MachineNode->getOperand(0).

3635

getOperand(0),

3636

MachineNode->getOperand(1));

3637

else if (Op2Not)

3638

// nor(x, ~y) = andc(y, x)

3639

ResNode = CurDAG->getMachineNode(PPC::CRANDC, SDLoc(MachineNode),

3640

MVT::i1, MachineNode->getOperand(1).

3641

getOperand(0),

3642

MachineNode->getOperand(0));

Hal Finkel

2014-02-28 06:11:16 +0000

[diff] [blame]

3643

else if (AllUsersSelectZero(MachineNode))

3644

ResNode = CurDAG->getMachineNode(PPC::CROR, SDLoc(MachineNode),

3645

MVT::i1, MachineNode->getOperand(0),

3646

MachineNode->getOperand(1)),

3647

SelectSwap = true;

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

3648

break;

3649

case PPC::CREQV:

3650

if (MachineNode->getOperand(0) == MachineNode->getOperand(1))

3651

// eqv(x, x) = 1

3652

ResNode = CurDAG->getMachineNode(PPC::CRSET, SDLoc(MachineNode),

MVT::i1);

else if (Op1Set)

// eqv(1, y) = y

ResNode = MachineNode->getOperand(1).getNode();

3657

else if (Op2Set)

3658

// eqv(x, 1) = x

3659

ResNode = MachineNode->getOperand(0).getNode();

3660

else if (Op1Unset)

3661

// eqv(0, y) = ~y -> nor(y, y)

3662

ResNode = CurDAG->getMachineNode(PPC::CRNOR, SDLoc(MachineNode),

3663

MVT::i1, MachineNode->getOperand(1),

3664

MachineNode->getOperand(1));

3665

else if (Op2Unset)

3666

// eqv(x, 0) = ~x

3667

ResNode = CurDAG->getMachineNode(PPC::CRNOR, SDLoc(MachineNode),

3668

MVT::i1, MachineNode->getOperand(0),

3669

MachineNode->getOperand(0));

3670

else if (Op1Not)

3671

// eqv(~x, y) = xor(x, y)

3672

ResNode = CurDAG->getMachineNode(PPC::CRXOR, SDLoc(MachineNode),

3673

MVT::i1, MachineNode->getOperand(0).

3674

getOperand(0),

3675

MachineNode->getOperand(1));

3676

else if (Op2Not)

3677

// eqv(x, ~y) = xor(x, y)

3678

ResNode = CurDAG->getMachineNode(PPC::CRXOR, SDLoc(MachineNode),

3679

MVT::i1, MachineNode->getOperand(0),

3680

MachineNode->getOperand(1).

3681

getOperand(0));

Hal Finkel

2014-02-28 06:11:16 +0000

[diff] [blame]

3682

else if (AllUsersSelectZero(MachineNode))

3683

ResNode = CurDAG->getMachineNode(PPC::CRXOR, SDLoc(MachineNode),

3684

MVT::i1, MachineNode->getOperand(0),

3685

MachineNode->getOperand(1)),

3686

SelectSwap = true;

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

3687

break;

3688

case PPC::CRANDC:

3689

if (MachineNode->getOperand(0) == MachineNode->getOperand(1))

3690

// andc(x, x) = 0

3691

ResNode = CurDAG->getMachineNode(PPC::CRUNSET, SDLoc(MachineNode),

MVT::i1);

else if (Op1Set)

// andc(1, y) = ~y

ResNode = CurDAG->getMachineNode(PPC::CRNOR, SDLoc(MachineNode),

3696

MVT::i1, MachineNode->getOperand(1),

3697

MachineNode->getOperand(1));

3698

else if (Op1Unset || Op2Set)

3699

// andc(0, y) = andc(x, 1) = 0

3700

ResNode = CurDAG->getMachineNode(PPC::CRUNSET, SDLoc(MachineNode),

MVT::i1);

else if (Op2Unset)

// andc(x, 0) = x

ResNode = MachineNode->getOperand(0).getNode();

3705

else if (Op1Not)

3706

// andc(~x, y) = ~(x | y) = nor(x, y)

3707

ResNode = CurDAG->getMachineNode(PPC::CRNOR, SDLoc(MachineNode),

3708

MVT::i1, MachineNode->getOperand(0).

3709

getOperand(0),

3710

MachineNode->getOperand(1));

3711

else if (Op2Not)

3712

// andc(x, ~y) = x & y

3713

ResNode = CurDAG->getMachineNode(PPC::CRAND, SDLoc(MachineNode),

3714

MVT::i1, MachineNode->getOperand(0),

3715

MachineNode->getOperand(1).

3716

getOperand(0));

Hal Finkel

2014-02-28 06:11:16 +0000

[diff] [blame]

3717

else if (AllUsersSelectZero(MachineNode))

3718

ResNode = CurDAG->getMachineNode(PPC::CRORC, SDLoc(MachineNode),

3719

MVT::i1, MachineNode->getOperand(1),

3720

MachineNode->getOperand(0)),

3721

SelectSwap = true;

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

3722

break;

3723

case PPC::CRORC:

3724

if (MachineNode->getOperand(0) == MachineNode->getOperand(1))

3725

// orc(x, x) = 1

3726

ResNode = CurDAG->getMachineNode(PPC::CRSET, SDLoc(MachineNode),

3727

MVT::i1);

3728

else if (Op1Set || Op2Unset)

3729

// orc(1, y) = orc(x, 0) = 1

3730

ResNode = CurDAG->getMachineNode(PPC::CRSET, SDLoc(MachineNode),

MVT::i1);

else if (Op2Set)

// orc(x, 1) = x

ResNode = MachineNode->getOperand(0).getNode();

3735

else if (Op1Unset)

3736

// orc(0, y) = ~y

3737

ResNode = CurDAG->getMachineNode(PPC::CRNOR, SDLoc(MachineNode),

3738

MVT::i1, MachineNode->getOperand(1),

3739

MachineNode->getOperand(1));

3740

else if (Op1Not)

3741

// orc(~x, y) = ~(x & y) = nand(x, y)

3742

ResNode = CurDAG->getMachineNode(PPC::CRNAND, SDLoc(MachineNode),

3743

MVT::i1, MachineNode->getOperand(0).

3744

getOperand(0),

3745

MachineNode->getOperand(1));

3746

else if (Op2Not)

3747

// orc(x, ~y) = x | y

3748

ResNode = CurDAG->getMachineNode(PPC::CROR, SDLoc(MachineNode),

3749

MVT::i1, MachineNode->getOperand(0),

3750

MachineNode->getOperand(1).

3751

getOperand(0));

Hal Finkel

2014-02-28 06:11:16 +0000

[diff] [blame]

3752

else if (AllUsersSelectZero(MachineNode))

3753

ResNode = CurDAG->getMachineNode(PPC::CRANDC, SDLoc(MachineNode),

3754

MVT::i1, MachineNode->getOperand(1),

3755

MachineNode->getOperand(0)),

3756

SelectSwap = true;

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

break;

case PPC::SELECT_I4:

case PPC::SELECT_I8:

case PPC::SELECT_F4:

case PPC::SELECT_F8:

Hal Finkel

2015-02-25 01:06:45 +0000

[diff] [blame]

3762

case PPC::SELECT_QFRC:

3763

case PPC::SELECT_QSRC:

3764

case PPC::SELECT_QBRC:

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

3765

case PPC::SELECT_VRRC:

Bill Schmidt

9c54bbd

2014-10-22 16:58:20 +0000

[diff] [blame]

3766

case PPC::SELECT_VSFRC:

Bill Schmidt

2014-10-22 13:13:40 +0000

[diff] [blame]

3767

case PPC::SELECT_VSRC:

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

3768

if (Op1Set)

3769

ResNode = MachineNode->getOperand(1).getNode();

3770

else if (Op1Unset)

3771

ResNode = MachineNode->getOperand(2).getNode();

3772

else if (Op1Not)

3773

ResNode = CurDAG->getMachineNode(MachineNode->getMachineOpcode(),

3774

SDLoc(MachineNode),

3775

MachineNode->getValueType(0),

3776

MachineNode->getOperand(0).

3777

getOperand(0),

3778

MachineNode->getOperand(2),

3779

MachineNode->getOperand(1));

break;

case PPC::BC:

case PPC::BCn:

if (Op1Not)

ResNode = CurDAG->getMachineNode(Opcode == PPC::BC ? PPC::BCn :

PPC::BC,

SDLoc(MachineNode),

MVT::Other,

MachineNode->getOperand(0).

3789

getOperand(0),

3790

MachineNode->getOperand(1),

3791

MachineNode->getOperand(2));

3792

// FIXME: Handle Op1Set, Op1Unset here too.

break;

}

Hal Finkel

2014-02-28 06:11:16 +0000

[diff] [blame]

3796

// If we're inverting this node because it is used only by selects that

3797

// we'd like to swap, then swap the selects before the node replacement.

3798

if (SelectSwap)

3799

SwapAllSelectUsers(MachineNode);

3800

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

3801

if (ResNode != MachineNode) {

3802

DEBUG(dbgs() << "CR Peephole replacing:\nOld: ");

3803

DEBUG(MachineNode->dump(CurDAG));

3804

DEBUG(dbgs() << "\nNew: ");

3805

DEBUG(ResNode->dump(CurDAG));

3806

DEBUG(dbgs() << "\n");

3807

3808

ReplaceUses(MachineNode, ResNode);

IsModified = true;

}

}

if (IsModified)

CurDAG->RemoveDeadNodes();

3814

} while (IsModified);

3815

}

3816

Hal Finkel

2014-12-12 23:59:36 +0000

[diff] [blame]

3817

// Gather the set of 32-bit operations that are known to have their

3818

// higher-order 32 bits zero, where ToPromote contains all such operations.

3819

static bool PeepholePPC64ZExtGather(SDValue Op32,

3820

SmallPtrSetImpl<SDNode *> &ToPromote) {

3821

if (!Op32.isMachineOpcode())

3822

return false;

3823

3824

// First, check for the "frontier" instructions (those that will clear the

3825

// higher-order 32 bits.

3826

3827

// For RLWINM and RLWNM, we need to make sure that the mask does not wrap

3828

// around. If it does not, then these instructions will clear the

3829

// higher-order bits.

3830

if ((Op32.getMachineOpcode() == PPC::RLWINM ||

3831

Op32.getMachineOpcode() == PPC::RLWNM) &&

3832

Op32.getConstantOperandVal(2) <= Op32.getConstantOperandVal(3)) {

3833

ToPromote.insert(Op32.getNode());

return true;

}

// SLW and SRW always clear the higher-order bits.

3838

if (Op32.getMachineOpcode() == PPC::SLW ||

3839

Op32.getMachineOpcode() == PPC::SRW) {

3840

ToPromote.insert(Op32.getNode());

return true;

}

// For LI and LIS, we need the immediate to be positive (so that it is not

3845

// sign extended).

3846

if (Op32.getMachineOpcode() == PPC::LI ||

3847

Op32.getMachineOpcode() == PPC::LIS) {

3848

if (!isUInt<15>(Op32.getConstantOperandVal(0)))

3849

return false;

3850

3851

ToPromote.insert(Op32.getNode());

return true;

}

Hal Finkel

2015-01-05 18:09:06 +0000

[diff] [blame]

3855

// LHBRX and LWBRX always clear the higher-order bits.

3856

if (Op32.getMachineOpcode() == PPC::LHBRX ||

3857

Op32.getMachineOpcode() == PPC::LWBRX) {

3858

ToPromote.insert(Op32.getNode());

return true;

}

Hal Finkel

2015-01-05 18:52:29 +0000

[diff] [blame]

3862

// CNTLZW always produces a 64-bit value in [0,32], and so is zero extended.

3863

if (Op32.getMachineOpcode() == PPC::CNTLZW) {

3864

ToPromote.insert(Op32.getNode());

return true;

}

Hal Finkel

2014-12-12 23:59:36 +0000

[diff] [blame]

3868

// Next, check for those instructions we can look through.

3869

3870

// Assuming the mask does not wrap around, then the higher-order bits are

3871

// taken directly from the first operand.

3872

if (Op32.getMachineOpcode() == PPC::RLWIMI &&

3873

Op32.getConstantOperandVal(3) <= Op32.getConstantOperandVal(4)) {

3874

SmallPtrSet<SDNode *, 16> ToPromote1;

3875

if (!PeepholePPC64ZExtGather(Op32.getOperand(0), ToPromote1))

3876

return false;

3877

3878

ToPromote.insert(Op32.getNode());

3879

ToPromote.insert(ToPromote1.begin(), ToPromote1.end());

return true;

}

// For OR, the higher-order bits are zero if that is true for both operands.

3884

// For SELECT_I4, the same is true (but the relevant operand numbers are

3885

// shifted by 1).

3886

if (Op32.getMachineOpcode() == PPC::OR ||

3887

Op32.getMachineOpcode() == PPC::SELECT_I4) {

3888

unsigned B = Op32.getMachineOpcode() == PPC::SELECT_I4 ? 1 : 0;

3889

SmallPtrSet<SDNode *, 16> ToPromote1;

3890

if (!PeepholePPC64ZExtGather(Op32.getOperand(B+0), ToPromote1))

3891

return false;

3892

if (!PeepholePPC64ZExtGather(Op32.getOperand(B+1), ToPromote1))

3893

return false;

3894

3895

ToPromote.insert(Op32.getNode());

3896

ToPromote.insert(ToPromote1.begin(), ToPromote1.end());

return true;

}

// For ORI and ORIS, we need the higher-order bits of the first operand to be

3901

// zero, and also for the constant to be positive (so that it is not sign

3902

// extended).

3903

if (Op32.getMachineOpcode() == PPC::ORI ||

3904

Op32.getMachineOpcode() == PPC::ORIS) {

3905

SmallPtrSet<SDNode *, 16> ToPromote1;

3906

if (!PeepholePPC64ZExtGather(Op32.getOperand(0), ToPromote1))

3907

return false;

3908

if (!isUInt<15>(Op32.getConstantOperandVal(1)))

3909

return false;

3910

3911

ToPromote.insert(Op32.getNode());

3912

ToPromote.insert(ToPromote1.begin(), ToPromote1.end());

return true;

}

// The higher-order bits of AND are zero if that is true for at least one of

3917

// the operands.

3918

if (Op32.getMachineOpcode() == PPC::AND) {

3919

SmallPtrSet<SDNode *, 16> ToPromote1, ToPromote2;

3920

bool Op0OK =

3921

PeepholePPC64ZExtGather(Op32.getOperand(0), ToPromote1);

3922

bool Op1OK =

3923

PeepholePPC64ZExtGather(Op32.getOperand(1), ToPromote2);

3924

if (!Op0OK && !Op1OK)

3925

return false;

3926

3927

ToPromote.insert(Op32.getNode());

3928

3929

if (Op0OK)

3930

ToPromote.insert(ToPromote1.begin(), ToPromote1.end());

3931

3932

if (Op1OK)

3933

ToPromote.insert(ToPromote2.begin(), ToPromote2.end());

return true;

}

// For ANDI and ANDIS, the higher-order bits are zero if either that is true

3939

// of the first operand, or if the second operand is positive (so that it is

3940

// not sign extended).

3941

if (Op32.getMachineOpcode() == PPC::ANDIo ||

3942

Op32.getMachineOpcode() == PPC::ANDISo) {

3943

SmallPtrSet<SDNode *, 16> ToPromote1;

3944

bool Op0OK =

3945

PeepholePPC64ZExtGather(Op32.getOperand(0), ToPromote1);

3946

bool Op1OK = isUInt<15>(Op32.getConstantOperandVal(1));

3947

if (!Op0OK && !Op1OK)

3948

return false;

3949

3950

ToPromote.insert(Op32.getNode());

3951

3952

if (Op0OK)

3953

ToPromote.insert(ToPromote1.begin(), ToPromote1.end());

return true;

}

return false;

}

void PPCDAGToDAGISel::PeepholePPC64ZExt() {

3962

if (!PPCSubTarget->isPPC64())

3963

return;

3964

3965

// When we zero-extend from i32 to i64, we use a pattern like this:

3966

// def : Pat<(i64 (zext i32:$in)),

3967

// (RLDICL (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $in, sub_32),

3968

// 0, 32)>;

3969

// There are several 32-bit shift/rotate instructions, however, that will

3970

// clear the higher-order bits of their output, rendering the RLDICL

3971

// unnecessary. When that happens, we remove it here, and redefine the

3972

// relevant 32-bit operation to be a 64-bit operation.

3973

3974

SelectionDAG::allnodes_iterator Position(CurDAG->getRoot().getNode());

3975

++Position;

3976

3977

bool MadeChange = false;

3978

while (Position != CurDAG->allnodes_begin()) {

3979

SDNode *N = --Position;

3980

// Skip dead nodes and any non-machine opcodes.

3981

if (N->use_empty() || !N->isMachineOpcode())

3982

continue;

3983

3984

if (N->getMachineOpcode() != PPC::RLDICL)

3985

continue;

3986

3987

if (N->getConstantOperandVal(1) != 0 ||

3988

N->getConstantOperandVal(2) != 32)

3989

continue;

3990

3991

SDValue ISR = N->getOperand(0);

3992

if (!ISR.isMachineOpcode() ||

3993

ISR.getMachineOpcode() != TargetOpcode::INSERT_SUBREG)

3994

continue;

3995

3996

if (!ISR.hasOneUse())

3997

continue;

3998

3999

if (ISR.getConstantOperandVal(2) != PPC::sub_32)

4000

continue;

4001

4002

SDValue IDef = ISR.getOperand(0);

4003

if (!IDef.isMachineOpcode() ||

4004

IDef.getMachineOpcode() != TargetOpcode::IMPLICIT_DEF)

4005

continue;

4006

4007

// We now know that we're looking at a canonical i32 -> i64 zext. See if we

4008

// can get rid of it.

4009

4010

SDValue Op32 = ISR->getOperand(1);

4011

if (!Op32.isMachineOpcode())

4012

continue;

4013

4014

// There are some 32-bit instructions that always clear the high-order 32

4015

// bits, there are also some instructions (like AND) that we can look

4016

// through.

4017

SmallPtrSet<SDNode *, 16> ToPromote;

4018

if (!PeepholePPC64ZExtGather(Op32, ToPromote))

4019

continue;

4020

4021

// If the ToPromote set contains nodes that have uses outside of the set

4022

// (except for the original INSERT_SUBREG), then abort the transformation.

4023

bool OutsideUse = false;

4024

for (SDNode *PN : ToPromote) {

4025

for (SDNode *UN : PN->uses()) {

4026

if (!ToPromote.count(UN) && UN != ISR.getNode()) {

OutsideUse = true;

break;

}

}

if (OutsideUse)

break;

}

if (OutsideUse)

continue;

MadeChange = true;

// We now know that this zero extension can be removed by promoting to

4041

// nodes in ToPromote to 64-bit operations, where for operations in the

4042

// frontier of the set, we need to insert INSERT_SUBREGs for their

4043

// operands.

4044

for (SDNode *PN : ToPromote) {

4045

unsigned NewOpcode;

4046

switch (PN->getMachineOpcode()) {

4047

default:

4048

llvm_unreachable("Don't know the 64-bit variant of this instruction");

4049

case PPC::RLWINM: NewOpcode = PPC::RLWINM8; break;

4050

case PPC::RLWNM: NewOpcode = PPC::RLWNM8; break;

4051

case PPC::SLW: NewOpcode = PPC::SLW8; break;

4052

case PPC::SRW: NewOpcode = PPC::SRW8; break;

4053

case PPC::LI: NewOpcode = PPC::LI8; break;

4054

case PPC::LIS: NewOpcode = PPC::LIS8; break;

Hal Finkel

4e2c782

2015-01-05 18:09:06 +0000

[diff] [blame]

4055

case PPC::LHBRX: NewOpcode = PPC::LHBRX8; break;

4056

case PPC::LWBRX: NewOpcode = PPC::LWBRX8; break;

Hal Finkel

49557f1

2015-01-05 18:52:29 +0000

[diff] [blame]

4057

case PPC::CNTLZW: NewOpcode = PPC::CNTLZW8; break;

Hal Finkel

2014-12-12 23:59:36 +0000

[diff] [blame]

4058

case PPC::RLWIMI: NewOpcode = PPC::RLWIMI8; break;

4059

case PPC::OR: NewOpcode = PPC::OR8; break;

4060

case PPC::SELECT_I4: NewOpcode = PPC::SELECT_I8; break;

4061

case PPC::ORI: NewOpcode = PPC::ORI8; break;

4062

case PPC::ORIS: NewOpcode = PPC::ORIS8; break;

4063

case PPC::AND: NewOpcode = PPC::AND8; break;

4064

case PPC::ANDIo: NewOpcode = PPC::ANDIo8; break;

4065

case PPC::ANDISo: NewOpcode = PPC::ANDISo8; break;

4066

}

4067

4068

// Note: During the replacement process, the nodes will be in an

4069

// inconsistent state (some instructions will have operands with values

4070

// of the wrong type). Once done, however, everything should be right

4071

// again.

4072

4073

SmallVector<SDValue, 4> Ops;

4074

for (const SDValue &V : PN->ops()) {

4075

if (!ToPromote.count(V.getNode()) && V.getValueType() == MVT::i32 &&

4076

!isa<ConstantSDNode>(V)) {

4077

SDValue ReplOpOps[] = { ISR.getOperand(0), V, ISR.getOperand(2) };

4078

SDNode *ReplOp =

4079

CurDAG->getMachineNode(TargetOpcode::INSERT_SUBREG, SDLoc(V),

4080

ISR.getNode()->getVTList(), ReplOpOps);

4081

Ops.push_back(SDValue(ReplOp, 0));

} else {

Ops.push_back(V);

}

}

// Because all to-be-promoted nodes only have users that are other

4088

// promoted nodes (or the original INSERT_SUBREG), we can safely replace

4089

// the i32 result value type with i64.

4090

4091

SmallVector<EVT, 2> NewVTs;

4092

SDVTList VTs = PN->getVTList();

4093

for (unsigned i = 0, ie = VTs.NumVTs; i != ie; ++i)

4094

if (VTs.VTs[i] == MVT::i32)

4095

NewVTs.push_back(MVT::i64);

4096

else

4097

NewVTs.push_back(VTs.VTs[i]);

4098

4099

DEBUG(dbgs() << "PPC64 ZExt Peephole morphing:\nOld: ");

4100

DEBUG(PN->dump(CurDAG));

4101

4102

CurDAG->SelectNodeTo(PN, NewOpcode, CurDAG->getVTList(NewVTs), Ops);

4103

4104

DEBUG(dbgs() << "\nNew: ");

4105

DEBUG(PN->dump(CurDAG));

4106

DEBUG(dbgs() << "\n");

4107

}

4108

4109

// Now we replace the original zero extend and its associated INSERT_SUBREG

4110

// with the value feeding the INSERT_SUBREG (which has now been promoted to

4111

// return an i64).

4112

4113

DEBUG(dbgs() << "PPC64 ZExt Peephole replacing:\nOld: ");

4114

DEBUG(N->dump(CurDAG));

4115

DEBUG(dbgs() << "\nNew: ");

4116

DEBUG(Op32.getNode()->dump(CurDAG));

4117

DEBUG(dbgs() << "\n");

4118

4119

ReplaceUses(N, Op32.getNode());

}

if (MadeChange)

CurDAG->RemoveDeadNodes();

4124

}

4125

Hal Finkel

2014-02-28 00:27:01 +0000

[diff] [blame]

4126

void PPCDAGToDAGISel::PeepholePPC64() {

Bill Schmidt

2013-02-21 00:38:25 +0000

[diff] [blame]

4127

// These optimizations are currently supported only for 64-bit SVR4.

Eric Christopher

2014-05-22 01:07:24 +0000

[diff] [blame]

4128

if (PPCSubTarget->isDarwin() || !PPCSubTarget->isPPC64())

Bill Schmidt

2013-02-21 00:38:25 +0000

[diff] [blame]

4129

return;

4130

4131

SelectionDAG::allnodes_iterator Position(CurDAG->getRoot().getNode());

4132

++Position;

4133

4134

while (Position != CurDAG->allnodes_begin()) {

4135

SDNode *N = --Position;

4136

// Skip dead nodes and any non-machine opcodes.

4137

if (N->use_empty() || !N->isMachineOpcode())

continue;

unsigned FirstOp;

unsigned StorageOpcode = N->getMachineOpcode();

4142

4143

switch (StorageOpcode) {

default: continue;

case PPC::LBZ:

case PPC::LBZ8:

case PPC::LD:

case PPC::LFD:

case PPC::LFS:

case PPC::LHA:

case PPC::LHA8:

case PPC::LHZ:

case PPC::LHZ8:

case PPC::LWA:

case PPC::LWZ:

case PPC::LWZ8:

FirstOp = 0;

break;

case PPC::STB:

case PPC::STB8:

case PPC::STD:

case PPC::STFD:

case PPC::STFS:

case PPC::STH:

case PPC::STH8:

case PPC::STW:

case PPC::STW8:

FirstOp = 1;

break;

}

// If this is a load or store with a zero offset, we may be able to

4175

// fold an add-immediate into the memory operation.

4176

if (!isa<ConstantSDNode>(N->getOperand(FirstOp)) ||

4177

N->getConstantOperandVal(FirstOp) != 0)

4178

continue;

4179

4180

SDValue Base = N->getOperand(FirstOp + 1);

4181

if (!Base.isMachineOpcode())

continue;

unsigned Flags = 0;

bool ReplaceFlags = true;

4186

4187

// When the feeding operation is an add-immediate of some sort,

4188

// determine whether we need to add relocation information to the

4189

// target flags on the immediate operand when we fold it into the

4190

// load instruction.

4191

//

4192

// For something like ADDItocL, the relocation information is

4193

// inferred from the opcode; when we process it in the AsmPrinter,

4194

// we add the necessary relocation there. A load, though, can receive

4195

// relocation from various flavors of ADDIxxx, so we need to carry

4196

// the relocation information in the target flags.

4197

switch (Base.getMachineOpcode()) {

4198

default: continue;

4199

4200

case PPC::ADDI8:

Ulrich Weigand

35f9fdf

2013-03-26 10:55:20 +0000

[diff] [blame]

4201

case PPC::ADDI:

Bill Schmidt

2013-02-21 00:38:25 +0000

[diff] [blame]

4202

// In some cases (such as TLS) the relocation information

4203

// is already in place on the operand, so copying the operand

4204

// is sufficient.

4205

ReplaceFlags = false;

4206

// For these cases, the immediate may not be divisible by 4, in

4207

// which case the fold is illegal for DS-form instructions. (The

4208

// other cases provide aligned addresses and are always safe.)

4209

if ((StorageOpcode == PPC::LWA ||

4210

StorageOpcode == PPC::LD ||

4211

StorageOpcode == PPC::STD) &&

4212

(!isa<ConstantSDNode>(Base.getOperand(1)) ||

4213

Base.getConstantOperandVal(1) % 4 != 0))

4214

continue;

4215

break;

4216

case PPC::ADDIdtprelL:

Ulrich Weigand

d51c09f

2013-06-21 14:42:20 +0000

[diff] [blame]

4217

Flags = PPCII::MO_DTPREL_LO;

Bill Schmidt

2013-02-21 00:38:25 +0000

[diff] [blame]

4218

break;

4219

case PPC::ADDItlsldL:

Ulrich Weigand

d51c09f

2013-06-21 14:42:20 +0000

[diff] [blame]

4220

Flags = PPCII::MO_TLSLD_LO;

Bill Schmidt

2013-02-21 00:38:25 +0000

[diff] [blame]

4221

break;

4222

case PPC::ADDItocL:

Ulrich Weigand

d51c09f

2013-06-21 14:42:20 +0000

[diff] [blame]

4223

Flags = PPCII::MO_TOC_LO;

Bill Schmidt

2013-02-21 00:38:25 +0000

[diff] [blame]

break;

}

// We found an opportunity. Reverse the operands from the add

4228

// immediate and substitute them into the load or store. If

4229

// needed, update the target flags for the immediate operand to

4230

// reflect the necessary relocation information.

4231

DEBUG(dbgs() << "Folding add-immediate into mem-op:\nBase: ");

4232

DEBUG(Base->dump(CurDAG));

4233

DEBUG(dbgs() << "\nN: ");

4234

DEBUG(N->dump(CurDAG));

4235

DEBUG(dbgs() << "\n");

4236

4237

SDValue ImmOpnd = Base.getOperand(1);

4238

4239

// If the relocation information isn't already present on the

4240

// immediate operand, add it now.

4241

if (ReplaceFlags) {

Bill Schmidt

49498da

2013-02-21 14:35:42 +0000

[diff] [blame]

4242

if (GlobalAddressSDNode *GA = dyn_cast<GlobalAddressSDNode>(ImmOpnd)) {

Andrew Trick

2013-05-25 02:42:55 +0000

[diff] [blame]

4243

SDLoc dl(GA);

Bill Schmidt

2013-02-21 00:38:25 +0000

[diff] [blame]

4244

const GlobalValue *GV = GA->getGlobal();

Bill Schmidt

48fc20a

2013-07-01 20:52:27 +0000

[diff] [blame]

4245

// We can't perform this optimization for data whose alignment

4246

// is insufficient for the instruction encoding.

4247

if (GV->getAlignment() < 4 &&

4248

(StorageOpcode == PPC::LD || StorageOpcode == PPC::STD ||

4249

StorageOpcode == PPC::LWA)) {

4250

DEBUG(dbgs() << "Rejected this candidate for alignment.\n\n");

4251

continue;

4252

}

Bill Schmidt

2013-02-21 00:38:25 +0000

[diff] [blame]

4253

ImmOpnd = CurDAG->getTargetGlobalAddress(GV, dl, MVT::i64, 0, Flags);

Bill Schmidt

836c45b

2013-02-21 17:26:05 +0000

[diff] [blame]

4254

} else if (ConstantPoolSDNode *CP =

4255

dyn_cast<ConstantPoolSDNode>(ImmOpnd)) {

Bill Schmidt

49498da

2013-02-21 14:35:42 +0000

[diff] [blame]

4256

const Constant *C = CP->getConstVal();

4257

ImmOpnd = CurDAG->getTargetConstantPool(C, MVT::i64,

4258

CP->getAlignment(),

4259

0, Flags);

Bill Schmidt

2013-02-21 00:38:25 +0000

[diff] [blame]

}

}

if (FirstOp == 1) // Store

4264

(void)CurDAG->UpdateNodeOperands(N, N->getOperand(0), ImmOpnd,

4265

Base.getOperand(0), N->getOperand(3));

4266

else // Load

4267

(void)CurDAG->UpdateNodeOperands(N, ImmOpnd, Base.getOperand(0),

4268

N->getOperand(2));

4269

4270

// The add-immediate may now be dead, in which case remove it.

4271

if (Base.getNode()->use_empty())

4272

CurDAG->RemoveDeadNode(Base.getNode());

4273

}

4274

}

Chris Lattner

2005-08-17 19:33:03 +0000

[diff] [blame]

4275

Chris Lattner

b055c87

2006-06-10 01:15:02 +0000

[diff] [blame]

4276

Andrew Trick

2010-12-24 04:28:06 +0000

[diff] [blame]

4277

/// createPPCISelDag - This pass converts a legalized DAG into a

Chris Lattner

2005-08-17 19:33:03 +0000

[diff] [blame]

4278

/// PowerPC-specific DAG, ready for instruction scheduling.

4279

///

Evan Cheng

2dd2c65

2006-03-13 23:20:37 +0000

[diff] [blame]

4280

FunctionPass *llvm::createPPCISelDag(PPCTargetMachine &TM) {

Nate Begeman

0b71e00

2005-10-18 00:28:58 +0000

[diff] [blame]

4281

return new PPCDAGToDAGISel(TM);

Chris Lattner

2005-08-17 19:33:03 +0000

[diff] [blame]

4282

}

4283

Krzysztof Parzyszek

2013-02-13 17:40:07 +0000

[diff] [blame]

4284

static void initializePassOnce(PassRegistry &Registry) {

4285

const char *Name = "PowerPC DAG->DAG Pattern Instruction Selection";

Craig Topper

2014-04-25 05:30:21 +0000

[diff] [blame]

4286

PassInfo *PI = new PassInfo(Name, "ppc-codegen", &SelectionDAGISel::ID,

4287

nullptr, false, false);

Krzysztof Parzyszek