Blame - llvm/lib/Target/X86/X86InstrFPStack.td - toolchain/llvm-project

Evan Cheng

6e595b9

2006-02-21 19:13:53 +0000

[diff] [blame]

1

//==- X86InstrFPStack.td - Describe the X86 Instruction Set -------*- C++ -*-=//

2

//

3

// The LLVM Compiler Infrastructure

4

//

5

// This file was developed by Evan Cheng and is distributed under

6

// the University of Illinois Open Source License. See LICENSE.TXT for details.

7

//

8

//===----------------------------------------------------------------------===//

9

//

10

// This file describes the X86 x87 FPU instruction set, defining the

11

// instructions, and properties of the instructions which are needed for code

12

// generation, machine code emission, and analysis.

13

//

14

//===----------------------------------------------------------------------===//

15

Evan Cheng

4f67492

2006-03-17 19:55:52 +0000

[diff] [blame]

16

//===----------------------------------------------------------------------===//

Evan Cheng

9bf978d

2006-03-18 01:23:20 +0000

[diff] [blame^]

17

// FPStack specific DAG Nodes.

18

//===----------------------------------------------------------------------===//

19

20

def SDTX86FpGet : SDTypeProfile<1, 0, [SDTCisVT<0, f64>]>;

21

def SDTX86FpSet : SDTypeProfile<0, 1, [SDTCisFP<0>]>;

22

def SDTX86Fld : SDTypeProfile<1, 2, [SDTCisVT<0, f64>,

23

SDTCisPtrTy<1>, SDTCisVT<2, OtherVT>]>;

24

def SDTX86Fst : SDTypeProfile<0, 3, [SDTCisFP<0>,

25

SDTCisPtrTy<1>, SDTCisVT<2, OtherVT>]>;

26

def SDTX86Fild : SDTypeProfile<1, 2, [SDTCisVT<0, f64>, SDTCisPtrTy<1>,

27

SDTCisVT<2, OtherVT>]>;

28

def SDTX86FpToIMem: SDTypeProfile<0, 2, [SDTCisFP<0>, SDTCisPtrTy<1>]>;

29

30

def X86fpget : SDNode<"X86ISD::FP_GET_RESULT", SDTX86FpGet,

31

[SDNPHasChain, SDNPInFlag, SDNPOutFlag]>;

32

def X86fpset : SDNode<"X86ISD::FP_SET_RESULT", SDTX86FpSet,

33

[SDNPHasChain, SDNPOutFlag]>;

34

def X86fld : SDNode<"X86ISD::FLD", SDTX86Fld,

35

[SDNPHasChain]>;

36

def X86fst : SDNode<"X86ISD::FST", SDTX86Fst,

37

[SDNPHasChain, SDNPInFlag]>;

38

def X86fild : SDNode<"X86ISD::FILD", SDTX86Fild,

39

[SDNPHasChain]>;

40

def X86fildflag: SDNode<"X86ISD::FILD_FLAG",SDTX86Fild,

41

[SDNPHasChain, SDNPOutFlag]>;

42

def X86fp_to_i16mem : SDNode<"X86ISD::FP_TO_INT16_IN_MEM", SDTX86FpToIMem,

43

[SDNPHasChain]>;

44

def X86fp_to_i32mem : SDNode<"X86ISD::FP_TO_INT32_IN_MEM", SDTX86FpToIMem,

45

[SDNPHasChain]>;

46

def X86fp_to_i64mem : SDNode<"X86ISD::FP_TO_INT64_IN_MEM", SDTX86FpToIMem,

47

[SDNPHasChain]>;

48

49

//===----------------------------------------------------------------------===//

Evan Cheng

4f67492

2006-03-17 19:55:52 +0000

[diff] [blame]

50

// FPStack pattern fragments

51

//===----------------------------------------------------------------------===//

52

53

// fp32imm0 - Pattern leaf matching an f32 floating-point immediate for which
// isExactlyValue(+0.0) holds.
def fp32imm0 : PatLeaf<(f32 fpimm), [{

54

return N->isExactlyValue(+0.0);

55

}]>;

56

57

// fp64imm0 - Pattern leaf matching an f64 floating-point immediate for which
// isExactlyValue(+0.0) holds.
def fp64imm0 : PatLeaf<(f64 fpimm), [{

58

return N->isExactlyValue(+0.0);

59

}]>;

60

61

// fp64immneg0 - Pattern leaf matching an f64 floating-point immediate for
// which isExactlyValue(-0.0) holds.
def fp64immneg0 : PatLeaf<(f64 fpimm), [{

62

return N->isExactlyValue(-0.0);

63

}]>;

64

65

// fp64imm1 - Pattern leaf matching an f64 floating-point immediate for which
// isExactlyValue(+1.0) holds.
def fp64imm1 : PatLeaf<(f64 fpimm), [{

66

return N->isExactlyValue(+1.0);

67

}]>;

68

69

// fp64immneg1 - Pattern leaf matching an f64 floating-point immediate for
// which isExactlyValue(-1.0) holds.
def fp64immneg1 : PatLeaf<(f64 fpimm), [{

70

return N->isExactlyValue(-1.0);

71

}]>;

72

73

// extloadf64f32 - Pattern fragment for an extending load from $ptr whose
// memory type is f32 and whose result type is f64.
def extloadf64f32 : PatFrag<(ops node:$ptr), (f64 (extload node:$ptr, f32))>;

74

Evan Cheng

d584781

2006-02-21 20:00:20 +0000

[diff] [blame]

75

// Some 'special' instructions

76

let usesCustomDAGSchedInserter = 1 in { // Expanded by the scheduler.

77

def FP_TO_INT16_IN_MEM : I<0, Pseudo,

78

(ops i16mem:$dst, RFP:$src),

79

"#FP_TO_INT16_IN_MEM PSEUDO!",

80

[(X86fp_to_i16mem RFP:$src, addr:$dst)]>;

81

def FP_TO_INT32_IN_MEM : I<0, Pseudo,

82

(ops i32mem:$dst, RFP:$src),

83

"#FP_TO_INT32_IN_MEM PSEUDO!",

84

[(X86fp_to_i32mem RFP:$src, addr:$dst)]>;

85

def FP_TO_INT64_IN_MEM : I<0, Pseudo,

86

(ops i64mem:$dst, RFP:$src),

87

"#FP_TO_INT64_IN_MEM PSEUDO!",

88

[(X86fp_to_i64mem RFP:$src, addr:$dst)]>;

89

}

90

91

// FP_REG_KILL - Pseudo instruction with no operands and no selection pattern.
// It is flagged as a terminator and lists FP0 through FP6 in its Defs.
let isTerminator = 1 in

92

let Defs = [FP0, FP1, FP2, FP3, FP4, FP5, FP6] in

93

def FP_REG_KILL : I<0, Pseudo, (ops), "#FP_REG_KILL", []>;

94

Evan Cheng

6e595b9

2006-02-21 19:13:53 +0000

[diff] [blame]

95

// All FP Stack operations are represented with two instructions here. The

96

// first instruction, generated by the instruction selector, uses "RFP"

97

// registers: a traditional register file to reference floating point values.

98

// These instructions are all pseudo instructions and use the "Fp" prefix.

99

// The second instruction is defined with FPI, which is the actual instruction

100

// emitted by the assembler. The FP stackifier pass converts one to the other

101

// after register allocation occurs.

102

//

103

// Note that the FpI instruction should have instruction selection info (e.g.

104

// a pattern) and the FPI instruction should have emission info (e.g. opcode

105

// encoding and asm printing info).

106

107

// FPI - Floating Point Instruction template.

108

// Forwards the opcode, format, operand list and asm string to I, always with
// an empty pattern list (no instruction selection info on FPI records).
class FPI<bits<8> o, Format F, dag ops, string asm> : I<o, F, ops, asm, []> {}

109

110

// FpI_ - Floating Point Pseudo Instruction template. Not Predicated.

111

// Derives from X86Inst with opcode 0, the Pseudo format, NoImm and an empty
// asm string. Parameters: ops is the operand list, fp the FP format, and
// pattern the selection pattern list.
class FpI_<dag ops, FPFormat fp, list<dag> pattern>

112

: X86Inst<0, Pseudo, NoImm, ops, ""> {

113

// FPFormBits is derived from the Value field of the chosen FPForm.
let FPForm = fp; let FPFormBits = FPForm.Value;

114

let Pattern = pattern;

115

}

116

117

// Random Pseudo Instructions.

118

def FpGETRESULT : FpI_<(ops RFP:$dst), SpecialFP,

119

[(set RFP:$dst, X86fpget)]>; // FPR = ST(0)

120

121

let noResults = 1 in

122

def FpSETRESULT : FpI_<(ops RFP:$src), SpecialFP,

123

[(X86fpset RFP:$src)]>, Imp<[], [ST0]>; // ST(0) = FPR

124

125

// FpI - Floating Point Pseudo Instruction template. Predicated on FPStack.

126

class FpI<dag ops, FPFormat fp, list<dag> pattern> :

127

FpI_<ops, fp, pattern>, Requires<[FPStack]>;

128

129

130

def FpMOV : FpI<(ops RFP:$dst, RFP:$src), SpecialFP, []>; // f1 = fmov f2

131

132

// Arithmetic

133

// Add, Sub, Mul, Div.

134

def FpADD : FpI<(ops RFP:$dst, RFP:$src1, RFP:$src2), TwoArgFP,

135

[(set RFP:$dst, (fadd RFP:$src1, RFP:$src2))]>;

136

def FpSUB : FpI<(ops RFP:$dst, RFP:$src1, RFP:$src2), TwoArgFP,

137

[(set RFP:$dst, (fsub RFP:$src1, RFP:$src2))]>;

138

def FpMUL : FpI<(ops RFP:$dst, RFP:$src1, RFP:$src2), TwoArgFP,

139

[(set RFP:$dst, (fmul RFP:$src1, RFP:$src2))]>;

140

def FpDIV : FpI<(ops RFP:$dst, RFP:$src1, RFP:$src2), TwoArgFP,

141

[(set RFP:$dst, (fdiv RFP:$src1, RFP:$src2))]>;

142

143

// FPST0rInst - FPI in AddRegFrm form taking a single RST operand, combined
// with the D8 class (defined outside this chunk; presumably the 0xD8 opcode
// prefix - confirm against its definition).
class FPST0rInst<bits<8> o, string asm>

144

: FPI<o, AddRegFrm, (ops RST:$op), asm>, D8;

145

// FPrST0Inst - FPI in AddRegFrm form taking a single RST operand, combined
// with the DC class (defined outside this chunk; presumably the 0xDC opcode
// prefix - confirm against its definition).
class FPrST0Inst<bits<8> o, string asm>

146

: FPI<o, AddRegFrm, (ops RST:$op), asm>, DC;

147

// FPrST0PInst - FPI in AddRegFrm form taking a single RST operand, combined
// with the DE class (defined outside this chunk; presumably the 0xDE opcode
// prefix - confirm against its definition).
class FPrST0PInst<bits<8> o, string asm>

148

: FPI<o, AddRegFrm, (ops RST:$op), asm>, DE;

149

150

// Binary Ops with a memory source.

151

def FpADD32m : FpI<(ops RFP:$dst, RFP:$src1, f32mem:$src2), OneArgFPRW,

152

[(set RFP:$dst, (fadd RFP:$src1,

153

(extloadf64f32 addr:$src2)))]>;

154

// ST(0) = ST(0) + [mem32]

155

def FpADD64m : FpI<(ops RFP:$dst, RFP:$src1, f64mem:$src2), OneArgFPRW,

156

[(set RFP:$dst, (fadd RFP:$src1, (loadf64 addr:$src2)))]>;

157

// ST(0) = ST(0) + [mem64]

158

def FpMUL32m : FpI<(ops RFP:$dst, RFP:$src1, f32mem:$src2), OneArgFPRW,

159

[(set RFP:$dst, (fmul RFP:$src1,

160

(extloadf64f32 addr:$src2)))]>;

161

// ST(0) = ST(0) * [mem32]

162

def FpMUL64m : FpI<(ops RFP:$dst, RFP:$src1, f64mem:$src2), OneArgFPRW,

163

[(set RFP:$dst, (fmul RFP:$src1, (loadf64 addr:$src2)))]>;

164

// ST(0) = ST(0) * [mem64]

165

def FpSUB32m : FpI<(ops RFP:$dst, RFP:$src1, f32mem:$src2), OneArgFPRW,

166

[(set RFP:$dst, (fsub RFP:$src1,

167

(extloadf64f32 addr:$src2)))]>;

168

// ST(0) = ST(0) - [mem32]

169

def FpSUB64m : FpI<(ops RFP:$dst, RFP:$src1, f64mem:$src2), OneArgFPRW,

170

[(set RFP:$dst, (fsub RFP:$src1, (loadf64 addr:$src2)))]>;

171

// ST(0) = ST(0) - [mem64]

172

def FpSUBR32m : FpI<(ops RFP:$dst, RFP:$src1, f32mem:$src2), OneArgFPRW,

173

[(set RFP:$dst, (fsub (extloadf64f32 addr:$src2),

174

RFP:$src1))]>;

175

// ST(0) = [mem32] - ST(0)

176

def FpSUBR64m : FpI<(ops RFP:$dst, RFP:$src1, f64mem:$src2), OneArgFPRW,

177

[(set RFP:$dst, (fsub (loadf64 addr:$src2), RFP:$src1))]>;

178

// ST(0) = [mem64] - ST(0)

179

def FpDIV32m : FpI<(ops RFP:$dst, RFP:$src1, f32mem:$src2), OneArgFPRW,

180

[(set RFP:$dst, (fdiv RFP:$src1,

181

(extloadf64f32 addr:$src2)))]>;

182

// ST(0) = ST(0) / [mem32]

183

def FpDIV64m : FpI<(ops RFP:$dst, RFP:$src1, f64mem:$src2), OneArgFPRW,

184

[(set RFP:$dst, (fdiv RFP:$src1, (loadf64 addr:$src2)))]>;

185

// ST(0) = ST(0) / [mem64]

186

def FpDIVR32m : FpI<(ops RFP:$dst, RFP:$src1, f32mem:$src2), OneArgFPRW,

187

[(set RFP:$dst, (fdiv (extloadf64f32 addr:$src2),

188

RFP:$src1))]>;

189

// ST(0) = [mem32] / ST(0)

190

def FpDIVR64m : FpI<(ops RFP:$dst, RFP:$src1, f64mem:$src2), OneArgFPRW,

191

[(set RFP:$dst, (fdiv (loadf64 addr:$src2), RFP:$src1))]>;

192

// ST(0) = [mem64] / ST(0)

193

194

195

def FADD32m : FPI<0xD8, MRM0m, (ops f32mem:$src), "fadd{s} $src">;

196

def FADD64m : FPI<0xDC, MRM0m, (ops f64mem:$src), "fadd{l} $src">;

197

def FMUL32m : FPI<0xD8, MRM1m, (ops f32mem:$src), "fmul{s} $src">;

198

def FMUL64m : FPI<0xDC, MRM1m, (ops f64mem:$src), "fmul{l} $src">;

199

def FSUB32m : FPI<0xD8, MRM4m, (ops f32mem:$src), "fsub{s} $src">;

200

def FSUB64m : FPI<0xDC, MRM4m, (ops f64mem:$src), "fsub{l} $src">;

201

def FSUBR32m : FPI<0xD8, MRM5m, (ops f32mem:$src), "fsubr{s} $src">;

202

def FSUBR64m : FPI<0xDC, MRM5m, (ops f64mem:$src), "fsubr{l} $src">;

203

def FDIV32m : FPI<0xD8, MRM6m, (ops f32mem:$src), "fdiv{s} $src">;

204

def FDIV64m : FPI<0xDC, MRM6m, (ops f64mem:$src), "fdiv{l} $src">;

205

def FDIVR32m : FPI<0xD8, MRM7m, (ops f32mem:$src), "fdivr{s} $src">;

206

def FDIVR64m : FPI<0xDC, MRM7m, (ops f64mem:$src), "fdivr{l} $src">;

207

208

def FpIADD16m : FpI<(ops RFP:$dst, RFP:$src1, i16mem:$src2), OneArgFPRW,

209

[(set RFP:$dst, (fadd RFP:$src1,

210

(X86fild addr:$src2, i16)))]>;

211

// ST(0) = ST(0) + [mem16int]

212

def FpIADD32m : FpI<(ops RFP:$dst, RFP:$src1, i32mem:$src2), OneArgFPRW,

213

[(set RFP:$dst, (fadd RFP:$src1,

214

(X86fild addr:$src2, i32)))]>;

215

// ST(0) = ST(0) + [mem32int]

216

def FpIMUL16m : FpI<(ops RFP:$dst, RFP:$src1, i16mem:$src2), OneArgFPRW,

217

[(set RFP:$dst, (fmul RFP:$src1,

218

(X86fild addr:$src2, i16)))]>;

219

// ST(0) = ST(0) * [mem16int]

220

def FpIMUL32m : FpI<(ops RFP:$dst, RFP:$src1, i32mem:$src2), OneArgFPRW,

221

[(set RFP:$dst, (fmul RFP:$src1,

222

(X86fild addr:$src2, i32)))]>;

223

// ST(0) = ST(0) * [mem32int]

224

def FpISUB16m : FpI<(ops RFP:$dst, RFP:$src1, i16mem:$src2), OneArgFPRW,

225

[(set RFP:$dst, (fsub RFP:$src1,

226

(X86fild addr:$src2, i16)))]>;

227

// ST(0) = ST(0) - [mem16int]

228

def FpISUB32m : FpI<(ops RFP:$dst, RFP:$src1, i32mem:$src2), OneArgFPRW,

229

[(set RFP:$dst, (fsub RFP:$src1,

230

(X86fild addr:$src2, i32)))]>;

231

// ST(0) = ST(0) - [mem32int]

232

def FpISUBR16m : FpI<(ops RFP:$dst, RFP:$src1, i16mem:$src2), OneArgFPRW,

233

[(set RFP:$dst, (fsub (X86fild addr:$src2, i16),

234

RFP:$src1))]>;

235

// ST(0) = [mem16int] - ST(0)

236

def FpISUBR32m : FpI<(ops RFP:$dst, RFP:$src1, i32mem:$src2), OneArgFPRW,

237

[(set RFP:$dst, (fsub (X86fild addr:$src2, i32),

238

RFP:$src1))]>;

239

// ST(0) = [mem32int] - ST(0)

240

def FpIDIV16m : FpI<(ops RFP:$dst, RFP:$src1, i16mem:$src2), OneArgFPRW,

241

[(set RFP:$dst, (fdiv RFP:$src1,

242

(X86fild addr:$src2, i16)))]>;

243

// ST(0) = ST(0) / [mem16int]

244

def FpIDIV32m : FpI<(ops RFP:$dst, RFP:$src1, i32mem:$src2), OneArgFPRW,

245

[(set RFP:$dst, (fdiv RFP:$src1,

246

(X86fild addr:$src2, i32)))]>;

247

// ST(0) = ST(0) / [mem32int]

248

def FpIDIVR16m : FpI<(ops RFP:$dst, RFP:$src1, i16mem:$src2), OneArgFPRW,

249

[(set RFP:$dst, (fdiv (X86fild addr:$src2, i16),

250

RFP:$src1))]>;

251

// ST(0) = [mem16int] / ST(0)

252

def FpIDIVR32m : FpI<(ops RFP:$dst, RFP:$src1, i32mem:$src2), OneArgFPRW,

253

[(set RFP:$dst, (fdiv (X86fild addr:$src2, i32),

254

RFP:$src1))]>;

255

// ST(0) = [mem32int] / ST(0)

256

257

def FIADD16m : FPI<0xDE, MRM0m, (ops i16mem:$src), "fiadd{s} $src">;

258

def FIADD32m : FPI<0xDA, MRM0m, (ops i32mem:$src), "fiadd{l} $src">;

259

def FIMUL16m : FPI<0xDE, MRM1m, (ops i16mem:$src), "fimul{s} $src">;

260

def FIMUL32m : FPI<0xDA, MRM1m, (ops i32mem:$src), "fimul{l} $src">;

261

def FISUB16m : FPI<0xDE, MRM4m, (ops i16mem:$src), "fisub{s} $src">;

262

def FISUB32m : FPI<0xDA, MRM4m, (ops i32mem:$src), "fisub{l} $src">;

263

def FISUBR16m : FPI<0xDE, MRM5m, (ops i16mem:$src), "fisubr{s} $src">;

264

def FISUBR32m : FPI<0xDA, MRM5m, (ops i32mem:$src), "fisubr{l} $src">;

265

def FIDIV16m : FPI<0xDE, MRM6m, (ops i16mem:$src), "fidiv{s} $src">;

266

def FIDIV32m : FPI<0xDA, MRM6m, (ops i32mem:$src), "fidiv{l} $src">;

267

def FIDIVR16m : FPI<0xDE, MRM7m, (ops i16mem:$src), "fidivr{s} $src">;

268

def FIDIVR32m : FPI<0xDA, MRM7m, (ops i32mem:$src), "fidivr{l} $src">;

269

270

// NOTE: GAS and apparently all other AT&T style assemblers have a broken notion

271

// of some of the 'reverse' forms of the fsub and fdiv instructions. As such,

272

// we have to put some 'r's in and take them out of weird places.

273

def FADDST0r : FPST0rInst <0xC0, "fadd $op">;

274

def FADDrST0 : FPrST0Inst <0xC0, "fadd {%st(0), $op|$op, %ST(0)}">;

275

def FADDPrST0 : FPrST0PInst<0xC0, "faddp $op">;

276

def FSUBRST0r : FPST0rInst <0xE8, "fsubr $op">;

277

def FSUBrST0 : FPrST0Inst <0xE8, "fsub{r} {%st(0), $op|$op, %ST(0)}">;

278

def FSUBPrST0 : FPrST0PInst<0xE8, "fsub{r}p $op">;

279

def FSUBST0r : FPST0rInst <0xE0, "fsub $op">;

280

def FSUBRrST0 : FPrST0Inst <0xE0, "fsub{|r} {%st(0), $op|$op, %ST(0)}">;

281

def FSUBRPrST0 : FPrST0PInst<0xE0, "fsub{|r}p $op">;

282

def FMULST0r : FPST0rInst <0xC8, "fmul $op">;

283

def FMULrST0 : FPrST0Inst <0xC8, "fmul {%st(0), $op|$op, %ST(0)}">;

284

def FMULPrST0 : FPrST0PInst<0xC8, "fmulp $op">;

285

def FDIVRST0r : FPST0rInst <0xF8, "fdivr $op">;

286

def FDIVrST0 : FPrST0Inst <0xF8, "fdiv{r} {%st(0), $op|$op, %ST(0)}">;

287

def FDIVPrST0 : FPrST0PInst<0xF8, "fdiv{r}p $op">;

288

def FDIVST0r : FPST0rInst <0xF0, "fdiv $op">;

289

def FDIVRrST0 : FPrST0Inst <0xF0, "fdiv{|r} {%st(0), $op|$op, %ST(0)}">;

290

def FDIVRPrST0 : FPrST0PInst<0xF0, "fdiv{|r}p $op">;

// Unary operations.

def FpCHS : FpI<(ops RFP:$dst, RFP:$src), OneArgFPRW,

295

[(set RFP:$dst, (fneg RFP:$src))]>;

296

def FpABS : FpI<(ops RFP:$dst, RFP:$src), OneArgFPRW,

297

[(set RFP:$dst, (fabs RFP:$src))]>;

298

def FpSQRT : FpI<(ops RFP:$dst, RFP:$src), OneArgFPRW,

299

[(set RFP:$dst, (fsqrt RFP:$src))]>;

300

def FpSIN : FpI<(ops RFP:$dst, RFP:$src), OneArgFPRW,

301

[(set RFP:$dst, (fsin RFP:$src))]>;

302

def FpCOS : FpI<(ops RFP:$dst, RFP:$src), OneArgFPRW,

303

[(set RFP:$dst, (fcos RFP:$src))]>;

304

def FpTST : FpI<(ops RFP:$src), OneArgFP,

305

[]>;

306

307

// Emitted (FPI) forms of the unary operations: each uses RawFrm, has an empty
// operand list, and is combined with the D9 class.
def FCHS : FPI<0xE0, RawFrm, (ops), "fchs">, D9;

308

def FABS : FPI<0xE1, RawFrm, (ops), "fabs">, D9;

309

def FSQRT : FPI<0xFA, RawFrm, (ops), "fsqrt">, D9;

310

def FSIN : FPI<0xFE, RawFrm, (ops), "fsin">, D9;

311

def FCOS : FPI<0xFF, RawFrm, (ops), "fcos">, D9;

312

def FTST : FPI<0xE4, RawFrm, (ops), "ftst">, D9;

313

314

315

// Floating point cmovs.

316

let isTwoAddress = 1 in {

317

def FpCMOVB : FpI<(ops RFP:$dst, RFP:$src1, RFP:$src2), CondMovFP,

318