blob: 36ae14585bc0f02993c5350c6f7f6f2aa6038819 [file] [log] [blame]
Evan Chengffcb95b2006-02-21 19:13:53 +00001//====- X86InstrSSE.td - Describe the X86 Instruction Set -------*- C++ -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file was developed by the Evan Cheng and is distributed under
6// the University of Illinois Open Source License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This file describes the X86 SSE instruction set, defining the instructions,
11// and properties of the instructions which are needed for code generation,
12// machine code emission, and analysis.
13//
14//===----------------------------------------------------------------------===//
15
Evan Cheng4e4c71e2006-02-21 20:00:20 +000016//===----------------------------------------------------------------------===//
Evan Cheng2246f842006-03-18 01:23:20 +000017// SSE specific DAG Nodes.
18//===----------------------------------------------------------------------===//
19
Evan Chengb9df0ca2006-03-22 02:53:00 +000020def SDTX86Unpcklp : SDTypeProfile<1, 2,
21 [SDTCisSameAs<0, 1>, SDTCisSameAs<0, 2>]>;
22
23def X86loadp : SDNode<"X86ISD::LOAD_PACK", SDTLoad,
24 [SDNPHasChain]>;
25def X86fand : SDNode<"X86ISD::FAND", SDTFPBinOp,
26 [SDNPCommutative, SDNPAssociative]>;
27def X86fxor : SDNode<"X86ISD::FXOR", SDTFPBinOp,
28 [SDNPCommutative, SDNPAssociative]>;
29def X86s2vec : SDNode<"X86ISD::SCALAR_TO_VECTOR",
30 SDTypeProfile<1, 1, []>, []>;
31def X86unpcklp : SDNode<"X86ISD::UNPCKLP",
32 SDTX86Unpcklp, []>;
Evan Cheng2246f842006-03-18 01:23:20 +000033
34//===----------------------------------------------------------------------===//
Evan Cheng06a8aa12006-03-17 19:55:52 +000035// SSE pattern fragments
36//===----------------------------------------------------------------------===//
37
38def X86loadpf32 : PatFrag<(ops node:$ptr), (f32 (X86loadp node:$ptr))>;
39def X86loadpf64 : PatFrag<(ops node:$ptr), (f64 (X86loadp node:$ptr))>;
40
Evan Cheng2246f842006-03-18 01:23:20 +000041def loadv4f32 : PatFrag<(ops node:$ptr), (v4f32 (load node:$ptr))>;
42def loadv2f64 : PatFrag<(ops node:$ptr), (v2f64 (load node:$ptr))>;
Evan Cheng24dc1f52006-03-23 07:44:07 +000043def loadv16i8 : PatFrag<(ops node:$ptr), (v16i8 (load node:$ptr))>;
44def loadv8i16 : PatFrag<(ops node:$ptr), (v8i16 (load node:$ptr))>;
45def loadv4i32 : PatFrag<(ops node:$ptr), (v4i32 (load node:$ptr))>;
46def loadv2i64 : PatFrag<(ops node:$ptr), (v2i64 (load node:$ptr))>;
Evan Cheng06a8aa12006-03-17 19:55:52 +000047
Evan Cheng386031a2006-03-24 07:29:27 +000048def fp32imm0 : PatLeaf<(f32 fpimm), [{
49 return N->isExactlyValue(+0.0);
50}]>;
51
52def vecimm0 : PatLeaf<(build_vector), [{
53 return X86::isZeroVector(N);
54}]>;
55
Evan Cheng63d33002006-03-22 08:01:21 +000056// SHUFFLE_get_shuf_imm xform function: convert vector_shuffle mask to PSHUF*,
57// SHUFP* etc. imm.
58def SHUFFLE_get_shuf_imm : SDNodeXForm<build_vector, [{
59 return getI8Imm(X86::getShuffleSHUFImmediate(N));
Evan Chengb9df0ca2006-03-22 02:53:00 +000060}]>;
61
Evan Cheng63d33002006-03-22 08:01:21 +000062def SHUFP_splat_mask : PatLeaf<(build_vector), [{
63 return X86::isSplatMask(N);
64}], SHUFFLE_get_shuf_imm>;
65
Evan Cheng1bffadd2006-03-22 19:16:21 +000066def MOVLHPS_splat_mask : PatLeaf<(build_vector), [{
Evan Cheng0188ecb2006-03-22 18:59:22 +000067 return X86::isSplatMask(N);
68}]>;
69
Evan Cheng2c0dbd02006-03-24 02:58:06 +000070def MOVLHPSorUNPCKLPD_shuffle_mask : PatLeaf<(build_vector), [{
71 return X86::isMOVLHPSorUNPCKLPDMask(N);
72}], SHUFFLE_get_shuf_imm>;
73
74def MOVHLPS_shuffle_mask : PatLeaf<(build_vector), [{
75 return X86::isMOVHLPSMask(N);
76}], SHUFFLE_get_shuf_imm>;
77
78def UNPCKHPD_shuffle_mask : PatLeaf<(build_vector), [{
79 return X86::isUNPCKHPDMask(N);
80}], SHUFFLE_get_shuf_imm>;
81
Evan Cheng0188ecb2006-03-22 18:59:22 +000082// Only use PSHUF if it is not a splat.
83def PSHUFD_shuffle_mask : PatLeaf<(build_vector), [{
84 return !X86::isSplatMask(N) && X86::isPSHUFDMask(N);
Evan Cheng14aed5e2006-03-24 01:18:28 +000085}], SHUFFLE_get_shuf_imm>;
Evan Cheng0188ecb2006-03-22 18:59:22 +000086
Evan Cheng14aed5e2006-03-24 01:18:28 +000087def SHUFP_shuffle_mask : PatLeaf<(build_vector), [{
88 return X86::isSHUFPMask(N);
89}], SHUFFLE_get_shuf_imm>;
Evan Chengb9df0ca2006-03-22 02:53:00 +000090
Evan Cheng06a8aa12006-03-17 19:55:52 +000091//===----------------------------------------------------------------------===//
Evan Cheng4e4c71e2006-02-21 20:00:20 +000092// SSE scalar FP Instructions
93//===----------------------------------------------------------------------===//
94
Evan Cheng470a6ad2006-02-22 02:26:30 +000095// Instruction templates
96// SSI - SSE1 instructions with XS prefix.
97// SDI - SSE2 instructions with XD prefix.
98// PSI - SSE1 instructions with TB prefix.
99// PDI - SSE2 instructions with TB and OpSize prefixes.
Evan Cheng2da953f2006-03-22 07:10:28 +0000100// PSIi8 - SSE1 instructions with ImmT == Imm8 and TB prefix.
101// PDIi8 - SSE2 instructions with ImmT == Imm8 and TB and OpSize prefixes.
Evan Cheng470a6ad2006-02-22 02:26:30 +0000102class SSI<bits<8> o, Format F, dag ops, string asm, list<dag> pattern>
103 : I<o, F, ops, asm, pattern>, XS, Requires<[HasSSE1]>;
104class SDI<bits<8> o, Format F, dag ops, string asm, list<dag> pattern>
105 : I<o, F, ops, asm, pattern>, XD, Requires<[HasSSE2]>;
106class PSI<bits<8> o, Format F, dag ops, string asm, list<dag> pattern>
107 : I<o, F, ops, asm, pattern>, TB, Requires<[HasSSE1]>;
108class PDI<bits<8> o, Format F, dag ops, string asm, list<dag> pattern>
109 : I<o, F, ops, asm, pattern>, TB, OpSize, Requires<[HasSSE2]>;
Evan Cheng2da953f2006-03-22 07:10:28 +0000110class PSIi8<bits<8> o, Format F, dag ops, string asm, list<dag> pattern>
111 : X86Inst<o, F, Imm8, ops, asm>, TB, Requires<[HasSSE1]> {
112 let Pattern = pattern;
113}
114class PDIi8<bits<8> o, Format F, dag ops, string asm, list<dag> pattern>
115 : X86Inst<o, F, Imm8, ops, asm>, TB, OpSize, Requires<[HasSSE2]> {
116 let Pattern = pattern;
117}
Evan Cheng470a6ad2006-02-22 02:26:30 +0000118
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000119// Some 'special' instructions
120def IMPLICIT_DEF_FR32 : I<0, Pseudo, (ops FR32:$dst),
121 "#IMPLICIT_DEF $dst",
122 [(set FR32:$dst, (undef))]>, Requires<[HasSSE2]>;
123def IMPLICIT_DEF_FR64 : I<0, Pseudo, (ops FR64:$dst),
124 "#IMPLICIT_DEF $dst",
125 [(set FR64:$dst, (undef))]>, Requires<[HasSSE2]>;
126
127// CMOV* - Used to implement the SSE SELECT DAG operation. Expanded by the
128// scheduler into a branch sequence.
129let usesCustomDAGSchedInserter = 1 in { // Expanded by the scheduler.
130 def CMOV_FR32 : I<0, Pseudo,
131 (ops FR32:$dst, FR32:$t, FR32:$f, i8imm:$cond),
132 "#CMOV_FR32 PSEUDO!",
133 [(set FR32:$dst, (X86cmov FR32:$t, FR32:$f, imm:$cond))]>;
134 def CMOV_FR64 : I<0, Pseudo,
135 (ops FR64:$dst, FR64:$t, FR64:$f, i8imm:$cond),
136 "#CMOV_FR64 PSEUDO!",
137 [(set FR64:$dst, (X86cmov FR64:$t, FR64:$f, imm:$cond))]>;
138}
139
140// Move Instructions
Evan Cheng470a6ad2006-02-22 02:26:30 +0000141def MOVSSrr : SSI<0x10, MRMSrcReg, (ops FR32:$dst, FR32:$src),
142 "movss {$src, $dst|$dst, $src}", []>;
143def MOVSSrm : SSI<0x10, MRMSrcMem, (ops FR32:$dst, f32mem:$src),
144 "movss {$src, $dst|$dst, $src}",
145 [(set FR32:$dst, (loadf32 addr:$src))]>;
146def MOVSDrr : SDI<0x10, MRMSrcReg, (ops FR64:$dst, FR64:$src),
147 "movsd {$src, $dst|$dst, $src}", []>;
148def MOVSDrm : SDI<0x10, MRMSrcMem, (ops FR64:$dst, f64mem:$src),
149 "movsd {$src, $dst|$dst, $src}",
150 [(set FR64:$dst, (loadf64 addr:$src))]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000151
Evan Cheng470a6ad2006-02-22 02:26:30 +0000152def MOVSSmr : SSI<0x11, MRMDestMem, (ops f32mem:$dst, FR32:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000153 "movss {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000154 [(store FR32:$src, addr:$dst)]>;
155def MOVSDmr : SDI<0x11, MRMDestMem, (ops f64mem:$dst, FR64:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000156 "movsd {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000157 [(store FR64:$src, addr:$dst)]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000158
159// Conversion instructions
Evan Cheng470a6ad2006-02-22 02:26:30 +0000160def CVTTSS2SIrr: SSI<0x2C, MRMSrcReg, (ops R32:$dst, FR32:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000161 "cvttss2si {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000162 [(set R32:$dst, (fp_to_sint FR32:$src))]>;
163def CVTTSS2SIrm: SSI<0x2C, MRMSrcMem, (ops R32:$dst, f32mem:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000164 "cvttss2si {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000165 [(set R32:$dst, (fp_to_sint (loadf32 addr:$src)))]>;
166def CVTTSD2SIrr: SDI<0x2C, MRMSrcReg, (ops R32:$dst, FR64:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000167 "cvttsd2si {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000168 [(set R32:$dst, (fp_to_sint FR64:$src))]>;
169def CVTTSD2SIrm: SDI<0x2C, MRMSrcMem, (ops R32:$dst, f64mem:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000170 "cvttsd2si {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000171 [(set R32:$dst, (fp_to_sint (loadf64 addr:$src)))]>;
172def CVTSD2SSrr: SDI<0x5A, MRMSrcReg, (ops FR32:$dst, FR64:$src),
173 "cvtsd2ss {$src, $dst|$dst, $src}",
174 [(set FR32:$dst, (fround FR64:$src))]>;
175def CVTSD2SSrm: SDI<0x5A, MRMSrcMem, (ops FR32:$dst, f64mem:$src),
176 "cvtsd2ss {$src, $dst|$dst, $src}",
177 [(set FR32:$dst, (fround (loadf64 addr:$src)))]>;
178def CVTSI2SSrr: SSI<0x2A, MRMSrcReg, (ops FR32:$dst, R32:$src),
179 "cvtsi2ss {$src, $dst|$dst, $src}",
180 [(set FR32:$dst, (sint_to_fp R32:$src))]>;
181def CVTSI2SSrm: SSI<0x2A, MRMSrcMem, (ops FR32:$dst, i32mem:$src),
182 "cvtsi2ss {$src, $dst|$dst, $src}",
183 [(set FR32:$dst, (sint_to_fp (loadi32 addr:$src)))]>;
184def CVTSI2SDrr: SDI<0x2A, MRMSrcReg, (ops FR64:$dst, R32:$src),
185 "cvtsi2sd {$src, $dst|$dst, $src}",
186 [(set FR64:$dst, (sint_to_fp R32:$src))]>;
187def CVTSI2SDrm: SDI<0x2A, MRMSrcMem, (ops FR64:$dst, i32mem:$src),
188 "cvtsi2sd {$src, $dst|$dst, $src}",
189 [(set FR64:$dst, (sint_to_fp (loadi32 addr:$src)))]>;
190// SSE2 instructions with XS prefix
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000191def CVTSS2SDrr: I<0x5A, MRMSrcReg, (ops FR64:$dst, FR32:$src),
192 "cvtss2sd {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000193 [(set FR64:$dst, (fextend FR32:$src))]>, XS,
194 Requires<[HasSSE2]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000195def CVTSS2SDrm: I<0x5A, MRMSrcMem, (ops FR64:$dst, f32mem:$src),
196 "cvtss2sd {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000197 [(set FR64:$dst, (fextend (loadf32 addr:$src)))]>, XS,
198 Requires<[HasSSE2]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000199
200// Arithmetic instructions
201let isTwoAddress = 1 in {
202let isCommutable = 1 in {
Evan Cheng470a6ad2006-02-22 02:26:30 +0000203def ADDSSrr : SSI<0x58, MRMSrcReg, (ops FR32:$dst, FR32:$src1, FR32:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000204 "addss {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000205 [(set FR32:$dst, (fadd FR32:$src1, FR32:$src2))]>;
206def ADDSDrr : SDI<0x58, MRMSrcReg, (ops FR64:$dst, FR64:$src1, FR64:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000207 "addsd {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000208 [(set FR64:$dst, (fadd FR64:$src1, FR64:$src2))]>;
209def MULSSrr : SSI<0x59, MRMSrcReg, (ops FR32:$dst, FR32:$src1, FR32:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000210 "mulss {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000211 [(set FR32:$dst, (fmul FR32:$src1, FR32:$src2))]>;
212def MULSDrr : SDI<0x59, MRMSrcReg, (ops FR64:$dst, FR64:$src1, FR64:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000213 "mulsd {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000214 [(set FR64:$dst, (fmul FR64:$src1, FR64:$src2))]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000215}
216
Evan Cheng470a6ad2006-02-22 02:26:30 +0000217def ADDSSrm : SSI<0x58, MRMSrcMem, (ops FR32:$dst, FR32:$src1, f32mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000218 "addss {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000219 [(set FR32:$dst, (fadd FR32:$src1, (loadf32 addr:$src2)))]>;
220def ADDSDrm : SDI<0x58, MRMSrcMem, (ops FR64:$dst, FR64:$src1, f64mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000221 "addsd {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000222 [(set FR64:$dst, (fadd FR64:$src1, (loadf64 addr:$src2)))]>;
223def MULSSrm : SSI<0x59, MRMSrcMem, (ops FR32:$dst, FR32:$src1, f32mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000224 "mulss {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000225 [(set FR32:$dst, (fmul FR32:$src1, (loadf32 addr:$src2)))]>;
226def MULSDrm : SDI<0x59, MRMSrcMem, (ops FR64:$dst, FR64:$src1, f64mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000227 "mulsd {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000228 [(set FR64:$dst, (fmul FR64:$src1, (loadf64 addr:$src2)))]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000229
Evan Cheng470a6ad2006-02-22 02:26:30 +0000230def DIVSSrr : SSI<0x5E, MRMSrcReg, (ops FR32:$dst, FR32:$src1, FR32:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000231 "divss {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000232 [(set FR32:$dst, (fdiv FR32:$src1, FR32:$src2))]>;
233def DIVSSrm : SSI<0x5E, MRMSrcMem, (ops FR32:$dst, FR32:$src1, f32mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000234 "divss {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000235 [(set FR32:$dst, (fdiv FR32:$src1, (loadf32 addr:$src2)))]>;
236def DIVSDrr : SDI<0x5E, MRMSrcReg, (ops FR64:$dst, FR64:$src1, FR64:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000237 "divsd {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000238 [(set FR64:$dst, (fdiv FR64:$src1, FR64:$src2))]>;
239def DIVSDrm : SDI<0x5E, MRMSrcMem, (ops FR64:$dst, FR64:$src1, f64mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000240 "divsd {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000241 [(set FR64:$dst, (fdiv FR64:$src1, (loadf64 addr:$src2)))]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000242
Evan Cheng470a6ad2006-02-22 02:26:30 +0000243def SUBSSrr : SSI<0x5C, MRMSrcReg, (ops FR32:$dst, FR32:$src1, FR32:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000244 "subss {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000245 [(set FR32:$dst, (fsub FR32:$src1, FR32:$src2))]>;
246def SUBSSrm : SSI<0x5C, MRMSrcMem, (ops FR32:$dst, FR32:$src1, f32mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000247 "subss {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000248 [(set FR32:$dst, (fsub FR32:$src1, (loadf32 addr:$src2)))]>;
249def SUBSDrr : SDI<0x5C, MRMSrcReg, (ops FR64:$dst, FR64:$src1, FR64:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000250 "subsd {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000251 [(set FR64:$dst, (fsub FR64:$src1, FR64:$src2))]>;
252def SUBSDrm : SDI<0x5C, MRMSrcMem, (ops FR64:$dst, FR64:$src1, f64mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000253 "subsd {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000254 [(set FR64:$dst, (fsub FR64:$src1, (loadf64 addr:$src2)))]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000255}
256
Evan Cheng470a6ad2006-02-22 02:26:30 +0000257def SQRTSSrr : SSI<0x51, MRMSrcReg, (ops FR32:$dst, FR32:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000258 "sqrtss {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000259 [(set FR32:$dst, (fsqrt FR32:$src))]>;
260def SQRTSSrm : SSI<0x51, MRMSrcMem, (ops FR32:$dst, f32mem:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000261 "sqrtss {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000262 [(set FR32:$dst, (fsqrt (loadf32 addr:$src)))]>;
263def SQRTSDrr : SDI<0x51, MRMSrcReg, (ops FR64:$dst, FR64:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000264 "sqrtsd {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000265 [(set FR64:$dst, (fsqrt FR64:$src))]>;
266def SQRTSDrm : SDI<0x51, MRMSrcMem, (ops FR64:$dst, f64mem:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000267 "sqrtsd {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000268 [(set FR64:$dst, (fsqrt (loadf64 addr:$src)))]>;
269
270def RSQRTSSrr : SSI<0x52, MRMSrcReg, (ops FR32:$dst, FR32:$src),
271 "rsqrtss {$src, $dst|$dst, $src}", []>;
272def RSQRTSSrm : SSI<0x52, MRMSrcMem, (ops FR32:$dst, f32mem:$src),
273 "rsqrtss {$src, $dst|$dst, $src}", []>;
274def RCPSSrr : SSI<0x53, MRMSrcReg, (ops FR32:$dst, FR32:$src),
275 "rcpss {$src, $dst|$dst, $src}", []>;
276def RCPSSrm : SSI<0x53, MRMSrcMem, (ops FR32:$dst, f32mem:$src),
277 "rcpss {$src, $dst|$dst, $src}", []>;
278
279def MAXSSrr : SSI<0x5F, MRMSrcReg, (ops FR32:$dst, FR32:$src),
280 "maxss {$src, $dst|$dst, $src}", []>;
281def MAXSSrm : SSI<0x5F, MRMSrcMem, (ops FR32:$dst, f32mem:$src),
282 "maxss {$src, $dst|$dst, $src}", []>;
283def MAXSDrr : SDI<0x5F, MRMSrcReg, (ops FR64:$dst, FR64:$src),
284 "maxsd {$src, $dst|$dst, $src}", []>;
285def MAXSDrm : SDI<0x5F, MRMSrcMem, (ops FR64:$dst, f64mem:$src),
286 "maxsd {$src, $dst|$dst, $src}", []>;
287def MINSSrr : SSI<0x5D, MRMSrcReg, (ops FR32:$dst, FR32:$src),
288 "minss {$src, $dst|$dst, $src}", []>;
289def MINSSrm : SSI<0x5D, MRMSrcMem, (ops FR32:$dst, f32mem:$src),
290 "minss {$src, $dst|$dst, $src}", []>;
291def MINSDrr : SDI<0x5D, MRMSrcReg, (ops FR64:$dst, FR64:$src),
292 "minsd {$src, $dst|$dst, $src}", []>;
293def MINSDrm : SDI<0x5D, MRMSrcMem, (ops FR64:$dst, f64mem:$src),
294 "minsd {$src, $dst|$dst, $src}", []>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000295
296// Comparison instructions
297let isTwoAddress = 1 in {
Evan Cheng470a6ad2006-02-22 02:26:30 +0000298def CMPSSrr : SSI<0xC2, MRMSrcReg,
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000299 (ops FR32:$dst, FR32:$src1, FR32:$src, SSECC:$cc),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000300 "cmp${cc}ss {$src, $dst|$dst, $src}", []>;
301def CMPSSrm : SSI<0xC2, MRMSrcMem,
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000302 (ops FR32:$dst, FR32:$src1, f32mem:$src, SSECC:$cc),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000303 "cmp${cc}ss {$src, $dst|$dst, $src}", []>;
304def CMPSDrr : SDI<0xC2, MRMSrcReg,
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000305 (ops FR64:$dst, FR64:$src1, FR64:$src, SSECC:$cc),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000306 "cmp${cc}sd {$src, $dst|$dst, $src}", []>;
307def CMPSDrm : SDI<0xC2, MRMSrcMem,
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000308 (ops FR64:$dst, FR64:$src1, f64mem:$src, SSECC:$cc),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000309 "cmp${cc}sd {$src, $dst|$dst, $src}", []>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000310}
311
Evan Cheng470a6ad2006-02-22 02:26:30 +0000312def UCOMISSrr: PSI<0x2E, MRMSrcReg, (ops FR32:$src1, FR32:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000313 "ucomiss {$src2, $src1|$src1, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000314 [(X86cmp FR32:$src1, FR32:$src2)]>;
315def UCOMISSrm: PSI<0x2E, MRMSrcMem, (ops FR32:$src1, f32mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000316 "ucomiss {$src2, $src1|$src1, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000317 [(X86cmp FR32:$src1, (loadf32 addr:$src2))]>;
318def UCOMISDrr: PDI<0x2E, MRMSrcReg, (ops FR64:$src1, FR64:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000319 "ucomisd {$src2, $src1|$src1, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000320 [(X86cmp FR64:$src1, FR64:$src2)]>;
321def UCOMISDrm: PDI<0x2E, MRMSrcMem, (ops FR64:$src1, f64mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000322 "ucomisd {$src2, $src1|$src1, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000323 [(X86cmp FR64:$src1, (loadf64 addr:$src2))]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000324
325// Aliases of packed instructions for scalar use. These all have names that
326// start with 'Fs'.
327
328// Alias instructions that map fld0 to pxor for sse.
329// FIXME: remove when we can teach regalloc that xor reg, reg is ok.
330def FsFLD0SS : I<0xEF, MRMInitReg, (ops FR32:$dst),
331 "pxor $dst, $dst", [(set FR32:$dst, fp32imm0)]>,
332 Requires<[HasSSE1]>, TB, OpSize;
333def FsFLD0SD : I<0xEF, MRMInitReg, (ops FR64:$dst),
334 "pxor $dst, $dst", [(set FR64:$dst, fp64imm0)]>,
335 Requires<[HasSSE2]>, TB, OpSize;
336
337// Alias instructions to do FR32 / FR64 reg-to-reg copy using movaps / movapd.
338// Upper bits are disregarded.
Evan Cheng470a6ad2006-02-22 02:26:30 +0000339def FsMOVAPSrr : PSI<0x28, MRMSrcReg, (ops FR32:$dst, FR32:$src),
340 "movaps {$src, $dst|$dst, $src}", []>;
341def FsMOVAPDrr : PDI<0x28, MRMSrcReg, (ops FR64:$dst, FR64:$src),
342 "movapd {$src, $dst|$dst, $src}", []>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000343
344// Alias instructions to load FR32 / FR64 from f128mem using movaps / movapd.
345// Upper bits are disregarded.
Evan Cheng470a6ad2006-02-22 02:26:30 +0000346def FsMOVAPSrm : PSI<0x28, MRMSrcMem, (ops FR32:$dst, f128mem:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000347 "movaps {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000348 [(set FR32:$dst, (X86loadpf32 addr:$src))]>;
349def FsMOVAPDrm : PDI<0x28, MRMSrcMem, (ops FR64:$dst, f128mem:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000350 "movapd {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000351 [(set FR64:$dst, (X86loadpf64 addr:$src))]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000352
353// Alias bitwise logical operations using SSE logical ops on packed FP values.
354let isTwoAddress = 1 in {
355let isCommutable = 1 in {
Evan Cheng470a6ad2006-02-22 02:26:30 +0000356def FsANDPSrr : PSI<0x54, MRMSrcReg, (ops FR32:$dst, FR32:$src1, FR32:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000357 "andps {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000358 [(set FR32:$dst, (X86fand FR32:$src1, FR32:$src2))]>;
359def FsANDPDrr : PDI<0x54, MRMSrcReg, (ops FR64:$dst, FR64:$src1, FR64:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000360 "andpd {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000361 [(set FR64:$dst, (X86fand FR64:$src1, FR64:$src2))]>;
362def FsORPSrr : PSI<0x56, MRMSrcReg, (ops FR32:$dst, FR32:$src1, FR32:$src2),
363 "orps {$src2, $dst|$dst, $src2}", []>;
364def FsORPDrr : PDI<0x56, MRMSrcReg, (ops FR64:$dst, FR64:$src1, FR64:$src2),
365 "orpd {$src2, $dst|$dst, $src2}", []>;
366def FsXORPSrr : PSI<0x57, MRMSrcReg, (ops FR32:$dst, FR32:$src1, FR32:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000367 "xorps {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000368 [(set FR32:$dst, (X86fxor FR32:$src1, FR32:$src2))]>;
369def FsXORPDrr : PDI<0x57, MRMSrcReg, (ops FR64:$dst, FR64:$src1, FR64:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000370 "xorpd {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000371 [(set FR64:$dst, (X86fxor FR64:$src1, FR64:$src2))]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000372}
Evan Cheng470a6ad2006-02-22 02:26:30 +0000373def FsANDPSrm : PSI<0x54, MRMSrcMem, (ops FR32:$dst, FR32:$src1, f128mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000374 "andps {$src2, $dst|$dst, $src2}",
375 [(set FR32:$dst, (X86fand FR32:$src1,
Evan Cheng470a6ad2006-02-22 02:26:30 +0000376 (X86loadpf32 addr:$src2)))]>;
377def FsANDPDrm : PDI<0x54, MRMSrcMem, (ops FR64:$dst, FR64:$src1, f128mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000378 "andpd {$src2, $dst|$dst, $src2}",
379 [(set FR64:$dst, (X86fand FR64:$src1,
Evan Cheng470a6ad2006-02-22 02:26:30 +0000380 (X86loadpf64 addr:$src2)))]>;
381def FsORPSrm : PSI<0x56, MRMSrcMem, (ops FR32:$dst, FR32:$src1, f128mem:$src2),
382 "orps {$src2, $dst|$dst, $src2}", []>;
383def FsORPDrm : PDI<0x56, MRMSrcMem, (ops FR64:$dst, FR64:$src1, f128mem:$src2),
384 "orpd {$src2, $dst|$dst, $src2}", []>;
385def FsXORPSrm : PSI<0x57, MRMSrcMem, (ops FR32:$dst, FR32:$src1, f128mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000386 "xorps {$src2, $dst|$dst, $src2}",
387 [(set FR32:$dst, (X86fxor FR32:$src1,
Evan Cheng470a6ad2006-02-22 02:26:30 +0000388 (X86loadpf32 addr:$src2)))]>;
389def FsXORPDrm : PDI<0x57, MRMSrcMem, (ops FR64:$dst, FR64:$src1, f128mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000390 "xorpd {$src2, $dst|$dst, $src2}",
391 [(set FR64:$dst, (X86fxor FR64:$src1,
Evan Cheng470a6ad2006-02-22 02:26:30 +0000392 (X86loadpf64 addr:$src2)))]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000393
Evan Cheng470a6ad2006-02-22 02:26:30 +0000394def FsANDNPSrr : PSI<0x55, MRMSrcReg, (ops FR32:$dst, FR32:$src1, FR32:$src2),
395 "andnps {$src2, $dst|$dst, $src2}", []>;
396def FsANDNPSrm : PSI<0x55, MRMSrcMem, (ops FR32:$dst, FR32:$src1, f128mem:$src2),
397 "andnps {$src2, $dst|$dst, $src2}", []>;
398def FsANDNPDrr : PDI<0x55, MRMSrcReg, (ops FR64:$dst, FR64:$src1, FR64:$src2),
399 "andnpd {$src2, $dst|$dst, $src2}", []>;
400def FsANDNPDrm : PDI<0x55, MRMSrcMem, (ops FR64:$dst, FR64:$src1, f128mem:$src2),
401 "andnpd {$src2, $dst|$dst, $src2}", []>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000402}
403
404//===----------------------------------------------------------------------===//
405// SSE packed FP Instructions
406//===----------------------------------------------------------------------===//
407
Evan Chengc12e6c42006-03-19 09:38:54 +0000408// Some 'special' instructions
409def IMPLICIT_DEF_VR128 : I<0, Pseudo, (ops VR128:$dst),
410 "#IMPLICIT_DEF $dst",
411 [(set VR128:$dst, (v4f32 (undef)))]>,
412 Requires<[HasSSE1]>;
413
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000414// Move Instructions
Evan Cheng2246f842006-03-18 01:23:20 +0000415def MOVAPSrr : PSI<0x28, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000416 "movaps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000417def MOVAPSrm : PSI<0x28, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000418 "movaps {$src, $dst|$dst, $src}",
Evan Cheng2246f842006-03-18 01:23:20 +0000419 [(set VR128:$dst, (loadv4f32 addr:$src))]>;
420def MOVAPDrr : PDI<0x28, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000421 "movapd {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000422def MOVAPDrm : PDI<0x28, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000423 "movapd {$src, $dst|$dst, $src}",
Evan Cheng2246f842006-03-18 01:23:20 +0000424 [(set VR128:$dst, (loadv2f64 addr:$src))]>;
Evan Chengffcb95b2006-02-21 19:13:53 +0000425
Evan Cheng2246f842006-03-18 01:23:20 +0000426def MOVAPSmr : PSI<0x29, MRMDestMem, (ops f128mem:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000427 "movaps {$src, $dst|$dst, $src}",
Evan Cheng2246f842006-03-18 01:23:20 +0000428 [(store (v4f32 VR128:$src), addr:$dst)]>;
429def MOVAPDmr : PDI<0x29, MRMDestMem, (ops f128mem:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000430 "movapd {$src, $dst|$dst, $src}",
Evan Cheng2246f842006-03-18 01:23:20 +0000431 [(store (v2f64 VR128:$src), addr:$dst)]>;
Evan Cheng470a6ad2006-02-22 02:26:30 +0000432
Evan Cheng2246f842006-03-18 01:23:20 +0000433def MOVUPSrr : PSI<0x10, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000434 "movups {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000435def MOVUPSrm : PSI<0x10, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000436 "movups {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000437def MOVUPSmr : PSI<0x11, MRMDestMem, (ops f128mem:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000438 "movups {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000439def MOVUPDrr : PDI<0x10, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000440 "movupd {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000441def MOVUPDrm : PDI<0x10, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000442 "movupd {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000443def MOVUPDmr : PDI<0x11, MRMDestMem, (ops f128mem:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000444 "movupd {$src, $dst|$dst, $src}", []>;
445
Evan Cheng2246f842006-03-18 01:23:20 +0000446def MOVLPSrm : PSI<0x12, MRMSrcMem, (ops VR128:$dst, f64mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000447 "movlps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000448def MOVLPSmr : PSI<0x13, MRMDestMem, (ops f64mem:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000449 "movlps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000450def MOVLPDrm : PDI<0x12, MRMSrcMem, (ops VR128:$dst, f64mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000451 "movlpd {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000452def MOVLPDmr : PDI<0x13, MRMDestMem, (ops f64mem:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000453 "movlpd {$src, $dst|$dst, $src}", []>;
454
Evan Cheng2246f842006-03-18 01:23:20 +0000455def MOVHPSrm : PSI<0x16, MRMSrcMem, (ops VR128:$dst, f64mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000456 "movhps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000457def MOVHPSmr : PSI<0x17, MRMDestMem, (ops f64mem:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000458 "movhps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000459def MOVHPDrm : PDI<0x16, MRMSrcMem, (ops VR128:$dst, f64mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000460 "movhpd {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000461def MOVHPDmr : PDI<0x17, MRMDestMem, (ops f64mem:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000462 "movhpd {$src, $dst|$dst, $src}", []>;
463
Evan Cheng14aed5e2006-03-24 01:18:28 +0000464let isTwoAddress = 1 in {
465def MOVLHPSrr : PSI<0x16, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
466 "movlhps {$src2, $dst|$dst, $src2}", []>;
Evan Cheng2c0dbd02006-03-24 02:58:06 +0000467
Evan Cheng14aed5e2006-03-24 01:18:28 +0000468def MOVHLPSrr : PSI<0x12, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
469 "movlhps {$src2, $dst|$dst, $src2}", []>;
470}
Evan Cheng470a6ad2006-02-22 02:26:30 +0000471
Evan Cheng2246f842006-03-18 01:23:20 +0000472def MOVMSKPSrr : PSI<0x50, MRMSrcReg, (ops R32:$dst, VR128:$src),
Chris Lattnerac53ead2006-03-24 21:49:18 +0000473 "movmskps {$src, $dst|$dst, $src}",
474 [(set R32:$dst, (int_x86_sse_movmskps VR128:$src))]>;
Evan Cheng2246f842006-03-18 01:23:20 +0000475def MOVMSKPDrr : PSI<0x50, MRMSrcReg, (ops R32:$dst, VR128:$src),
Chris Lattnerac53ead2006-03-24 21:49:18 +0000476 "movmskpd {$src, $dst|$dst, $src}",
477 [(set R32:$dst, (int_x86_sse2_movmskpd VR128:$src))]>;
Evan Cheng470a6ad2006-02-22 02:26:30 +0000478
479// Conversion instructions
Evan Cheng2246f842006-03-18 01:23:20 +0000480def CVTPI2PSrr : PSI<0x2A, MRMSrcReg, (ops VR128:$dst, VR64:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000481 "cvtpi2ps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000482def CVTPI2PSrm : PSI<0x2A, MRMSrcMem, (ops VR128:$dst, i64mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000483 "cvtpi2ps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000484def CVTPI2PDrr : PDI<0x2A, MRMSrcReg, (ops VR128:$dst, VR64:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000485 "cvtpi2pd {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000486def CVTPI2PDrm : PDI<0x2A, MRMSrcMem, (ops VR128:$dst, i64mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000487 "cvtpi2pd {$src, $dst|$dst, $src}", []>;
488
489// SSE2 instructions without OpSize prefix
Evan Cheng2246f842006-03-18 01:23:20 +0000490def CVTDQ2PSrr : I<0x5B, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000491 "cvtdq2ps {$src, $dst|$dst, $src}", []>, TB,
492 Requires<[HasSSE2]>;
Evan Cheng2246f842006-03-18 01:23:20 +0000493def CVTDQ2PSrm : I<0x5B, MRMSrcMem, (ops VR128:$dst, i128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000494 "cvtdq2ps {$src, $dst|$dst, $src}", []>, TB,
495 Requires<[HasSSE2]>;
496
497// SSE2 instructions with XS prefix
Evan Cheng2246f842006-03-18 01:23:20 +0000498def CVTDQ2PDrr : I<0xE6, MRMSrcReg, (ops VR128:$dst, VR64:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000499 "cvtdq2pd {$src, $dst|$dst, $src}", []>,
500 XS, Requires<[HasSSE2]>;
Evan Cheng2246f842006-03-18 01:23:20 +0000501def CVTDQ2PDrm : I<0xE6, MRMSrcMem, (ops VR128:$dst, i64mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000502 "cvtdq2pd {$src, $dst|$dst, $src}", []>,
503 XS, Requires<[HasSSE2]>;
504
Evan Cheng2246f842006-03-18 01:23:20 +0000505def CVTPS2PIrr : PSI<0x2D, MRMSrcReg, (ops VR64:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000506 "cvtps2pi {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000507def CVTPS2PIrm : PSI<0x2D, MRMSrcMem, (ops VR64:$dst, f64mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000508 "cvtps2pi {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000509def CVTPD2PIrr : PDI<0x2D, MRMSrcReg, (ops VR64:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000510 "cvtpd2pi {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000511def CVTPD2PIrm : PDI<0x2D, MRMSrcMem, (ops VR64:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000512 "cvtpd2pi {$src, $dst|$dst, $src}", []>;
513
Evan Cheng2246f842006-03-18 01:23:20 +0000514def CVTPS2DQrr : PDI<0x5B, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000515 "cvtps2dq {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000516def CVTPS2DQrm : PDI<0x5B, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000517 "cvtps2dq {$src, $dst|$dst, $src}", []>;
518// SSE2 packed instructions with XD prefix
Evan Cheng2246f842006-03-18 01:23:20 +0000519def CVTPD2DQrr : SDI<0xE6, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000520 "cvtpd2dq {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000521def CVTPD2DQrm : SDI<0xE6, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000522 "cvtpd2dq {$src, $dst|$dst, $src}", []>;
523
524// SSE2 instructions without OpSize prefix
Evan Cheng2246f842006-03-18 01:23:20 +0000525def CVTPS2PDrr : I<0x5A, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000526 "cvtps2pd {$src, $dst|$dst, $src}", []>, TB,
527 Requires<[HasSSE2]>;
Evan Cheng2246f842006-03-18 01:23:20 +0000528def CVTPS2PDrm : I<0x5A, MRMSrcReg, (ops VR128:$dst, f64mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000529 "cvtps2pd {$src, $dst|$dst, $src}", []>, TB,
530 Requires<[HasSSE2]>;
531
Evan Cheng2246f842006-03-18 01:23:20 +0000532def CVTPD2PSrr : PDI<0x5A, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000533 "cvtpd2ps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000534def CVTPD2PSrm : PDI<0x5A, MRMSrcReg, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000535 "cvtpd2ps {$src, $dst|$dst, $src}", []>;
536
537// Arithmetic
538let isTwoAddress = 1 in {
539let isCommutable = 1 in {
Evan Cheng2246f842006-03-18 01:23:20 +0000540def ADDPSrr : PSI<0x58, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000541 "addps {$src2, $dst|$dst, $src2}",
Evan Cheng2246f842006-03-18 01:23:20 +0000542 [(set VR128:$dst, (v4f32 (fadd VR128:$src1, VR128:$src2)))]>;
543def ADDPDrr : PDI<0x58, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000544 "addpd {$src2, $dst|$dst, $src2}",
Evan Cheng2246f842006-03-18 01:23:20 +0000545 [(set VR128:$dst, (v2f64 (fadd VR128:$src1, VR128:$src2)))]>;
546def MULPSrr : PSI<0x59, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000547 "mulps {$src2, $dst|$dst, $src2}",
Evan Cheng2246f842006-03-18 01:23:20 +0000548 [(set VR128:$dst, (v4f32 (fmul VR128:$src1, VR128:$src2)))]>;
549def MULPDrr : PDI<0x59, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000550 "mulpd {$src2, $dst|$dst, $src2}",
Evan Cheng2246f842006-03-18 01:23:20 +0000551 [(set VR128:$dst, (v2f64 (fmul VR128:$src1, VR128:$src2)))]>;
Evan Cheng470a6ad2006-02-22 02:26:30 +0000552}
553
Evan Cheng2246f842006-03-18 01:23:20 +0000554def ADDPSrm : PSI<0x58, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000555 "addps {$src2, $dst|$dst, $src2}",
Evan Cheng2246f842006-03-18 01:23:20 +0000556 [(set VR128:$dst, (v4f32 (fadd VR128:$src1,
557 (load addr:$src2))))]>;
558def ADDPDrm : PDI<0x58, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000559 "addpd {$src2, $dst|$dst, $src2}",
Evan Cheng2246f842006-03-18 01:23:20 +0000560 [(set VR128:$dst, (v2f64 (fadd VR128:$src1,
561 (load addr:$src2))))]>;
562def MULPSrm : PSI<0x59, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000563 "mulps {$src2, $dst|$dst, $src2}",
Evan Cheng2246f842006-03-18 01:23:20 +0000564 [(set VR128:$dst, (v4f32 (fmul VR128:$src1,
565 (load addr:$src2))))]>;
566def MULPDrm : PDI<0x59, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000567 "mulpd {$src2, $dst|$dst, $src2}",
Evan Cheng2246f842006-03-18 01:23:20 +0000568 [(set VR128:$dst, (v2f64 (fmul VR128:$src1,
569 (load addr:$src2))))]>;
Evan Cheng470a6ad2006-02-22 02:26:30 +0000570
Evan Cheng2246f842006-03-18 01:23:20 +0000571def DIVPSrr : PSI<0x5E, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
572 "divps {$src2, $dst|$dst, $src2}",
573 [(set VR128:$dst, (v4f32 (fdiv VR128:$src1, VR128:$src2)))]>;
574def DIVPSrm : PSI<0x5E, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
575 "divps {$src2, $dst|$dst, $src2}",
576 [(set VR128:$dst, (v4f32 (fdiv VR128:$src1,
577 (load addr:$src2))))]>;
578def DIVPDrr : PDI<0x5E, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000579 "divpd {$src2, $dst|$dst, $src2}",
Evan Cheng2246f842006-03-18 01:23:20 +0000580 [(set VR128:$dst, (v2f64 (fdiv VR128:$src1, VR128:$src2)))]>;
581def DIVPDrm : PDI<0x5E, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000582 "divpd {$src2, $dst|$dst, $src2}",
Evan Cheng2246f842006-03-18 01:23:20 +0000583 [(set VR128:$dst, (v2f64 (fdiv VR128:$src1,
584 (load addr:$src2))))]>;
Evan Cheng470a6ad2006-02-22 02:26:30 +0000585
Evan Cheng2246f842006-03-18 01:23:20 +0000586def SUBPSrr : PSI<0x5C, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
587 "subps {$src2, $dst|$dst, $src2}",
588 [(set VR128:$dst, (v4f32 (fsub VR128:$src1, VR128:$src2)))]>;
589def SUBPSrm : PSI<0x5C, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
590 "subps {$src2, $dst|$dst, $src2}",
591 [(set VR128:$dst, (v4f32 (fsub VR128:$src1,
592 (load addr:$src2))))]>;
593def SUBPDrr : PDI<0x5C, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
594 "subpd {$src2, $dst|$dst, $src2}",
Evan Cheng2c0dbd02006-03-24 02:58:06 +0000595 [(set VR128:$dst, (v2f64 (fsub VR128:$src1, VR128:$src2)))]>;
Evan Cheng2246f842006-03-18 01:23:20 +0000596def SUBPDrm : PDI<0x5C, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
597 "subpd {$src2, $dst|$dst, $src2}",
Evan Cheng2c0dbd02006-03-24 02:58:06 +0000598 [(set VR128:$dst, (v2f64 (fsub VR128:$src1,
599 (load addr:$src2))))]>;
Evan Cheng470a6ad2006-02-22 02:26:30 +0000600}
601
Evan Cheng2246f842006-03-18 01:23:20 +0000602def SQRTPSrr : PSI<0x51, MRMSrcReg, (ops VR128:$dst, VR128:$src),
603 "sqrtps {$src, $dst|$dst, $src}",
604 [(set VR128:$dst, (v4f32 (fsqrt VR128:$src)))]>;
605def SQRTPSrm : PSI<0x51, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
606 "sqrtps {$src, $dst|$dst, $src}",
607 [(set VR128:$dst, (v4f32 (fsqrt (load addr:$src))))]>;
608def SQRTPDrr : PDI<0x51, MRMSrcReg, (ops VR128:$dst, VR128:$src),
609 "sqrtpd {$src, $dst|$dst, $src}",
610 [(set VR128:$dst, (v2f64 (fsqrt VR128:$src)))]>;
611def SQRTPDrm : PDI<0x51, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
612 "sqrtpd {$src, $dst|$dst, $src}",
613 [(set VR128:$dst, (v2f64 (fsqrt (load addr:$src))))]>;
Evan Cheng470a6ad2006-02-22 02:26:30 +0000614
Evan Cheng2246f842006-03-18 01:23:20 +0000615def RSQRTPSrr : PSI<0x52, MRMSrcReg, (ops VR128:$dst, VR128:$src),
616 "rsqrtps {$src, $dst|$dst, $src}", []>;
617def RSQRTPSrm : PSI<0x52, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
618 "rsqrtps {$src, $dst|$dst, $src}", []>;
619def RCPPSrr : PSI<0x53, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000620 "rcpps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000621def RCPPSrm : PSI<0x53, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000622 "rcpps {$src, $dst|$dst, $src}", []>;
623
Evan Cheng2246f842006-03-18 01:23:20 +0000624def MAXPSrr : PSI<0x5F, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000625 "maxps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000626def MAXPSrm : PSI<0x5F, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000627 "maxps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000628def MAXPDrr : PDI<0x5F, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000629 "maxpd {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000630def MAXPDrm : PDI<0x5F, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000631 "maxpd {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000632def MINPSrr : PSI<0x5D, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000633 "minps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000634def MINPSrm : PSI<0x5D, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000635 "minps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000636def MINPDrr : PDI<0x5D, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000637 "minpd {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000638def MINPDrm : PDI<0x5D, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000639 "minpd {$src, $dst|$dst, $src}", []>;
Evan Chengffcb95b2006-02-21 19:13:53 +0000640
641// Logical
642let isTwoAddress = 1 in {
643let isCommutable = 1 in {
Evan Cheng2246f842006-03-18 01:23:20 +0000644def ANDPSrr : PSI<0x54, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
645 "andps {$src2, $dst|$dst, $src2}",
646 [(set VR128:$dst, (v4i32 (and VR128:$src1, VR128:$src2)))]>;
647def ANDPDrr : PDI<0x54, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
Evan Chengffcb95b2006-02-21 19:13:53 +0000648 "andpd {$src2, $dst|$dst, $src2}",
Evan Cheng2246f842006-03-18 01:23:20 +0000649 [(set VR128:$dst, (v2i64 (and VR128:$src1, VR128:$src2)))]>;
650def ORPSrr : PSI<0x56, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
651 "orps {$src2, $dst|$dst, $src2}",
652 [(set VR128:$dst, (v4i32 (or VR128:$src1, VR128:$src2)))]>;
653def ORPDrr : PDI<0x56, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
654 "orpd {$src2, $dst|$dst, $src2}",
655 [(set VR128:$dst, (v2i64 (or VR128:$src1, VR128:$src2)))]>;
656def XORPSrr : PSI<0x57, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
657 "xorps {$src2, $dst|$dst, $src2}",
658 [(set VR128:$dst, (v4i32 (xor VR128:$src1, VR128:$src2)))]>;
659def XORPDrr : PDI<0x57, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
660 "xorpd {$src2, $dst|$dst, $src2}",
661 [(set VR128:$dst, (v2i64 (xor VR128:$src1, VR128:$src2)))]>;
Evan Chengffcb95b2006-02-21 19:13:53 +0000662}
Evan Cheng2246f842006-03-18 01:23:20 +0000663def ANDPSrm : PSI<0x54, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
664 "andps {$src2, $dst|$dst, $src2}",
665 [(set VR128:$dst, (v4i32 (and VR128:$src1,
666 (load addr:$src2))))]>;
667def ANDPDrm : PDI<0x54, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
668 "andpd {$src2, $dst|$dst, $src2}",
669 [(set VR128:$dst, (v2i64 (and VR128:$src1,
670 (load addr:$src2))))]>;
671def ORPSrm : PSI<0x56, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
672 "orps {$src2, $dst|$dst, $src2}",
673 [(set VR128:$dst, (v4i32 (or VR128:$src1,
674 (load addr:$src2))))]>;
675def ORPDrm : PDI<0x56, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
676 "orpd {$src2, $dst|$dst, $src2}",
677 [(set VR128:$dst, (v2i64 (or VR128:$src1,
678 (load addr:$src2))))]>;
679def XORPSrm : PSI<0x57, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
680 "xorps {$src2, $dst|$dst, $src2}",
681 [(set VR128:$dst, (v4i32 (xor VR128:$src1,
682 (load addr:$src2))))]>;
683def XORPDrm : PDI<0x57, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
684 "xorpd {$src2, $dst|$dst, $src2}",
685 [(set VR128:$dst, (v2i64 (xor VR128:$src1,
686 (load addr:$src2))))]>;
687def ANDNPSrr : PSI<0x55, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
688 "andnps {$src2, $dst|$dst, $src2}",
689 [(set VR128:$dst, (v4i32 (and (not VR128:$src1),
690 VR128:$src2)))]>;
691def ANDNPSrm : PSI<0x55, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
692 "andnps {$src2, $dst|$dst, $src2}",
693 [(set VR128:$dst, (v4i32 (and (not VR128:$src1),
694 (load addr:$src2))))]>;
695def ANDNPDrr : PDI<0x55, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
696 "andnpd {$src2, $dst|$dst, $src2}",
697 [(set VR128:$dst, (v2i64 (and (not VR128:$src1),
698 VR128:$src2)))]>;
699
700def ANDNPDrm : PDI<0x55, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
701 "andnpd {$src2, $dst|$dst, $src2}",
702 [(set VR128:$dst, (v2i64 (and VR128:$src1,
703 (load addr:$src2))))]>;
Evan Chengffcb95b2006-02-21 19:13:53 +0000704}
Evan Chengbf156d12006-02-21 19:26:52 +0000705
Evan Cheng470a6ad2006-02-22 02:26:30 +0000706let isTwoAddress = 1 in {
707def CMPPSrr : PSI<0xC2, MRMSrcReg,
Evan Cheng2246f842006-03-18 01:23:20 +0000708 (ops VR128:$dst, VR128:$src1, VR128:$src, SSECC:$cc),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000709 "cmp${cc}ps {$src, $dst|$dst, $src}", []>;
710def CMPPSrm : PSI<0xC2, MRMSrcMem,
Evan Cheng2246f842006-03-18 01:23:20 +0000711 (ops VR128:$dst, VR128:$src1, f128mem:$src, SSECC:$cc),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000712 "cmp${cc}ps {$src, $dst|$dst, $src}", []>;
713def CMPPDrr : PDI<0xC2, MRMSrcReg,
Evan Cheng2246f842006-03-18 01:23:20 +0000714 (ops VR128:$dst, VR128:$src1, VR128:$src, SSECC:$cc),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000715 "cmp${cc}pd {$src, $dst|$dst, $src}", []>;
716def CMPPDrm : PDI<0xC2, MRMSrcMem,
Evan Cheng2246f842006-03-18 01:23:20 +0000717 (ops VR128:$dst, VR128:$src1, f128mem:$src, SSECC:$cc),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000718 "cmp${cc}pd {$src, $dst|$dst, $src}", []>;
719}
720
721// Shuffle and unpack instructions
Evan Cheng2da953f2006-03-22 07:10:28 +0000722def PSHUFWrr : PSIi8<0x70, MRMDestReg,
723 (ops VR64:$dst, VR64:$src1, i8imm:$src2),
724 "pshufw {$src2, $src1, $dst|$dst, $src1, $src2}", []>;
725def PSHUFWrm : PSIi8<0x70, MRMSrcMem,
726 (ops VR64:$dst, i64mem:$src1, i8imm:$src2),
727 "pshufw {$src2, $src1, $dst|$dst, $src1, $src2}", []>;
728def PSHUFDrr : PDIi8<0x70, MRMDestReg,
729 (ops VR128:$dst, VR128:$src1, i8imm:$src2),
Evan Cheng0188ecb2006-03-22 18:59:22 +0000730 "pshufd {$src2, $src1, $dst|$dst, $src1, $src2}", []>;
Evan Cheng2da953f2006-03-22 07:10:28 +0000731def PSHUFDrm : PDIi8<0x70, MRMSrcMem,
732 (ops VR128:$dst, i128mem:$src1, i8imm:$src2),
733 "pshufd {$src2, $src1, $dst|$dst, $src1, $src2}", []>;
Evan Chengb9df0ca2006-03-22 02:53:00 +0000734
Evan Cheng0cea6d22006-03-22 20:08:18 +0000735let isTwoAddress = 1 in {
Evan Cheng2da953f2006-03-22 07:10:28 +0000736def SHUFPSrr : PSIi8<0xC6, MRMSrcReg,
737 (ops VR128:$dst, VR128:$src1, VR128:$src2, i8imm:$src3),
Evan Cheng14aed5e2006-03-24 01:18:28 +0000738 "shufps {$src3, $src2, $dst|$dst, $src2, $src3}",
739 [(set VR128:$dst, (vector_shuffle
740 (v4f32 VR128:$src1), (v4f32 VR128:$src2),
741 SHUFP_shuffle_mask:$src3))]>;
Evan Cheng2da953f2006-03-22 07:10:28 +0000742def SHUFPSrm : PSIi8<0xC6, MRMSrcMem,
743 (ops VR128:$dst, VR128:$src1, f128mem:$src2, i8imm:$src3),
744 "shufps {$src3, $src2, $dst|$dst, $src2, $src3}", []>;
745def SHUFPDrr : PDIi8<0xC6, MRMSrcReg,
746 (ops VR128:$dst, VR128:$src1, VR128:$src2, i8imm:$src3),
Evan Cheng14aed5e2006-03-24 01:18:28 +0000747 "shufpd {$src3, $src2, $dst|$dst, $src2, $src3}",
748 [(set VR128:$dst, (vector_shuffle
749 (v2f64 VR128:$src1), (v2f64 VR128:$src2),
750 SHUFP_shuffle_mask:$src3))]>;
Evan Cheng2da953f2006-03-22 07:10:28 +0000751def SHUFPDrm : PDIi8<0xC6, MRMSrcMem,
752 (ops VR128:$dst, VR128:$src1, f128mem:$src2, i8imm:$src3),
753 "shufpd {$src3, $src2, $dst|$dst, $src2, $src3}", []>;
Evan Cheng470a6ad2006-02-22 02:26:30 +0000754
755def UNPCKHPSrr : PSI<0x15, MRMSrcReg,
Evan Cheng2246f842006-03-18 01:23:20 +0000756 (ops VR128:$dst, VR128:$src1, VR128:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000757 "unpckhps {$src2, $dst|$dst, $src2}", []>;
758def UNPCKHPSrm : PSI<0x15, MRMSrcMem,
Evan Cheng2246f842006-03-18 01:23:20 +0000759 (ops VR128:$dst, VR128:$src1, f128mem:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000760 "unpckhps {$src2, $dst|$dst, $src2}", []>;
761def UNPCKHPDrr : PDI<0x15, MRMSrcReg,
Evan Cheng2246f842006-03-18 01:23:20 +0000762 (ops VR128:$dst, VR128:$src1, VR128:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000763 "unpckhpd {$src2, $dst|$dst, $src2}", []>;
764def UNPCKHPDrm : PDI<0x15, MRMSrcMem,
Evan Cheng2246f842006-03-18 01:23:20 +0000765 (ops VR128:$dst, VR128:$src1, f128mem:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000766 "unpckhpd {$src2, $dst|$dst, $src2}", []>;
767def UNPCKLPSrr : PSI<0x14, MRMSrcReg,
Evan Cheng2246f842006-03-18 01:23:20 +0000768 (ops VR128:$dst, VR128:$src1, VR128:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000769 "unpcklps {$src2, $dst|$dst, $src2}", []>;
770def UNPCKLPSrm : PSI<0x14, MRMSrcMem,
Evan Cheng2246f842006-03-18 01:23:20 +0000771 (ops VR128:$dst, VR128:$src1, f128mem:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000772 "unpcklps {$src2, $dst|$dst, $src2}", []>;
773def UNPCKLPDrr : PDI<0x14, MRMSrcReg,
Evan Cheng2246f842006-03-18 01:23:20 +0000774 (ops VR128:$dst, VR128:$src1, VR128:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000775 "unpcklpd {$src2, $dst|$dst, $src2}", []>;
776def UNPCKLPDrm : PDI<0x14, MRMSrcMem,
Evan Cheng2246f842006-03-18 01:23:20 +0000777 (ops VR128:$dst, VR128:$src1, f128mem:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000778 "unpcklpd {$src2, $dst|$dst, $src2}", []>;
Evan Cheng2c0dbd02006-03-24 02:58:06 +0000779}
Evan Cheng470a6ad2006-02-22 02:26:30 +0000780
Evan Chengbf156d12006-02-21 19:26:52 +0000781//===----------------------------------------------------------------------===//
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000782// SSE integer instructions
Evan Chengbf156d12006-02-21 19:26:52 +0000783//===----------------------------------------------------------------------===//
784
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000785// Move Instructions
Evan Cheng470a6ad2006-02-22 02:26:30 +0000786def MOVD128rr : PDI<0x6E, MRMSrcReg, (ops VR128:$dst, R32:$src),
Evan Cheng24dc1f52006-03-23 07:44:07 +0000787 "movd {$src, $dst|$dst, $src}",
Evan Cheng48090aa2006-03-21 23:01:21 +0000788 [(set VR128:$dst,
789 (v4i32 (scalar_to_vector R32:$src)))]>;
Evan Cheng470a6ad2006-02-22 02:26:30 +0000790def MOVD128rm : PDI<0x6E, MRMSrcMem, (ops VR128:$dst, i32mem:$src),
791 "movd {$src, $dst|$dst, $src}", []>;
792def MOVD128mr : PDI<0x7E, MRMDestMem, (ops i32mem:$dst, VR128:$src),
793 "movd {$src, $dst|$dst, $src}", []>;
Evan Chengbf156d12006-02-21 19:26:52 +0000794
Evan Cheng24dc1f52006-03-23 07:44:07 +0000795def MOVDQArr : PDI<0x6F, MRMSrcReg, (ops VR128:$dst, VR128:$src),
796 "movdqa {$src, $dst|$dst, $src}", []>;
797def MOVDQArm : PDI<0x6F, MRMSrcMem, (ops VR128:$dst, i128mem:$src),
798 "movdqa {$src, $dst|$dst, $src}",
799 [(set VR128:$dst, (loadv4i32 addr:$src))]>;
800def MOVDQAmr : PDI<0x7F, MRMDestMem, (ops i128mem:$dst, VR128:$src),
801 "movdqa {$src, $dst|$dst, $src}",
802 [(store (v4i32 VR128:$src), addr:$dst)]>;
803
Evan Cheng470a6ad2006-02-22 02:26:30 +0000804// SSE2 instructions with XS prefix
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000805def MOVQ128rr : I<0x7E, MRMSrcReg, (ops VR128:$dst, VR64:$src),
Evan Cheng48090aa2006-03-21 23:01:21 +0000806 "movq {$src, $dst|$dst, $src}",
807 [(set VR128:$dst,
808 (v2i64 (scalar_to_vector VR64:$src)))]>, XS,
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000809 Requires<[HasSSE2]>;
810def MOVQ128rm : I<0x7E, MRMSrcMem, (ops VR128:$dst, i64mem:$src),
Evan Cheng48090aa2006-03-21 23:01:21 +0000811 "movq {$src, $dst|$dst, $src}", []>, XS;
Evan Cheng470a6ad2006-02-22 02:26:30 +0000812
813def MOVQ128mr : PDI<0xD6, MRMSrcMem, (ops i64mem:$dst, VR128:$src),
814 "movq {$src, $dst|$dst, $src}", []>;
Evan Cheng82521dd2006-03-21 07:09:35 +0000815
Evan Chenga971f6f2006-03-23 01:57:24 +0000816// 128-bit Integer Arithmetic
817let isTwoAddress = 1 in {
818let isCommutable = 1 in {
819def PADDBrr : PDI<0xFC, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
820 "paddb {$src2, $dst|$dst, $src2}",
821 [(set VR128:$dst, (v16i8 (add VR128:$src1, VR128:$src2)))]>;
822def PADDWrr : PDI<0xFD, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
823 "paddw {$src2, $dst|$dst, $src2}",
824 [(set VR128:$dst, (v8i16 (add VR128:$src1, VR128:$src2)))]>;
825def PADDDrr : PDI<0xFE, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
826 "paddd {$src2, $dst|$dst, $src2}",
827 [(set VR128:$dst, (v4i32 (add VR128:$src1, VR128:$src2)))]>;
828}
829def PADDBrm : PDI<0xFC, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
830 "paddb {$src2, $dst|$dst, $src2}",
831 [(set VR128:$dst, (v16i8 (add VR128:$src1,
832 (load addr:$src2))))]>;
833def PADDWrm : PDI<0xFD, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
834 "paddw {$src2, $dst|$dst, $src2}",
835 [(set VR128:$dst, (v8i16 (add VR128:$src1,
836 (load addr:$src2))))]>;
837def PADDDrm : PDI<0xFE, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
838 "paddd {$src2, $dst|$dst, $src2}",
839 [(set VR128:$dst, (v4i32 (add VR128:$src1,
840 (load addr:$src2))))]>;
841}
Evan Cheng82521dd2006-03-21 07:09:35 +0000842
843//===----------------------------------------------------------------------===//
844// Alias Instructions
845//===----------------------------------------------------------------------===//
846
Evan Cheng386031a2006-03-24 07:29:27 +0000847// Alias instructions that map zero vector to xorp* for sse.
848// FIXME: remove when we can teach regalloc that xor reg, reg is ok.
849def VZEROv16i8 : I<0xEF, MRMInitReg, (ops VR128:$dst),
850 "pxor $dst, $dst", [(set VR128:$dst, (v16i8 vecimm0))]>,
851 Requires<[HasSSE2]>, TB, OpSize;
852def VZEROv8i16 : I<0xEF, MRMInitReg, (ops VR128:$dst),
853 "pxor $dst, $dst", [(set VR128:$dst, (v8i16 vecimm0))]>,
854 Requires<[HasSSE2]>, TB, OpSize;
855def VZEROv4i32 : I<0xEF, MRMInitReg, (ops VR128:$dst),
856 "pxor $dst, $dst", [(set VR128:$dst, (v4i32 vecimm0))]>,
857 Requires<[HasSSE2]>, TB, OpSize;
858def VZEROv2i64 : I<0xEF, MRMInitReg, (ops VR128:$dst),
859 "pxor $dst, $dst", [(set VR128:$dst, (v2i64 vecimm0))]>,
860 Requires<[HasSSE2]>, TB, OpSize;
861def VZEROv4f32 : PSI<0x57, MRMInitReg, (ops VR128:$dst),
862 "xorps $dst, $dst", [(set VR128:$dst, (v4f32 vecimm0))]>;
863def VZEROv2f64 : PDI<0x57, MRMInitReg, (ops VR128:$dst),
864 "xorpd $dst, $dst", [(set VR128:$dst, (v2f64 vecimm0))]>;
865
Evan Cheng82521dd2006-03-21 07:09:35 +0000866def FR32ToV4F32 : PSI<0x28, MRMSrcReg, (ops VR128:$dst, FR32:$src),
867 "movaps {$src, $dst|$dst, $src}",
868 [(set VR128:$dst,
869 (v4f32 (scalar_to_vector FR32:$src)))]>;
870
871def FR64ToV2F64 : PDI<0x28, MRMSrcReg, (ops VR128:$dst, FR64:$src),
872 "movapd {$src, $dst|$dst, $src}",
873 [(set VR128:$dst,
874 (v2f64 (scalar_to_vector FR64:$src)))]>;
Evan Cheng48090aa2006-03-21 23:01:21 +0000875
876//===----------------------------------------------------------------------===//
877// Non-Instruction Patterns
878//===----------------------------------------------------------------------===//
879
880// 128-bit vector undef's.
881def : Pat<(v2f64 (undef)), (IMPLICIT_DEF_VR128)>, Requires<[HasSSE2]>;
882def : Pat<(v16i8 (undef)), (IMPLICIT_DEF_VR128)>, Requires<[HasSSE2]>;
883def : Pat<(v8i16 (undef)), (IMPLICIT_DEF_VR128)>, Requires<[HasSSE2]>;
884def : Pat<(v4i32 (undef)), (IMPLICIT_DEF_VR128)>, Requires<[HasSSE2]>;
885def : Pat<(v2i64 (undef)), (IMPLICIT_DEF_VR128)>, Requires<[HasSSE2]>;
886
Evan Chenga971f6f2006-03-23 01:57:24 +0000887// Load 128-bit integer vector values.
Evan Cheng24dc1f52006-03-23 07:44:07 +0000888def : Pat<(v16i8 (load addr:$src)), (MOVDQArm addr:$src)>,
889 Requires<[HasSSE2]>;
890def : Pat<(v8i16 (load addr:$src)), (MOVDQArm addr:$src)>,
891 Requires<[HasSSE2]>;
892def : Pat<(v4i32 (load addr:$src)), (MOVDQArm addr:$src)>,
893 Requires<[HasSSE2]>;
894def : Pat<(v2i64 (load addr:$src)), (MOVDQArm addr:$src)>,
Evan Chenga971f6f2006-03-23 01:57:24 +0000895 Requires<[HasSSE2]>;
896
Evan Cheng48090aa2006-03-21 23:01:21 +0000897// Store 128-bit integer vector values.
Evan Cheng24dc1f52006-03-23 07:44:07 +0000898def : Pat<(store (v16i8 VR128:$src), addr:$dst),
899 (MOVDQAmr addr:$dst, VR128:$src)>, Requires<[HasSSE1]>;
900def : Pat<(store (v8i16 VR128:$src), addr:$dst),
901 (MOVDQAmr addr:$dst, VR128:$src)>, Requires<[HasSSE1]>;
902def : Pat<(store (v4i32 VR128:$src), addr:$dst),
903 (MOVDQAmr addr:$dst, VR128:$src)>, Requires<[HasSSE1]>;
904def : Pat<(store (v2i64 VR128:$src), addr:$dst),
905 (MOVDQAmr addr:$dst, VR128:$src)>, Requires<[HasSSE2]>;
Evan Cheng48090aa2006-03-21 23:01:21 +0000906
907// Scalar to v8i16 / v16i8. The source may be a R32, but only the lower 8 or
908// 16-bits matter.
909def : Pat<(v8i16 (X86s2vec R32:$src)), (MOVD128rr R32:$src)>,
910 Requires<[HasSSE2]>;
911def : Pat<(v16i8 (X86s2vec R32:$src)), (MOVD128rr R32:$src)>,
912 Requires<[HasSSE2]>;
913
Evan Cheng2c0dbd02006-03-24 02:58:06 +0000914// bit_convert
915def : Pat<(v4i32 (bitconvert (v4f32 VR128:$src))), (v4i32 VR128:$src)>;
916def : Pat<(v4f32 (bitconvert (v4i32 VR128:$src))), (v4f32 VR128:$src)>;
Evan Chengb9df0ca2006-03-22 02:53:00 +0000917
918// Splat v4f32 / v4i32
Evan Cheng63d33002006-03-22 08:01:21 +0000919def : Pat<(vector_shuffle (v4f32 VR128:$src), (undef), SHUFP_splat_mask:$sm),
Evan Cheng1bffadd2006-03-22 19:16:21 +0000920 (v4f32 (SHUFPSrr VR128:$src, VR128:$src, SHUFP_splat_mask:$sm))>,
921 Requires<[HasSSE1]>;
Evan Cheng63d33002006-03-22 08:01:21 +0000922def : Pat<(vector_shuffle (v4i32 VR128:$src), (undef), SHUFP_splat_mask:$sm),
Evan Cheng1bffadd2006-03-22 19:16:21 +0000923 (v4i32 (SHUFPSrr VR128:$src, VR128:$src, SHUFP_splat_mask:$sm))>,
924 Requires<[HasSSE1]>;
Evan Chengb9df0ca2006-03-22 02:53:00 +0000925
926// Splat v2f64 / v2i64
Evan Cheng1bffadd2006-03-22 19:16:21 +0000927def : Pat<(vector_shuffle (v2f64 VR128:$src), (undef), MOVLHPS_splat_mask:$sm),
Evan Cheng14aed5e2006-03-24 01:18:28 +0000928 (v2f64 (MOVLHPSrr VR128:$src, VR128:$src))>, Requires<[HasSSE1]>;
Evan Cheng1bffadd2006-03-22 19:16:21 +0000929def : Pat<(vector_shuffle (v2i64 VR128:$src), (undef), MOVLHPS_splat_mask:$sm),
Evan Cheng14aed5e2006-03-24 01:18:28 +0000930 (v2i64 (MOVLHPSrr VR128:$src, VR128:$src))>, Requires<[HasSSE1]>;
Evan Cheng63d33002006-03-22 08:01:21 +0000931
Evan Cheng0188ecb2006-03-22 18:59:22 +0000932// Shuffle v4f32 / v4i32, undef. These should only match if splat cases do not.
933def : Pat<(vector_shuffle (v4f32 VR128:$src), (undef), PSHUFD_shuffle_mask:$sm),
Evan Cheng1bffadd2006-03-22 19:16:21 +0000934 (v4f32 (PSHUFDrr VR128:$src, PSHUFD_shuffle_mask:$sm))>,
935 Requires<[HasSSE2]>;
Evan Cheng0188ecb2006-03-22 18:59:22 +0000936def : Pat<(vector_shuffle (v4i32 VR128:$src), (undef), PSHUFD_shuffle_mask:$sm),
Evan Cheng1bffadd2006-03-22 19:16:21 +0000937 (v4i32 (PSHUFDrr VR128:$src, PSHUFD_shuffle_mask:$sm))>,
938 Requires<[HasSSE2]>;
Evan Cheng3b047f72006-03-23 02:36:37 +0000939
Evan Cheng2c0dbd02006-03-24 02:58:06 +0000940// Shuffle v2f64 / v2i64
941def : Pat<(vector_shuffle (v2f64 VR128:$src1), (v2f64 VR128:$src2),
942 MOVLHPSorUNPCKLPD_shuffle_mask:$sm),
943 (v2f64 (MOVLHPSrr VR128:$src1, VR128:$src2))>, Requires<[HasSSE1]>;
944def : Pat<(vector_shuffle (v2f64 VR128:$src1), (v2f64 VR128:$src2),
945 MOVHLPS_shuffle_mask:$sm),
946 (v2f64 (MOVHLPSrr VR128:$src1, VR128:$src2))>, Requires<[HasSSE1]>;
947def : Pat<(vector_shuffle (v2f64 VR128:$src1), (v2f64 VR128:$src2),
948 UNPCKHPD_shuffle_mask:$sm),
949 (v2f64 (UNPCKHPDrr VR128:$src1, VR128:$src2))>, Requires<[HasSSE2]>;
950def : Pat<(vector_shuffle (v2f64 VR128:$src1), (loadv2f64 addr:$src2),
951 MOVLHPSorUNPCKLPD_shuffle_mask:$sm),
952 (v2f64 (UNPCKLPDrm VR128:$src1, addr:$src2))>, Requires<[HasSSE2]>;
953
954def : Pat<(vector_shuffle (v2i64 VR128:$src1), (v2i64 VR128:$src2),
955 MOVLHPSorUNPCKLPD_shuffle_mask:$sm),
956 (v2i64 (MOVLHPSrr VR128:$src1, VR128:$src2))>, Requires<[HasSSE1]>;
957def : Pat<(vector_shuffle (v2i64 VR128:$src1), (v2i64 VR128:$src2),
958 MOVHLPS_shuffle_mask:$sm),
959 (v2i64 (MOVHLPSrr VR128:$src1, VR128:$src2))>, Requires<[HasSSE1]>;
960def : Pat<(vector_shuffle (v2i64 VR128:$src1), (v2i64 VR128:$src2),
961 UNPCKHPD_shuffle_mask:$sm),
962 (v2i64 (UNPCKHPDrr VR128:$src1, VR128:$src2))>, Requires<[HasSSE2]>;
963def : Pat<(vector_shuffle (v2i64 VR128:$src1), (loadv2i64 addr:$src2),
964 MOVLHPSorUNPCKLPD_shuffle_mask:$sm),
965 (v2i64 (UNPCKLPDrm VR128:$src1, addr:$src2))>, Requires<[HasSSE2]>;