blob: b7f4b20bd7787de1ea43cded818e8a9c28cd8e6b [file] [log] [blame]
Evan Chengffcb95b2006-02-21 19:13:53 +00001//====- X86InstrSSE.td - Describe the X86 Instruction Set -------*- C++ -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file was developed by the Evan Cheng and is distributed under
6// the University of Illinois Open Source License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This file describes the X86 SSE instruction set, defining the instructions,
11// and properties of the instructions which are needed for code generation,
12// machine code emission, and analysis.
13//
14//===----------------------------------------------------------------------===//
15
Evan Cheng4e4c71e2006-02-21 20:00:20 +000016//===----------------------------------------------------------------------===//
Evan Cheng2246f842006-03-18 01:23:20 +000017// SSE specific DAG Nodes.
18//===----------------------------------------------------------------------===//
19
Evan Chengb9df0ca2006-03-22 02:53:00 +000020def X86loadp : SDNode<"X86ISD::LOAD_PACK", SDTLoad,
21 [SDNPHasChain]>;
22def X86fand : SDNode<"X86ISD::FAND", SDTFPBinOp,
23 [SDNPCommutative, SDNPAssociative]>;
24def X86fxor : SDNode<"X86ISD::FXOR", SDTFPBinOp,
25 [SDNPCommutative, SDNPAssociative]>;
Evan Chengbc4832b2006-03-24 23:15:12 +000026def X86s2vec : SDNode<"X86ISD::S2VEC",
Evan Chengb9df0ca2006-03-22 02:53:00 +000027 SDTypeProfile<1, 1, []>, []>;
Evan Chengbc4832b2006-03-24 23:15:12 +000028def X86zexts2vec : SDNode<"X86ISD::ZEXT_S2VEC",
29 SDTypeProfile<1, 1, []>, []>;
Evan Cheng2246f842006-03-18 01:23:20 +000030
Evan Chengc60bd972006-03-25 09:37:23 +000031def SDTUnpckl : SDTypeProfile<1, 2,
32 [SDTCisSameAs<0, 1>, SDTCisSameAs<1, 2>]>;
33def X86unpckl : SDNode<"X86ISD::UNPCKL", SDTUnpckl,
34 []>;
35
Evan Cheng2246f842006-03-18 01:23:20 +000036//===----------------------------------------------------------------------===//
Evan Cheng06a8aa12006-03-17 19:55:52 +000037// SSE pattern fragments
38//===----------------------------------------------------------------------===//
39
40def X86loadpf32 : PatFrag<(ops node:$ptr), (f32 (X86loadp node:$ptr))>;
41def X86loadpf64 : PatFrag<(ops node:$ptr), (f64 (X86loadp node:$ptr))>;
42
Evan Cheng2246f842006-03-18 01:23:20 +000043def loadv4f32 : PatFrag<(ops node:$ptr), (v4f32 (load node:$ptr))>;
44def loadv2f64 : PatFrag<(ops node:$ptr), (v2f64 (load node:$ptr))>;
Evan Cheng24dc1f52006-03-23 07:44:07 +000045def loadv16i8 : PatFrag<(ops node:$ptr), (v16i8 (load node:$ptr))>;
46def loadv8i16 : PatFrag<(ops node:$ptr), (v8i16 (load node:$ptr))>;
47def loadv4i32 : PatFrag<(ops node:$ptr), (v4i32 (load node:$ptr))>;
48def loadv2i64 : PatFrag<(ops node:$ptr), (v2i64 (load node:$ptr))>;
Evan Cheng06a8aa12006-03-17 19:55:52 +000049
Evan Cheng386031a2006-03-24 07:29:27 +000050def fp32imm0 : PatLeaf<(f32 fpimm), [{
51 return N->isExactlyValue(+0.0);
52}]>;
53
Evan Cheng63d33002006-03-22 08:01:21 +000054// SHUFFLE_get_shuf_imm xform function: convert vector_shuffle mask to PSHUF*,
55// SHUFP* etc. imm.
56def SHUFFLE_get_shuf_imm : SDNodeXForm<build_vector, [{
57 return getI8Imm(X86::getShuffleSHUFImmediate(N));
Evan Chengb9df0ca2006-03-22 02:53:00 +000058}]>;
59
Evan Cheng63d33002006-03-22 08:01:21 +000060def SHUFP_splat_mask : PatLeaf<(build_vector), [{
61 return X86::isSplatMask(N);
62}], SHUFFLE_get_shuf_imm>;
63
Evan Cheng1bffadd2006-03-22 19:16:21 +000064def MOVLHPS_splat_mask : PatLeaf<(build_vector), [{
Evan Cheng0188ecb2006-03-22 18:59:22 +000065 return X86::isSplatMask(N);
66}]>;
67
Evan Cheng2c0dbd02006-03-24 02:58:06 +000068def MOVLHPSorUNPCKLPD_shuffle_mask : PatLeaf<(build_vector), [{
69 return X86::isMOVLHPSorUNPCKLPDMask(N);
70}], SHUFFLE_get_shuf_imm>;
71
72def MOVHLPS_shuffle_mask : PatLeaf<(build_vector), [{
73 return X86::isMOVHLPSMask(N);
74}], SHUFFLE_get_shuf_imm>;
75
76def UNPCKHPD_shuffle_mask : PatLeaf<(build_vector), [{
77 return X86::isUNPCKHPDMask(N);
78}], SHUFFLE_get_shuf_imm>;
79
Evan Cheng0188ecb2006-03-22 18:59:22 +000080// Only use PSHUF if it is not a splat.
81def PSHUFD_shuffle_mask : PatLeaf<(build_vector), [{
82 return !X86::isSplatMask(N) && X86::isPSHUFDMask(N);
Evan Cheng14aed5e2006-03-24 01:18:28 +000083}], SHUFFLE_get_shuf_imm>;
Evan Cheng0188ecb2006-03-22 18:59:22 +000084
Evan Cheng14aed5e2006-03-24 01:18:28 +000085def SHUFP_shuffle_mask : PatLeaf<(build_vector), [{
86 return X86::isSHUFPMask(N);
87}], SHUFFLE_get_shuf_imm>;
Evan Chengb9df0ca2006-03-22 02:53:00 +000088
Evan Cheng06a8aa12006-03-17 19:55:52 +000089//===----------------------------------------------------------------------===//
Evan Cheng4e4c71e2006-02-21 20:00:20 +000090// SSE scalar FP Instructions
91//===----------------------------------------------------------------------===//
92
Evan Cheng470a6ad2006-02-22 02:26:30 +000093// Instruction templates
94// SSI - SSE1 instructions with XS prefix.
95// SDI - SSE2 instructions with XD prefix.
96// PSI - SSE1 instructions with TB prefix.
97// PDI - SSE2 instructions with TB and OpSize prefixes.
Evan Cheng2da953f2006-03-22 07:10:28 +000098// PSIi8 - SSE1 instructions with ImmT == Imm8 and TB prefix.
99// PDIi8 - SSE2 instructions with ImmT == Imm8 and TB and OpSize prefixes.
Evan Cheng470a6ad2006-02-22 02:26:30 +0000100class SSI<bits<8> o, Format F, dag ops, string asm, list<dag> pattern>
101 : I<o, F, ops, asm, pattern>, XS, Requires<[HasSSE1]>;
102class SDI<bits<8> o, Format F, dag ops, string asm, list<dag> pattern>
103 : I<o, F, ops, asm, pattern>, XD, Requires<[HasSSE2]>;
104class PSI<bits<8> o, Format F, dag ops, string asm, list<dag> pattern>
105 : I<o, F, ops, asm, pattern>, TB, Requires<[HasSSE1]>;
106class PDI<bits<8> o, Format F, dag ops, string asm, list<dag> pattern>
107 : I<o, F, ops, asm, pattern>, TB, OpSize, Requires<[HasSSE2]>;
Evan Cheng2da953f2006-03-22 07:10:28 +0000108class PSIi8<bits<8> o, Format F, dag ops, string asm, list<dag> pattern>
109 : X86Inst<o, F, Imm8, ops, asm>, TB, Requires<[HasSSE1]> {
110 let Pattern = pattern;
111}
112class PDIi8<bits<8> o, Format F, dag ops, string asm, list<dag> pattern>
113 : X86Inst<o, F, Imm8, ops, asm>, TB, OpSize, Requires<[HasSSE2]> {
114 let Pattern = pattern;
115}
Evan Cheng470a6ad2006-02-22 02:26:30 +0000116
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000117// Some 'special' instructions
118def IMPLICIT_DEF_FR32 : I<0, Pseudo, (ops FR32:$dst),
119 "#IMPLICIT_DEF $dst",
120 [(set FR32:$dst, (undef))]>, Requires<[HasSSE2]>;
121def IMPLICIT_DEF_FR64 : I<0, Pseudo, (ops FR64:$dst),
122 "#IMPLICIT_DEF $dst",
123 [(set FR64:$dst, (undef))]>, Requires<[HasSSE2]>;
124
125// CMOV* - Used to implement the SSE SELECT DAG operation. Expanded by the
126// scheduler into a branch sequence.
127let usesCustomDAGSchedInserter = 1 in { // Expanded by the scheduler.
128 def CMOV_FR32 : I<0, Pseudo,
129 (ops FR32:$dst, FR32:$t, FR32:$f, i8imm:$cond),
130 "#CMOV_FR32 PSEUDO!",
131 [(set FR32:$dst, (X86cmov FR32:$t, FR32:$f, imm:$cond))]>;
132 def CMOV_FR64 : I<0, Pseudo,
133 (ops FR64:$dst, FR64:$t, FR64:$f, i8imm:$cond),
134 "#CMOV_FR64 PSEUDO!",
135 [(set FR64:$dst, (X86cmov FR64:$t, FR64:$f, imm:$cond))]>;
136}
137
138// Move Instructions
Evan Cheng470a6ad2006-02-22 02:26:30 +0000139def MOVSSrr : SSI<0x10, MRMSrcReg, (ops FR32:$dst, FR32:$src),
140 "movss {$src, $dst|$dst, $src}", []>;
141def MOVSSrm : SSI<0x10, MRMSrcMem, (ops FR32:$dst, f32mem:$src),
142 "movss {$src, $dst|$dst, $src}",
143 [(set FR32:$dst, (loadf32 addr:$src))]>;
144def MOVSDrr : SDI<0x10, MRMSrcReg, (ops FR64:$dst, FR64:$src),
145 "movsd {$src, $dst|$dst, $src}", []>;
146def MOVSDrm : SDI<0x10, MRMSrcMem, (ops FR64:$dst, f64mem:$src),
147 "movsd {$src, $dst|$dst, $src}",
148 [(set FR64:$dst, (loadf64 addr:$src))]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000149
Evan Cheng470a6ad2006-02-22 02:26:30 +0000150def MOVSSmr : SSI<0x11, MRMDestMem, (ops f32mem:$dst, FR32:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000151 "movss {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000152 [(store FR32:$src, addr:$dst)]>;
153def MOVSDmr : SDI<0x11, MRMDestMem, (ops f64mem:$dst, FR64:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000154 "movsd {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000155 [(store FR64:$src, addr:$dst)]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000156
Evan Chengbc4832b2006-03-24 23:15:12 +0000157// FR32 / FR64 to 128-bit vector conversion.
158def MOVSS128rr : SSI<0x10, MRMSrcReg, (ops VR128:$dst, FR32:$src),
159 "movss {$src, $dst|$dst, $src}",
160 [(set VR128:$dst,
161 (v4f32 (scalar_to_vector FR32:$src)))]>;
162def MOVSS128rm : SSI<0x10, MRMSrcMem, (ops VR128:$dst, f32mem:$src),
163 "movss {$src, $dst|$dst, $src}",
164 [(set VR128:$dst,
165 (v4f32 (scalar_to_vector (loadf32 addr:$src))))]>;
166def MOVSD128rr : SDI<0x10, MRMSrcReg, (ops VR128:$dst, FR64:$src),
167 "movsd {$src, $dst|$dst, $src}",
168 [(set VR128:$dst,
169 (v2f64 (scalar_to_vector FR64:$src)))]>;
170def MOVSD128rm : SDI<0x10, MRMSrcMem, (ops VR128:$dst, f64mem:$src),
171 "movsd {$src, $dst|$dst, $src}",
172 [(set VR128:$dst,
173 (v4f32 (scalar_to_vector (loadf64 addr:$src))))]>;
174
175
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000176// Conversion instructions
Evan Cheng7dda4052006-03-25 01:00:18 +0000177def CVTSS2SIrr: SSI<0x2D, MRMSrcReg, (ops R32:$dst, FR32:$src),
178 "cvtss2si {$src, $dst|$dst, $src}", []>;
179def CVTSS2SIrm: SSI<0x2D, MRMSrcMem, (ops R32:$dst, f32mem:$src),
180 "cvtss2si {$src, $dst|$dst, $src}", []>;
181
Evan Cheng470a6ad2006-02-22 02:26:30 +0000182def CVTTSS2SIrr: SSI<0x2C, MRMSrcReg, (ops R32:$dst, FR32:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000183 "cvttss2si {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000184 [(set R32:$dst, (fp_to_sint FR32:$src))]>;
185def CVTTSS2SIrm: SSI<0x2C, MRMSrcMem, (ops R32:$dst, f32mem:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000186 "cvttss2si {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000187 [(set R32:$dst, (fp_to_sint (loadf32 addr:$src)))]>;
188def CVTTSD2SIrr: SDI<0x2C, MRMSrcReg, (ops R32:$dst, FR64:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000189 "cvttsd2si {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000190 [(set R32:$dst, (fp_to_sint FR64:$src))]>;
191def CVTTSD2SIrm: SDI<0x2C, MRMSrcMem, (ops R32:$dst, f64mem:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000192 "cvttsd2si {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000193 [(set R32:$dst, (fp_to_sint (loadf64 addr:$src)))]>;
194def CVTSD2SSrr: SDI<0x5A, MRMSrcReg, (ops FR32:$dst, FR64:$src),
195 "cvtsd2ss {$src, $dst|$dst, $src}",
196 [(set FR32:$dst, (fround FR64:$src))]>;
197def CVTSD2SSrm: SDI<0x5A, MRMSrcMem, (ops FR32:$dst, f64mem:$src),
198 "cvtsd2ss {$src, $dst|$dst, $src}",
199 [(set FR32:$dst, (fround (loadf64 addr:$src)))]>;
200def CVTSI2SSrr: SSI<0x2A, MRMSrcReg, (ops FR32:$dst, R32:$src),
201 "cvtsi2ss {$src, $dst|$dst, $src}",
202 [(set FR32:$dst, (sint_to_fp R32:$src))]>;
203def CVTSI2SSrm: SSI<0x2A, MRMSrcMem, (ops FR32:$dst, i32mem:$src),
204 "cvtsi2ss {$src, $dst|$dst, $src}",
205 [(set FR32:$dst, (sint_to_fp (loadi32 addr:$src)))]>;
206def CVTSI2SDrr: SDI<0x2A, MRMSrcReg, (ops FR64:$dst, R32:$src),
207 "cvtsi2sd {$src, $dst|$dst, $src}",
208 [(set FR64:$dst, (sint_to_fp R32:$src))]>;
209def CVTSI2SDrm: SDI<0x2A, MRMSrcMem, (ops FR64:$dst, i32mem:$src),
210 "cvtsi2sd {$src, $dst|$dst, $src}",
211 [(set FR64:$dst, (sint_to_fp (loadi32 addr:$src)))]>;
212// SSE2 instructions with XS prefix
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000213def CVTSS2SDrr: I<0x5A, MRMSrcReg, (ops FR64:$dst, FR32:$src),
214 "cvtss2sd {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000215 [(set FR64:$dst, (fextend FR32:$src))]>, XS,
216 Requires<[HasSSE2]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000217def CVTSS2SDrm: I<0x5A, MRMSrcMem, (ops FR64:$dst, f32mem:$src),
218 "cvtss2sd {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000219 [(set FR64:$dst, (fextend (loadf32 addr:$src)))]>, XS,
220 Requires<[HasSSE2]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000221
222// Arithmetic instructions
223let isTwoAddress = 1 in {
224let isCommutable = 1 in {
Evan Cheng470a6ad2006-02-22 02:26:30 +0000225def ADDSSrr : SSI<0x58, MRMSrcReg, (ops FR32:$dst, FR32:$src1, FR32:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000226 "addss {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000227 [(set FR32:$dst, (fadd FR32:$src1, FR32:$src2))]>;
228def ADDSDrr : SDI<0x58, MRMSrcReg, (ops FR64:$dst, FR64:$src1, FR64:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000229 "addsd {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000230 [(set FR64:$dst, (fadd FR64:$src1, FR64:$src2))]>;
231def MULSSrr : SSI<0x59, MRMSrcReg, (ops FR32:$dst, FR32:$src1, FR32:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000232 "mulss {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000233 [(set FR32:$dst, (fmul FR32:$src1, FR32:$src2))]>;
234def MULSDrr : SDI<0x59, MRMSrcReg, (ops FR64:$dst, FR64:$src1, FR64:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000235 "mulsd {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000236 [(set FR64:$dst, (fmul FR64:$src1, FR64:$src2))]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000237}
238
Evan Cheng470a6ad2006-02-22 02:26:30 +0000239def ADDSSrm : SSI<0x58, MRMSrcMem, (ops FR32:$dst, FR32:$src1, f32mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000240 "addss {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000241 [(set FR32:$dst, (fadd FR32:$src1, (loadf32 addr:$src2)))]>;
242def ADDSDrm : SDI<0x58, MRMSrcMem, (ops FR64:$dst, FR64:$src1, f64mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000243 "addsd {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000244 [(set FR64:$dst, (fadd FR64:$src1, (loadf64 addr:$src2)))]>;
245def MULSSrm : SSI<0x59, MRMSrcMem, (ops FR32:$dst, FR32:$src1, f32mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000246 "mulss {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000247 [(set FR32:$dst, (fmul FR32:$src1, (loadf32 addr:$src2)))]>;
248def MULSDrm : SDI<0x59, MRMSrcMem, (ops FR64:$dst, FR64:$src1, f64mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000249 "mulsd {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000250 [(set FR64:$dst, (fmul FR64:$src1, (loadf64 addr:$src2)))]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000251
Evan Cheng470a6ad2006-02-22 02:26:30 +0000252def DIVSSrr : SSI<0x5E, MRMSrcReg, (ops FR32:$dst, FR32:$src1, FR32:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000253 "divss {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000254 [(set FR32:$dst, (fdiv FR32:$src1, FR32:$src2))]>;
255def DIVSSrm : SSI<0x5E, MRMSrcMem, (ops FR32:$dst, FR32:$src1, f32mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000256 "divss {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000257 [(set FR32:$dst, (fdiv FR32:$src1, (loadf32 addr:$src2)))]>;
258def DIVSDrr : SDI<0x5E, MRMSrcReg, (ops FR64:$dst, FR64:$src1, FR64:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000259 "divsd {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000260 [(set FR64:$dst, (fdiv FR64:$src1, FR64:$src2))]>;
261def DIVSDrm : SDI<0x5E, MRMSrcMem, (ops FR64:$dst, FR64:$src1, f64mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000262 "divsd {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000263 [(set FR64:$dst, (fdiv FR64:$src1, (loadf64 addr:$src2)))]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000264
Evan Cheng470a6ad2006-02-22 02:26:30 +0000265def SUBSSrr : SSI<0x5C, MRMSrcReg, (ops FR32:$dst, FR32:$src1, FR32:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000266 "subss {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000267 [(set FR32:$dst, (fsub FR32:$src1, FR32:$src2))]>;
268def SUBSSrm : SSI<0x5C, MRMSrcMem, (ops FR32:$dst, FR32:$src1, f32mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000269 "subss {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000270 [(set FR32:$dst, (fsub FR32:$src1, (loadf32 addr:$src2)))]>;
271def SUBSDrr : SDI<0x5C, MRMSrcReg, (ops FR64:$dst, FR64:$src1, FR64:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000272 "subsd {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000273 [(set FR64:$dst, (fsub FR64:$src1, FR64:$src2))]>;
274def SUBSDrm : SDI<0x5C, MRMSrcMem, (ops FR64:$dst, FR64:$src1, f64mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000275 "subsd {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000276 [(set FR64:$dst, (fsub FR64:$src1, (loadf64 addr:$src2)))]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000277}
278
Evan Cheng470a6ad2006-02-22 02:26:30 +0000279def SQRTSSrr : SSI<0x51, MRMSrcReg, (ops FR32:$dst, FR32:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000280 "sqrtss {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000281 [(set FR32:$dst, (fsqrt FR32:$src))]>;
282def SQRTSSrm : SSI<0x51, MRMSrcMem, (ops FR32:$dst, f32mem:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000283 "sqrtss {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000284 [(set FR32:$dst, (fsqrt (loadf32 addr:$src)))]>;
285def SQRTSDrr : SDI<0x51, MRMSrcReg, (ops FR64:$dst, FR64:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000286 "sqrtsd {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000287 [(set FR64:$dst, (fsqrt FR64:$src))]>;
288def SQRTSDrm : SDI<0x51, MRMSrcMem, (ops FR64:$dst, f64mem:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000289 "sqrtsd {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000290 [(set FR64:$dst, (fsqrt (loadf64 addr:$src)))]>;
291
292def RSQRTSSrr : SSI<0x52, MRMSrcReg, (ops FR32:$dst, FR32:$src),
293 "rsqrtss {$src, $dst|$dst, $src}", []>;
294def RSQRTSSrm : SSI<0x52, MRMSrcMem, (ops FR32:$dst, f32mem:$src),
295 "rsqrtss {$src, $dst|$dst, $src}", []>;
296def RCPSSrr : SSI<0x53, MRMSrcReg, (ops FR32:$dst, FR32:$src),
297 "rcpss {$src, $dst|$dst, $src}", []>;
298def RCPSSrm : SSI<0x53, MRMSrcMem, (ops FR32:$dst, f32mem:$src),
299 "rcpss {$src, $dst|$dst, $src}", []>;
300
301def MAXSSrr : SSI<0x5F, MRMSrcReg, (ops FR32:$dst, FR32:$src),
302 "maxss {$src, $dst|$dst, $src}", []>;
303def MAXSSrm : SSI<0x5F, MRMSrcMem, (ops FR32:$dst, f32mem:$src),
304 "maxss {$src, $dst|$dst, $src}", []>;
305def MAXSDrr : SDI<0x5F, MRMSrcReg, (ops FR64:$dst, FR64:$src),
306 "maxsd {$src, $dst|$dst, $src}", []>;
307def MAXSDrm : SDI<0x5F, MRMSrcMem, (ops FR64:$dst, f64mem:$src),
308 "maxsd {$src, $dst|$dst, $src}", []>;
309def MINSSrr : SSI<0x5D, MRMSrcReg, (ops FR32:$dst, FR32:$src),
310 "minss {$src, $dst|$dst, $src}", []>;
311def MINSSrm : SSI<0x5D, MRMSrcMem, (ops FR32:$dst, f32mem:$src),
312 "minss {$src, $dst|$dst, $src}", []>;
313def MINSDrr : SDI<0x5D, MRMSrcReg, (ops FR64:$dst, FR64:$src),
314 "minsd {$src, $dst|$dst, $src}", []>;
315def MINSDrm : SDI<0x5D, MRMSrcMem, (ops FR64:$dst, f64mem:$src),
316 "minsd {$src, $dst|$dst, $src}", []>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000317
318// Comparison instructions
319let isTwoAddress = 1 in {
Evan Cheng470a6ad2006-02-22 02:26:30 +0000320def CMPSSrr : SSI<0xC2, MRMSrcReg,
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000321 (ops FR32:$dst, FR32:$src1, FR32:$src, SSECC:$cc),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000322 "cmp${cc}ss {$src, $dst|$dst, $src}", []>;
323def CMPSSrm : SSI<0xC2, MRMSrcMem,
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000324 (ops FR32:$dst, FR32:$src1, f32mem:$src, SSECC:$cc),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000325 "cmp${cc}ss {$src, $dst|$dst, $src}", []>;
326def CMPSDrr : SDI<0xC2, MRMSrcReg,
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000327 (ops FR64:$dst, FR64:$src1, FR64:$src, SSECC:$cc),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000328 "cmp${cc}sd {$src, $dst|$dst, $src}", []>;
329def CMPSDrm : SDI<0xC2, MRMSrcMem,
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000330 (ops FR64:$dst, FR64:$src1, f64mem:$src, SSECC:$cc),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000331 "cmp${cc}sd {$src, $dst|$dst, $src}", []>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000332}
333
Evan Cheng470a6ad2006-02-22 02:26:30 +0000334def UCOMISSrr: PSI<0x2E, MRMSrcReg, (ops FR32:$src1, FR32:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000335 "ucomiss {$src2, $src1|$src1, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000336 [(X86cmp FR32:$src1, FR32:$src2)]>;
337def UCOMISSrm: PSI<0x2E, MRMSrcMem, (ops FR32:$src1, f32mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000338 "ucomiss {$src2, $src1|$src1, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000339 [(X86cmp FR32:$src1, (loadf32 addr:$src2))]>;
340def UCOMISDrr: PDI<0x2E, MRMSrcReg, (ops FR64:$src1, FR64:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000341 "ucomisd {$src2, $src1|$src1, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000342 [(X86cmp FR64:$src1, FR64:$src2)]>;
343def UCOMISDrm: PDI<0x2E, MRMSrcMem, (ops FR64:$src1, f64mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000344 "ucomisd {$src2, $src1|$src1, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000345 [(X86cmp FR64:$src1, (loadf64 addr:$src2))]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000346
347// Aliases of packed instructions for scalar use. These all have names that
348// start with 'Fs'.
349
350// Alias instructions that map fld0 to pxor for sse.
351// FIXME: remove when we can teach regalloc that xor reg, reg is ok.
352def FsFLD0SS : I<0xEF, MRMInitReg, (ops FR32:$dst),
353 "pxor $dst, $dst", [(set FR32:$dst, fp32imm0)]>,
354 Requires<[HasSSE1]>, TB, OpSize;
355def FsFLD0SD : I<0xEF, MRMInitReg, (ops FR64:$dst),
356 "pxor $dst, $dst", [(set FR64:$dst, fp64imm0)]>,
357 Requires<[HasSSE2]>, TB, OpSize;
358
359// Alias instructions to do FR32 / FR64 reg-to-reg copy using movaps / movapd.
360// Upper bits are disregarded.
Evan Cheng470a6ad2006-02-22 02:26:30 +0000361def FsMOVAPSrr : PSI<0x28, MRMSrcReg, (ops FR32:$dst, FR32:$src),
362 "movaps {$src, $dst|$dst, $src}", []>;
363def FsMOVAPDrr : PDI<0x28, MRMSrcReg, (ops FR64:$dst, FR64:$src),
364 "movapd {$src, $dst|$dst, $src}", []>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000365
366// Alias instructions to load FR32 / FR64 from f128mem using movaps / movapd.
367// Upper bits are disregarded.
Evan Cheng470a6ad2006-02-22 02:26:30 +0000368def FsMOVAPSrm : PSI<0x28, MRMSrcMem, (ops FR32:$dst, f128mem:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000369 "movaps {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000370 [(set FR32:$dst, (X86loadpf32 addr:$src))]>;
371def FsMOVAPDrm : PDI<0x28, MRMSrcMem, (ops FR64:$dst, f128mem:$src),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000372 "movapd {$src, $dst|$dst, $src}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000373 [(set FR64:$dst, (X86loadpf64 addr:$src))]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000374
375// Alias bitwise logical operations using SSE logical ops on packed FP values.
376let isTwoAddress = 1 in {
377let isCommutable = 1 in {
Evan Cheng470a6ad2006-02-22 02:26:30 +0000378def FsANDPSrr : PSI<0x54, MRMSrcReg, (ops FR32:$dst, FR32:$src1, FR32:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000379 "andps {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000380 [(set FR32:$dst, (X86fand FR32:$src1, FR32:$src2))]>;
381def FsANDPDrr : PDI<0x54, MRMSrcReg, (ops FR64:$dst, FR64:$src1, FR64:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000382 "andpd {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000383 [(set FR64:$dst, (X86fand FR64:$src1, FR64:$src2))]>;
384def FsORPSrr : PSI<0x56, MRMSrcReg, (ops FR32:$dst, FR32:$src1, FR32:$src2),
385 "orps {$src2, $dst|$dst, $src2}", []>;
386def FsORPDrr : PDI<0x56, MRMSrcReg, (ops FR64:$dst, FR64:$src1, FR64:$src2),
387 "orpd {$src2, $dst|$dst, $src2}", []>;
388def FsXORPSrr : PSI<0x57, MRMSrcReg, (ops FR32:$dst, FR32:$src1, FR32:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000389 "xorps {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000390 [(set FR32:$dst, (X86fxor FR32:$src1, FR32:$src2))]>;
391def FsXORPDrr : PDI<0x57, MRMSrcReg, (ops FR64:$dst, FR64:$src1, FR64:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000392 "xorpd {$src2, $dst|$dst, $src2}",
Evan Cheng470a6ad2006-02-22 02:26:30 +0000393 [(set FR64:$dst, (X86fxor FR64:$src1, FR64:$src2))]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000394}
Evan Cheng470a6ad2006-02-22 02:26:30 +0000395def FsANDPSrm : PSI<0x54, MRMSrcMem, (ops FR32:$dst, FR32:$src1, f128mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000396 "andps {$src2, $dst|$dst, $src2}",
397 [(set FR32:$dst, (X86fand FR32:$src1,
Evan Cheng470a6ad2006-02-22 02:26:30 +0000398 (X86loadpf32 addr:$src2)))]>;
399def FsANDPDrm : PDI<0x54, MRMSrcMem, (ops FR64:$dst, FR64:$src1, f128mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000400 "andpd {$src2, $dst|$dst, $src2}",
401 [(set FR64:$dst, (X86fand FR64:$src1,
Evan Cheng470a6ad2006-02-22 02:26:30 +0000402 (X86loadpf64 addr:$src2)))]>;
403def FsORPSrm : PSI<0x56, MRMSrcMem, (ops FR32:$dst, FR32:$src1, f128mem:$src2),
404 "orps {$src2, $dst|$dst, $src2}", []>;
405def FsORPDrm : PDI<0x56, MRMSrcMem, (ops FR64:$dst, FR64:$src1, f128mem:$src2),
406 "orpd {$src2, $dst|$dst, $src2}", []>;
407def FsXORPSrm : PSI<0x57, MRMSrcMem, (ops FR32:$dst, FR32:$src1, f128mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000408 "xorps {$src2, $dst|$dst, $src2}",
409 [(set FR32:$dst, (X86fxor FR32:$src1,
Evan Cheng470a6ad2006-02-22 02:26:30 +0000410 (X86loadpf32 addr:$src2)))]>;
411def FsXORPDrm : PDI<0x57, MRMSrcMem, (ops FR64:$dst, FR64:$src1, f128mem:$src2),
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000412 "xorpd {$src2, $dst|$dst, $src2}",
413 [(set FR64:$dst, (X86fxor FR64:$src1,
Evan Cheng470a6ad2006-02-22 02:26:30 +0000414 (X86loadpf64 addr:$src2)))]>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000415
Evan Cheng470a6ad2006-02-22 02:26:30 +0000416def FsANDNPSrr : PSI<0x55, MRMSrcReg, (ops FR32:$dst, FR32:$src1, FR32:$src2),
417 "andnps {$src2, $dst|$dst, $src2}", []>;
418def FsANDNPSrm : PSI<0x55, MRMSrcMem, (ops FR32:$dst, FR32:$src1, f128mem:$src2),
419 "andnps {$src2, $dst|$dst, $src2}", []>;
420def FsANDNPDrr : PDI<0x55, MRMSrcReg, (ops FR64:$dst, FR64:$src1, FR64:$src2),
421 "andnpd {$src2, $dst|$dst, $src2}", []>;
422def FsANDNPDrm : PDI<0x55, MRMSrcMem, (ops FR64:$dst, FR64:$src1, f128mem:$src2),
423 "andnpd {$src2, $dst|$dst, $src2}", []>;
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000424}
425
426//===----------------------------------------------------------------------===//
427// SSE packed FP Instructions
428//===----------------------------------------------------------------------===//
429
Evan Chengc12e6c42006-03-19 09:38:54 +0000430// Some 'special' instructions
431def IMPLICIT_DEF_VR128 : I<0, Pseudo, (ops VR128:$dst),
432 "#IMPLICIT_DEF $dst",
433 [(set VR128:$dst, (v4f32 (undef)))]>,
434 Requires<[HasSSE1]>;
435
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000436// Move Instructions
Evan Cheng2246f842006-03-18 01:23:20 +0000437def MOVAPSrr : PSI<0x28, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000438 "movaps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000439def MOVAPSrm : PSI<0x28, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000440 "movaps {$src, $dst|$dst, $src}",
Evan Cheng2246f842006-03-18 01:23:20 +0000441 [(set VR128:$dst, (loadv4f32 addr:$src))]>;
442def MOVAPDrr : PDI<0x28, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000443 "movapd {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000444def MOVAPDrm : PDI<0x28, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000445 "movapd {$src, $dst|$dst, $src}",
Evan Cheng2246f842006-03-18 01:23:20 +0000446 [(set VR128:$dst, (loadv2f64 addr:$src))]>;
Evan Chengffcb95b2006-02-21 19:13:53 +0000447
Evan Cheng2246f842006-03-18 01:23:20 +0000448def MOVAPSmr : PSI<0x29, MRMDestMem, (ops f128mem:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000449 "movaps {$src, $dst|$dst, $src}",
Evan Cheng2246f842006-03-18 01:23:20 +0000450 [(store (v4f32 VR128:$src), addr:$dst)]>;
451def MOVAPDmr : PDI<0x29, MRMDestMem, (ops f128mem:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000452 "movapd {$src, $dst|$dst, $src}",
Evan Cheng2246f842006-03-18 01:23:20 +0000453 [(store (v2f64 VR128:$src), addr:$dst)]>;
Evan Cheng470a6ad2006-02-22 02:26:30 +0000454
Evan Cheng2246f842006-03-18 01:23:20 +0000455def MOVUPSrr : PSI<0x10, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000456 "movups {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000457def MOVUPSrm : PSI<0x10, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000458 "movups {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000459def MOVUPSmr : PSI<0x11, MRMDestMem, (ops f128mem:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000460 "movups {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000461def MOVUPDrr : PDI<0x10, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000462 "movupd {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000463def MOVUPDrm : PDI<0x10, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000464 "movupd {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000465def MOVUPDmr : PDI<0x11, MRMDestMem, (ops f128mem:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000466 "movupd {$src, $dst|$dst, $src}", []>;
467
Evan Cheng2246f842006-03-18 01:23:20 +0000468def MOVLPSrm : PSI<0x12, MRMSrcMem, (ops VR128:$dst, f64mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000469 "movlps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000470def MOVLPSmr : PSI<0x13, MRMDestMem, (ops f64mem:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000471 "movlps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000472def MOVLPDrm : PDI<0x12, MRMSrcMem, (ops VR128:$dst, f64mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000473 "movlpd {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000474def MOVLPDmr : PDI<0x13, MRMDestMem, (ops f64mem:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000475 "movlpd {$src, $dst|$dst, $src}", []>;
476
Evan Cheng2246f842006-03-18 01:23:20 +0000477def MOVHPSrm : PSI<0x16, MRMSrcMem, (ops VR128:$dst, f64mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000478 "movhps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000479def MOVHPSmr : PSI<0x17, MRMDestMem, (ops f64mem:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000480 "movhps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000481def MOVHPDrm : PDI<0x16, MRMSrcMem, (ops VR128:$dst, f64mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000482 "movhpd {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000483def MOVHPDmr : PDI<0x17, MRMDestMem, (ops f64mem:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000484 "movhpd {$src, $dst|$dst, $src}", []>;
485
Evan Cheng14aed5e2006-03-24 01:18:28 +0000486let isTwoAddress = 1 in {
487def MOVLHPSrr : PSI<0x16, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
488 "movlhps {$src2, $dst|$dst, $src2}", []>;
Evan Cheng2c0dbd02006-03-24 02:58:06 +0000489
Evan Cheng14aed5e2006-03-24 01:18:28 +0000490def MOVHLPSrr : PSI<0x12, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
491 "movlhps {$src2, $dst|$dst, $src2}", []>;
492}
Evan Cheng470a6ad2006-02-22 02:26:30 +0000493
Evan Cheng2246f842006-03-18 01:23:20 +0000494def MOVMSKPSrr : PSI<0x50, MRMSrcReg, (ops R32:$dst, VR128:$src),
Chris Lattnerac53ead2006-03-24 21:49:18 +0000495 "movmskps {$src, $dst|$dst, $src}",
496 [(set R32:$dst, (int_x86_sse_movmskps VR128:$src))]>;
Evan Cheng2246f842006-03-18 01:23:20 +0000497def MOVMSKPDrr : PSI<0x50, MRMSrcReg, (ops R32:$dst, VR128:$src),
Chris Lattnerac53ead2006-03-24 21:49:18 +0000498 "movmskpd {$src, $dst|$dst, $src}",
499 [(set R32:$dst, (int_x86_sse2_movmskpd VR128:$src))]>;
Evan Cheng470a6ad2006-02-22 02:26:30 +0000500
501// Conversion instructions
Evan Cheng2246f842006-03-18 01:23:20 +0000502def CVTPI2PSrr : PSI<0x2A, MRMSrcReg, (ops VR128:$dst, VR64:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000503 "cvtpi2ps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000504def CVTPI2PSrm : PSI<0x2A, MRMSrcMem, (ops VR128:$dst, i64mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000505 "cvtpi2ps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000506def CVTPI2PDrr : PDI<0x2A, MRMSrcReg, (ops VR128:$dst, VR64:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000507 "cvtpi2pd {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000508def CVTPI2PDrm : PDI<0x2A, MRMSrcMem, (ops VR128:$dst, i64mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000509 "cvtpi2pd {$src, $dst|$dst, $src}", []>;
510
511// SSE2 instructions without OpSize prefix
Evan Cheng2246f842006-03-18 01:23:20 +0000512def CVTDQ2PSrr : I<0x5B, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000513 "cvtdq2ps {$src, $dst|$dst, $src}", []>, TB,
514 Requires<[HasSSE2]>;
Evan Cheng2246f842006-03-18 01:23:20 +0000515def CVTDQ2PSrm : I<0x5B, MRMSrcMem, (ops VR128:$dst, i128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000516 "cvtdq2ps {$src, $dst|$dst, $src}", []>, TB,
517 Requires<[HasSSE2]>;
518
519// SSE2 instructions with XS prefix
Evan Cheng2246f842006-03-18 01:23:20 +0000520def CVTDQ2PDrr : I<0xE6, MRMSrcReg, (ops VR128:$dst, VR64:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000521 "cvtdq2pd {$src, $dst|$dst, $src}", []>,
522 XS, Requires<[HasSSE2]>;
Evan Cheng2246f842006-03-18 01:23:20 +0000523def CVTDQ2PDrm : I<0xE6, MRMSrcMem, (ops VR128:$dst, i64mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000524 "cvtdq2pd {$src, $dst|$dst, $src}", []>,
525 XS, Requires<[HasSSE2]>;
526
Evan Cheng2246f842006-03-18 01:23:20 +0000527def CVTPS2PIrr : PSI<0x2D, MRMSrcReg, (ops VR64:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000528 "cvtps2pi {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000529def CVTPS2PIrm : PSI<0x2D, MRMSrcMem, (ops VR64:$dst, f64mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000530 "cvtps2pi {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000531def CVTPD2PIrr : PDI<0x2D, MRMSrcReg, (ops VR64:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000532 "cvtpd2pi {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000533def CVTPD2PIrm : PDI<0x2D, MRMSrcMem, (ops VR64:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000534 "cvtpd2pi {$src, $dst|$dst, $src}", []>;
535
Evan Cheng2246f842006-03-18 01:23:20 +0000536def CVTPS2DQrr : PDI<0x5B, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000537 "cvtps2dq {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000538def CVTPS2DQrm : PDI<0x5B, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000539 "cvtps2dq {$src, $dst|$dst, $src}", []>;
540// SSE2 packed instructions with XD prefix
Evan Cheng2246f842006-03-18 01:23:20 +0000541def CVTPD2DQrr : SDI<0xE6, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000542 "cvtpd2dq {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000543def CVTPD2DQrm : SDI<0xE6, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000544 "cvtpd2dq {$src, $dst|$dst, $src}", []>;
545
546// SSE2 instructions without OpSize prefix
Evan Cheng2246f842006-03-18 01:23:20 +0000547def CVTPS2PDrr : I<0x5A, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000548 "cvtps2pd {$src, $dst|$dst, $src}", []>, TB,
549 Requires<[HasSSE2]>;
Evan Cheng2246f842006-03-18 01:23:20 +0000550def CVTPS2PDrm : I<0x5A, MRMSrcReg, (ops VR128:$dst, f64mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000551 "cvtps2pd {$src, $dst|$dst, $src}", []>, TB,
552 Requires<[HasSSE2]>;
553
Evan Cheng2246f842006-03-18 01:23:20 +0000554def CVTPD2PSrr : PDI<0x5A, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000555 "cvtpd2ps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000556def CVTPD2PSrm : PDI<0x5A, MRMSrcReg, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000557 "cvtpd2ps {$src, $dst|$dst, $src}", []>;
558
559// Arithmetic
560let isTwoAddress = 1 in {
561let isCommutable = 1 in {
Evan Cheng2246f842006-03-18 01:23:20 +0000562def ADDPSrr : PSI<0x58, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000563 "addps {$src2, $dst|$dst, $src2}",
Evan Cheng2246f842006-03-18 01:23:20 +0000564 [(set VR128:$dst, (v4f32 (fadd VR128:$src1, VR128:$src2)))]>;
565def ADDPDrr : PDI<0x58, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000566 "addpd {$src2, $dst|$dst, $src2}",
Evan Cheng2246f842006-03-18 01:23:20 +0000567 [(set VR128:$dst, (v2f64 (fadd VR128:$src1, VR128:$src2)))]>;
568def MULPSrr : PSI<0x59, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000569 "mulps {$src2, $dst|$dst, $src2}",
Evan Cheng2246f842006-03-18 01:23:20 +0000570 [(set VR128:$dst, (v4f32 (fmul VR128:$src1, VR128:$src2)))]>;
571def MULPDrr : PDI<0x59, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000572 "mulpd {$src2, $dst|$dst, $src2}",
Evan Cheng2246f842006-03-18 01:23:20 +0000573 [(set VR128:$dst, (v2f64 (fmul VR128:$src1, VR128:$src2)))]>;
Evan Cheng470a6ad2006-02-22 02:26:30 +0000574}
575
Evan Cheng2246f842006-03-18 01:23:20 +0000576def ADDPSrm : PSI<0x58, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000577 "addps {$src2, $dst|$dst, $src2}",
Evan Cheng2246f842006-03-18 01:23:20 +0000578 [(set VR128:$dst, (v4f32 (fadd VR128:$src1,
579 (load addr:$src2))))]>;
580def ADDPDrm : PDI<0x58, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000581 "addpd {$src2, $dst|$dst, $src2}",
Evan Cheng2246f842006-03-18 01:23:20 +0000582 [(set VR128:$dst, (v2f64 (fadd VR128:$src1,
583 (load addr:$src2))))]>;
584def MULPSrm : PSI<0x59, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000585 "mulps {$src2, $dst|$dst, $src2}",
Evan Cheng2246f842006-03-18 01:23:20 +0000586 [(set VR128:$dst, (v4f32 (fmul VR128:$src1,
587 (load addr:$src2))))]>;
588def MULPDrm : PDI<0x59, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000589 "mulpd {$src2, $dst|$dst, $src2}",
Evan Cheng2246f842006-03-18 01:23:20 +0000590 [(set VR128:$dst, (v2f64 (fmul VR128:$src1,
591 (load addr:$src2))))]>;
Evan Cheng470a6ad2006-02-22 02:26:30 +0000592
Evan Cheng2246f842006-03-18 01:23:20 +0000593def DIVPSrr : PSI<0x5E, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
594 "divps {$src2, $dst|$dst, $src2}",
595 [(set VR128:$dst, (v4f32 (fdiv VR128:$src1, VR128:$src2)))]>;
596def DIVPSrm : PSI<0x5E, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
597 "divps {$src2, $dst|$dst, $src2}",
598 [(set VR128:$dst, (v4f32 (fdiv VR128:$src1,
599 (load addr:$src2))))]>;
600def DIVPDrr : PDI<0x5E, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000601 "divpd {$src2, $dst|$dst, $src2}",
Evan Cheng2246f842006-03-18 01:23:20 +0000602 [(set VR128:$dst, (v2f64 (fdiv VR128:$src1, VR128:$src2)))]>;
603def DIVPDrm : PDI<0x5E, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000604 "divpd {$src2, $dst|$dst, $src2}",
Evan Cheng2246f842006-03-18 01:23:20 +0000605 [(set VR128:$dst, (v2f64 (fdiv VR128:$src1,
606 (load addr:$src2))))]>;
Evan Cheng470a6ad2006-02-22 02:26:30 +0000607
Evan Cheng2246f842006-03-18 01:23:20 +0000608def SUBPSrr : PSI<0x5C, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
609 "subps {$src2, $dst|$dst, $src2}",
610 [(set VR128:$dst, (v4f32 (fsub VR128:$src1, VR128:$src2)))]>;
611def SUBPSrm : PSI<0x5C, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
612 "subps {$src2, $dst|$dst, $src2}",
613 [(set VR128:$dst, (v4f32 (fsub VR128:$src1,
614 (load addr:$src2))))]>;
615def SUBPDrr : PDI<0x5C, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
616 "subpd {$src2, $dst|$dst, $src2}",
Evan Cheng2c0dbd02006-03-24 02:58:06 +0000617 [(set VR128:$dst, (v2f64 (fsub VR128:$src1, VR128:$src2)))]>;
Evan Cheng2246f842006-03-18 01:23:20 +0000618def SUBPDrm : PDI<0x5C, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
619 "subpd {$src2, $dst|$dst, $src2}",
Evan Cheng2c0dbd02006-03-24 02:58:06 +0000620 [(set VR128:$dst, (v2f64 (fsub VR128:$src1,
621 (load addr:$src2))))]>;
Evan Cheng470a6ad2006-02-22 02:26:30 +0000622}
623
Evan Cheng2246f842006-03-18 01:23:20 +0000624def SQRTPSrr : PSI<0x51, MRMSrcReg, (ops VR128:$dst, VR128:$src),
625 "sqrtps {$src, $dst|$dst, $src}",
626 [(set VR128:$dst, (v4f32 (fsqrt VR128:$src)))]>;
627def SQRTPSrm : PSI<0x51, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
628 "sqrtps {$src, $dst|$dst, $src}",
629 [(set VR128:$dst, (v4f32 (fsqrt (load addr:$src))))]>;
630def SQRTPDrr : PDI<0x51, MRMSrcReg, (ops VR128:$dst, VR128:$src),
631 "sqrtpd {$src, $dst|$dst, $src}",
632 [(set VR128:$dst, (v2f64 (fsqrt VR128:$src)))]>;
633def SQRTPDrm : PDI<0x51, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
634 "sqrtpd {$src, $dst|$dst, $src}",
635 [(set VR128:$dst, (v2f64 (fsqrt (load addr:$src))))]>;
Evan Cheng470a6ad2006-02-22 02:26:30 +0000636
Evan Cheng2246f842006-03-18 01:23:20 +0000637def RSQRTPSrr : PSI<0x52, MRMSrcReg, (ops VR128:$dst, VR128:$src),
638 "rsqrtps {$src, $dst|$dst, $src}", []>;
639def RSQRTPSrm : PSI<0x52, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
640 "rsqrtps {$src, $dst|$dst, $src}", []>;
641def RCPPSrr : PSI<0x53, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000642 "rcpps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000643def RCPPSrm : PSI<0x53, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000644 "rcpps {$src, $dst|$dst, $src}", []>;
645
Evan Cheng2246f842006-03-18 01:23:20 +0000646def MAXPSrr : PSI<0x5F, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000647 "maxps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000648def MAXPSrm : PSI<0x5F, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000649 "maxps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000650def MAXPDrr : PDI<0x5F, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000651 "maxpd {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000652def MAXPDrm : PDI<0x5F, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000653 "maxpd {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000654def MINPSrr : PSI<0x5D, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000655 "minps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000656def MINPSrm : PSI<0x5D, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000657 "minps {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000658def MINPDrr : PDI<0x5D, MRMSrcReg, (ops VR128:$dst, VR128:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000659 "minpd {$src, $dst|$dst, $src}", []>;
Evan Cheng2246f842006-03-18 01:23:20 +0000660def MINPDrm : PDI<0x5D, MRMSrcMem, (ops VR128:$dst, f128mem:$src),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000661 "minpd {$src, $dst|$dst, $src}", []>;
Evan Chengffcb95b2006-02-21 19:13:53 +0000662
663// Logical
664let isTwoAddress = 1 in {
665let isCommutable = 1 in {
Evan Cheng2246f842006-03-18 01:23:20 +0000666def ANDPSrr : PSI<0x54, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
667 "andps {$src2, $dst|$dst, $src2}",
668 [(set VR128:$dst, (v4i32 (and VR128:$src1, VR128:$src2)))]>;
669def ANDPDrr : PDI<0x54, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
Evan Chengffcb95b2006-02-21 19:13:53 +0000670 "andpd {$src2, $dst|$dst, $src2}",
Evan Cheng2246f842006-03-18 01:23:20 +0000671 [(set VR128:$dst, (v2i64 (and VR128:$src1, VR128:$src2)))]>;
672def ORPSrr : PSI<0x56, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
673 "orps {$src2, $dst|$dst, $src2}",
674 [(set VR128:$dst, (v4i32 (or VR128:$src1, VR128:$src2)))]>;
675def ORPDrr : PDI<0x56, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
676 "orpd {$src2, $dst|$dst, $src2}",
677 [(set VR128:$dst, (v2i64 (or VR128:$src1, VR128:$src2)))]>;
678def XORPSrr : PSI<0x57, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
679 "xorps {$src2, $dst|$dst, $src2}",
680 [(set VR128:$dst, (v4i32 (xor VR128:$src1, VR128:$src2)))]>;
681def XORPDrr : PDI<0x57, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
682 "xorpd {$src2, $dst|$dst, $src2}",
683 [(set VR128:$dst, (v2i64 (xor VR128:$src1, VR128:$src2)))]>;
Evan Chengffcb95b2006-02-21 19:13:53 +0000684}
Evan Cheng2246f842006-03-18 01:23:20 +0000685def ANDPSrm : PSI<0x54, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
686 "andps {$src2, $dst|$dst, $src2}",
687 [(set VR128:$dst, (v4i32 (and VR128:$src1,
688 (load addr:$src2))))]>;
689def ANDPDrm : PDI<0x54, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
690 "andpd {$src2, $dst|$dst, $src2}",
691 [(set VR128:$dst, (v2i64 (and VR128:$src1,
692 (load addr:$src2))))]>;
693def ORPSrm : PSI<0x56, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
694 "orps {$src2, $dst|$dst, $src2}",
695 [(set VR128:$dst, (v4i32 (or VR128:$src1,
696 (load addr:$src2))))]>;
697def ORPDrm : PDI<0x56, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
698 "orpd {$src2, $dst|$dst, $src2}",
699 [(set VR128:$dst, (v2i64 (or VR128:$src1,
700 (load addr:$src2))))]>;
701def XORPSrm : PSI<0x57, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
702 "xorps {$src2, $dst|$dst, $src2}",
703 [(set VR128:$dst, (v4i32 (xor VR128:$src1,
704 (load addr:$src2))))]>;
705def XORPDrm : PDI<0x57, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
706 "xorpd {$src2, $dst|$dst, $src2}",
707 [(set VR128:$dst, (v2i64 (xor VR128:$src1,
708 (load addr:$src2))))]>;
709def ANDNPSrr : PSI<0x55, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
710 "andnps {$src2, $dst|$dst, $src2}",
711 [(set VR128:$dst, (v4i32 (and (not VR128:$src1),
712 VR128:$src2)))]>;
713def ANDNPSrm : PSI<0x55, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
714 "andnps {$src2, $dst|$dst, $src2}",
715 [(set VR128:$dst, (v4i32 (and (not VR128:$src1),
716 (load addr:$src2))))]>;
717def ANDNPDrr : PDI<0x55, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
718 "andnpd {$src2, $dst|$dst, $src2}",
719 [(set VR128:$dst, (v2i64 (and (not VR128:$src1),
720 VR128:$src2)))]>;
721
722def ANDNPDrm : PDI<0x55, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
723 "andnpd {$src2, $dst|$dst, $src2}",
724 [(set VR128:$dst, (v2i64 (and VR128:$src1,
725 (load addr:$src2))))]>;
Evan Chengffcb95b2006-02-21 19:13:53 +0000726}
Evan Chengbf156d12006-02-21 19:26:52 +0000727
Evan Cheng470a6ad2006-02-22 02:26:30 +0000728let isTwoAddress = 1 in {
729def CMPPSrr : PSI<0xC2, MRMSrcReg,
Evan Cheng2246f842006-03-18 01:23:20 +0000730 (ops VR128:$dst, VR128:$src1, VR128:$src, SSECC:$cc),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000731 "cmp${cc}ps {$src, $dst|$dst, $src}", []>;
732def CMPPSrm : PSI<0xC2, MRMSrcMem,
Evan Cheng2246f842006-03-18 01:23:20 +0000733 (ops VR128:$dst, VR128:$src1, f128mem:$src, SSECC:$cc),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000734 "cmp${cc}ps {$src, $dst|$dst, $src}", []>;
735def CMPPDrr : PDI<0xC2, MRMSrcReg,
Evan Cheng2246f842006-03-18 01:23:20 +0000736 (ops VR128:$dst, VR128:$src1, VR128:$src, SSECC:$cc),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000737 "cmp${cc}pd {$src, $dst|$dst, $src}", []>;
738def CMPPDrm : PDI<0xC2, MRMSrcMem,
Evan Cheng2246f842006-03-18 01:23:20 +0000739 (ops VR128:$dst, VR128:$src1, f128mem:$src, SSECC:$cc),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000740 "cmp${cc}pd {$src, $dst|$dst, $src}", []>;
741}
742
743// Shuffle and unpack instructions
Evan Cheng2da953f2006-03-22 07:10:28 +0000744def PSHUFWrr : PSIi8<0x70, MRMDestReg,
745 (ops VR64:$dst, VR64:$src1, i8imm:$src2),
746 "pshufw {$src2, $src1, $dst|$dst, $src1, $src2}", []>;
747def PSHUFWrm : PSIi8<0x70, MRMSrcMem,
748 (ops VR64:$dst, i64mem:$src1, i8imm:$src2),
749 "pshufw {$src2, $src1, $dst|$dst, $src1, $src2}", []>;
750def PSHUFDrr : PDIi8<0x70, MRMDestReg,
751 (ops VR128:$dst, VR128:$src1, i8imm:$src2),
Evan Cheng0188ecb2006-03-22 18:59:22 +0000752 "pshufd {$src2, $src1, $dst|$dst, $src1, $src2}", []>;
Evan Cheng2da953f2006-03-22 07:10:28 +0000753def PSHUFDrm : PDIi8<0x70, MRMSrcMem,
754 (ops VR128:$dst, i128mem:$src1, i8imm:$src2),
755 "pshufd {$src2, $src1, $dst|$dst, $src1, $src2}", []>;
Evan Chengb9df0ca2006-03-22 02:53:00 +0000756
Evan Cheng0cea6d22006-03-22 20:08:18 +0000757let isTwoAddress = 1 in {
Evan Cheng2da953f2006-03-22 07:10:28 +0000758def SHUFPSrr : PSIi8<0xC6, MRMSrcReg,
759 (ops VR128:$dst, VR128:$src1, VR128:$src2, i8imm:$src3),
Evan Cheng14aed5e2006-03-24 01:18:28 +0000760 "shufps {$src3, $src2, $dst|$dst, $src2, $src3}",
761 [(set VR128:$dst, (vector_shuffle
762 (v4f32 VR128:$src1), (v4f32 VR128:$src2),
763 SHUFP_shuffle_mask:$src3))]>;
Evan Cheng2da953f2006-03-22 07:10:28 +0000764def SHUFPSrm : PSIi8<0xC6, MRMSrcMem,
765 (ops VR128:$dst, VR128:$src1, f128mem:$src2, i8imm:$src3),
766 "shufps {$src3, $src2, $dst|$dst, $src2, $src3}", []>;
767def SHUFPDrr : PDIi8<0xC6, MRMSrcReg,
768 (ops VR128:$dst, VR128:$src1, VR128:$src2, i8imm:$src3),
Evan Cheng14aed5e2006-03-24 01:18:28 +0000769 "shufpd {$src3, $src2, $dst|$dst, $src2, $src3}",
770 [(set VR128:$dst, (vector_shuffle
771 (v2f64 VR128:$src1), (v2f64 VR128:$src2),
772 SHUFP_shuffle_mask:$src3))]>;
Evan Cheng2da953f2006-03-22 07:10:28 +0000773def SHUFPDrm : PDIi8<0xC6, MRMSrcMem,
774 (ops VR128:$dst, VR128:$src1, f128mem:$src2, i8imm:$src3),
775 "shufpd {$src3, $src2, $dst|$dst, $src2, $src3}", []>;
Evan Cheng470a6ad2006-02-22 02:26:30 +0000776
777def UNPCKHPSrr : PSI<0x15, MRMSrcReg,
Evan Cheng2246f842006-03-18 01:23:20 +0000778 (ops VR128:$dst, VR128:$src1, VR128:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000779 "unpckhps {$src2, $dst|$dst, $src2}", []>;
780def UNPCKHPSrm : PSI<0x15, MRMSrcMem,
Evan Cheng2246f842006-03-18 01:23:20 +0000781 (ops VR128:$dst, VR128:$src1, f128mem:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000782 "unpckhps {$src2, $dst|$dst, $src2}", []>;
783def UNPCKHPDrr : PDI<0x15, MRMSrcReg,
Evan Cheng2246f842006-03-18 01:23:20 +0000784 (ops VR128:$dst, VR128:$src1, VR128:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000785 "unpckhpd {$src2, $dst|$dst, $src2}", []>;
786def UNPCKHPDrm : PDI<0x15, MRMSrcMem,
Evan Cheng2246f842006-03-18 01:23:20 +0000787 (ops VR128:$dst, VR128:$src1, f128mem:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000788 "unpckhpd {$src2, $dst|$dst, $src2}", []>;
789def UNPCKLPSrr : PSI<0x14, MRMSrcReg,
Evan Cheng2246f842006-03-18 01:23:20 +0000790 (ops VR128:$dst, VR128:$src1, VR128:$src2),
Evan Chengc60bd972006-03-25 09:37:23 +0000791 "unpcklps {$src2, $dst|$dst, $src2}",
792 [(set VR128:$dst, (v4f32 (X86unpckl VR128:$src1,
793 VR128:$src2)))]>;
Evan Cheng470a6ad2006-02-22 02:26:30 +0000794def UNPCKLPSrm : PSI<0x14, MRMSrcMem,
Evan Cheng2246f842006-03-18 01:23:20 +0000795 (ops VR128:$dst, VR128:$src1, f128mem:$src2),
Evan Chengc60bd972006-03-25 09:37:23 +0000796 "unpcklps {$src2, $dst|$dst, $src2}",
797 [(set VR128:$dst, (v4f32 (X86unpckl VR128:$src1,
798 (load addr:$src2))))]>;
Evan Cheng470a6ad2006-02-22 02:26:30 +0000799def UNPCKLPDrr : PDI<0x14, MRMSrcReg,
Evan Cheng2246f842006-03-18 01:23:20 +0000800 (ops VR128:$dst, VR128:$src1, VR128:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000801 "unpcklpd {$src2, $dst|$dst, $src2}", []>;
802def UNPCKLPDrm : PDI<0x14, MRMSrcMem,
Evan Cheng2246f842006-03-18 01:23:20 +0000803 (ops VR128:$dst, VR128:$src1, f128mem:$src2),
Evan Cheng470a6ad2006-02-22 02:26:30 +0000804 "unpcklpd {$src2, $dst|$dst, $src2}", []>;
Evan Cheng2c0dbd02006-03-24 02:58:06 +0000805}
Evan Cheng470a6ad2006-02-22 02:26:30 +0000806
Evan Chengbf156d12006-02-21 19:26:52 +0000807//===----------------------------------------------------------------------===//
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000808// SSE integer instructions
Evan Chengbf156d12006-02-21 19:26:52 +0000809//===----------------------------------------------------------------------===//
810
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000811// Move Instructions
Evan Cheng470a6ad2006-02-22 02:26:30 +0000812def MOVD128rr : PDI<0x6E, MRMSrcReg, (ops VR128:$dst, R32:$src),
Evan Cheng24dc1f52006-03-23 07:44:07 +0000813 "movd {$src, $dst|$dst, $src}",
Evan Cheng48090aa2006-03-21 23:01:21 +0000814 [(set VR128:$dst,
815 (v4i32 (scalar_to_vector R32:$src)))]>;
Evan Cheng470a6ad2006-02-22 02:26:30 +0000816def MOVD128rm : PDI<0x6E, MRMSrcMem, (ops VR128:$dst, i32mem:$src),
Evan Chengbc4832b2006-03-24 23:15:12 +0000817 "movd {$src, $dst|$dst, $src}",
818 [(set VR128:$dst,
819 (v4i32 (scalar_to_vector (loadi32 addr:$src))))]>;
820
Evan Cheng470a6ad2006-02-22 02:26:30 +0000821def MOVD128mr : PDI<0x7E, MRMDestMem, (ops i32mem:$dst, VR128:$src),
822 "movd {$src, $dst|$dst, $src}", []>;
Evan Chengbf156d12006-02-21 19:26:52 +0000823
Evan Cheng24dc1f52006-03-23 07:44:07 +0000824def MOVDQArr : PDI<0x6F, MRMSrcReg, (ops VR128:$dst, VR128:$src),
825 "movdqa {$src, $dst|$dst, $src}", []>;
826def MOVDQArm : PDI<0x6F, MRMSrcMem, (ops VR128:$dst, i128mem:$src),
827 "movdqa {$src, $dst|$dst, $src}",
828 [(set VR128:$dst, (loadv4i32 addr:$src))]>;
829def MOVDQAmr : PDI<0x7F, MRMDestMem, (ops i128mem:$dst, VR128:$src),
830 "movdqa {$src, $dst|$dst, $src}",
831 [(store (v4i32 VR128:$src), addr:$dst)]>;
832
Evan Cheng470a6ad2006-02-22 02:26:30 +0000833// SSE2 instructions with XS prefix
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000834def MOVQ128rr : I<0x7E, MRMSrcReg, (ops VR128:$dst, VR64:$src),
Evan Cheng48090aa2006-03-21 23:01:21 +0000835 "movq {$src, $dst|$dst, $src}",
836 [(set VR128:$dst,
837 (v2i64 (scalar_to_vector VR64:$src)))]>, XS,
Evan Cheng4e4c71e2006-02-21 20:00:20 +0000838 Requires<[HasSSE2]>;
839def MOVQ128rm : I<0x7E, MRMSrcMem, (ops VR128:$dst, i64mem:$src),
Evan Chengbc4832b2006-03-24 23:15:12 +0000840 "movq {$src, $dst|$dst, $src}", []>, XS,
841 Requires<[HasSSE2]>;
Evan Cheng470a6ad2006-02-22 02:26:30 +0000842def MOVQ128mr : PDI<0xD6, MRMSrcMem, (ops i64mem:$dst, VR128:$src),
843 "movq {$src, $dst|$dst, $src}", []>;
Evan Cheng82521dd2006-03-21 07:09:35 +0000844
Evan Chenga971f6f2006-03-23 01:57:24 +0000845// 128-bit Integer Arithmetic
846let isTwoAddress = 1 in {
847let isCommutable = 1 in {
848def PADDBrr : PDI<0xFC, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
849 "paddb {$src2, $dst|$dst, $src2}",
850 [(set VR128:$dst, (v16i8 (add VR128:$src1, VR128:$src2)))]>;
851def PADDWrr : PDI<0xFD, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
852 "paddw {$src2, $dst|$dst, $src2}",
853 [(set VR128:$dst, (v8i16 (add VR128:$src1, VR128:$src2)))]>;
854def PADDDrr : PDI<0xFE, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
855 "paddd {$src2, $dst|$dst, $src2}",
856 [(set VR128:$dst, (v4i32 (add VR128:$src1, VR128:$src2)))]>;
857}
858def PADDBrm : PDI<0xFC, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
859 "paddb {$src2, $dst|$dst, $src2}",
860 [(set VR128:$dst, (v16i8 (add VR128:$src1,
861 (load addr:$src2))))]>;
862def PADDWrm : PDI<0xFD, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
863 "paddw {$src2, $dst|$dst, $src2}",
864 [(set VR128:$dst, (v8i16 (add VR128:$src1,
865 (load addr:$src2))))]>;
866def PADDDrm : PDI<0xFE, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
867 "paddd {$src2, $dst|$dst, $src2}",
868 [(set VR128:$dst, (v4i32 (add VR128:$src1,
869 (load addr:$src2))))]>;
Evan Cheng7b1d34b2006-03-25 01:33:37 +0000870
871def PSUBBrr : PDI<0xF8, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
872 "psubb {$src2, $dst|$dst, $src2}",
873 [(set VR128:$dst, (v16i8 (sub VR128:$src1, VR128:$src2)))]>;
874def PSUBWrr : PDI<0xF9, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
875 "psubw {$src2, $dst|$dst, $src2}",
876 [(set VR128:$dst, (v8i16 (sub VR128:$src1, VR128:$src2)))]>;
877def PSUBDrr : PDI<0xFA, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
878 "psubd {$src2, $dst|$dst, $src2}",
879 [(set VR128:$dst, (v4i32 (sub VR128:$src1, VR128:$src2)))]>;
880
881def PSUBBrm : PDI<0xF8, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
882 "psubb {$src2, $dst|$dst, $src2}",
883 [(set VR128:$dst, (v16i8 (sub VR128:$src1,
884 (load addr:$src2))))]>;
885def PSUBWrm : PDI<0xF9, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
886 "psubw {$src2, $dst|$dst, $src2}",
887 [(set VR128:$dst, (v8i16 (sub VR128:$src1,
888 (load addr:$src2))))]>;
889def PSUBDrm : PDI<0xFA, MRMSrcMem, (ops VR128:$dst, VR128:$src1, f128mem:$src2),
890 "psubd {$src2, $dst|$dst, $src2}",
891 [(set VR128:$dst, (v4i32 (sub VR128:$src1,
892 (load addr:$src2))))]>;
Evan Chengc60bd972006-03-25 09:37:23 +0000893
894// Unpack and interleave
895def PUNPCKLBWrr : PDI<0x60, MRMSrcReg,
896 (ops VR128:$dst, VR128:$src1, VR128:$src2),
897 "punpcklbw {$src2, $dst|$dst, $src2}",
898 [(set VR128:$dst, (v16i8 (X86unpckl VR128:$src1,
899 VR128:$src2)))]>;
900def PUNPCKLBWrm : PDI<0x60, MRMSrcMem,
901 (ops VR128:$dst, VR128:$src1, i128mem:$src2),
902 "punpcklbw {$src2, $dst|$dst, $src2}",
903 [(set VR128:$dst, (v16i8 (X86unpckl VR128:$src1,
904 (load addr:$src2))))]>;
905def PUNPCKLWDrr : PDI<0x61, MRMSrcReg,
906 (ops VR128:$dst, VR128:$src1, VR128:$src2),
907 "punpcklwd {$src2, $dst|$dst, $src2}",
908 [(set VR128:$dst, (v8i16 (X86unpckl VR128:$src1,
909 VR128:$src2)))]>;
910def PUNPCKLWDrm : PDI<0x61, MRMSrcMem,
911 (ops VR128:$dst, VR128:$src1, i128mem:$src2),
912 "punpcklwd {$src2, $dst|$dst, $src2}",
913 [(set VR128:$dst, (v8i16 (X86unpckl VR128:$src1,
914 (load addr:$src2))))]>;
915def PUNPCKLDQrr : PDI<0x62, MRMSrcReg,
916 (ops VR128:$dst, VR128:$src1, VR128:$src2),
917 "punpckldq {$src2, $dst|$dst, $src2}",
918 [(set VR128:$dst, (v4i32 (X86unpckl VR128:$src1,
919 VR128:$src2)))]>;
920def PUNPCKLDQrm : PDI<0x62, MRMSrcMem,
921 (ops VR128:$dst, VR128:$src1, i128mem:$src2),
922 "punpckldq {$src2, $dst|$dst, $src2}",
923 [(set VR128:$dst, (v4i32 (X86unpckl VR128:$src1,
924 (load addr:$src2))))]>;
925def PUNPCKLQDQrr : PDI<0x6C, MRMSrcReg,
926 (ops VR128:$dst, VR128:$src1, VR128:$src2),
927 "punpcklqdq {$src2, $dst|$dst, $src2}", []>;
928def PUNPCKLQDQrm : PDI<0x6C, MRMSrcMem,
929 (ops VR128:$dst, VR128:$src1, i128mem:$src2),
930 "punpcklqdq {$src2, $dst|$dst, $src2}", []>;
931
932def PUNPCKHBWrr : PDI<0x68, MRMSrcReg,
933 (ops VR128:$dst, VR128:$src1, VR128:$src2),
934 "punpckhbw {$src2, $dst|$dst, $src2}", []>;
935def PUNPCKHBWrm : PDI<0x68, MRMSrcMem,
936 (ops VR128:$dst, VR128:$src1, i128mem:$src2),
937 "punpckhbw {$src2, $dst|$dst, $src2}", []>;
938def PUNPCKHWDrr : PDI<0x69, MRMSrcReg,
939 (ops VR128:$dst, VR128:$src1, VR128:$src2),
940 "punpckhwd {$src2, $dst|$dst, $src2}", []>;
941def PUNPCKHWDrm : PDI<0x69, MRMSrcMem,
942 (ops VR128:$dst, VR128:$src1, i128mem:$src2),
943 "punpckhwd {$src2, $dst|$dst, $src2}", []>;
944def PUNPCKHDQrr : PDI<0x6A, MRMSrcReg,
945 (ops VR128:$dst, VR128:$src1, VR128:$src2),
946 "punpckhdq {$src2, $dst|$dst, $src2}", []>;
947def PUNPCKHDQrm : PDI<0x6A, MRMSrcMem,
948 (ops VR128:$dst, VR128:$src1, i128mem:$src2),
949 "punpckhdq {$src2, $dst|$dst, $src2}", []>;
950def PUNPCKHQDQrr : PDI<0x6D, MRMSrcReg,
951 (ops VR128:$dst, VR128:$src1, VR128:$src2),
952 "punpckhdq {$src2, $dst|$dst, $src2}", []>;
953def PUNPCKHQDQrm : PDI<0x6D, MRMSrcMem,
954 (ops VR128:$dst, VR128:$src1, i128mem:$src2),
955 "punpckhqdq {$src2, $dst|$dst, $src2}", []>;
Evan Chenga971f6f2006-03-23 01:57:24 +0000956}
Evan Cheng82521dd2006-03-21 07:09:35 +0000957
958//===----------------------------------------------------------------------===//
Evan Chengc653d482006-03-24 22:28:37 +0000959// Miscellaneous Instructions
960//===----------------------------------------------------------------------===//
961
Evan Chengecac9cb2006-03-25 06:03:26 +0000962// Prefetching loads
963def PREFETCHT0 : I<0x18, MRM1m, (ops i8mem:$src),
964 "prefetcht0 $src", []>, TB,
965 Requires<[HasSSE1]>;
966def PREFETCHT1 : I<0x18, MRM2m, (ops i8mem:$src),
967 "prefetcht0 $src", []>, TB,
968 Requires<[HasSSE1]>;
969def PREFETCHT2 : I<0x18, MRM3m, (ops i8mem:$src),
970 "prefetcht0 $src", []>, TB,
971 Requires<[HasSSE1]>;
972def PREFETCHTNTA : I<0x18, MRM0m, (ops i8mem:$src),
973 "prefetcht0 $src", []>, TB,
974 Requires<[HasSSE1]>;
975
976// Non-temporal stores
977def MOVNTQ : I<0xE7, MRMDestMem, (ops i64mem:$dst, VR64:$src),
978 "movntq {$src, $dst|$dst, $src}", []>, TB,
979 Requires<[HasSSE1]>;
980def MOVNTPS : I<0x2B, MRMDestMem, (ops i128mem:$dst, VR128:$src),
981 "movntps {$src, $dst|$dst, $src}", []>, TB,
982 Requires<[HasSSE1]>;
983def MASKMOVQ : I<0xF7, MRMDestMem, (ops i64mem:$dst, VR64:$src),
984 "maskmovq {$src, $dst|$dst, $src}", []>, TB,
985 Requires<[HasSSE1]>;
986
987// Store fence
988def SFENCE : I<0xAE, MRM7m, (ops),
989 "sfence", []>, TB, Requires<[HasSSE1]>;
990
991// Load MXCSR register
Evan Chengc653d482006-03-24 22:28:37 +0000992def LDMXCSR : I<0xAE, MRM2m, (ops i32mem:$src),
993 "ldmxcsr {$src|$src}", []>, TB, Requires<[HasSSE1]>;
994
995//===----------------------------------------------------------------------===//
Evan Cheng82521dd2006-03-21 07:09:35 +0000996// Alias Instructions
997//===----------------------------------------------------------------------===//
998
Evan Chengffea91e2006-03-26 09:53:12 +0000999// Alias instructions that map zero vector to pxor / xorp* for sse.
Evan Cheng386031a2006-03-24 07:29:27 +00001000// FIXME: remove when we can teach regalloc that xor reg, reg is ok.
Evan Chengffea91e2006-03-26 09:53:12 +00001001def V_SET0_PI : PDI<0xEF, MRMInitReg, (ops VR128:$dst),
1002 "pxor $dst, $dst",
1003 [(set VR128:$dst, (v2i64 immAllZerosV))]>;
1004def V_SET0_PS : PSI<0x57, MRMInitReg, (ops VR128:$dst),
1005 "xorps $dst, $dst",
1006 [(set VR128:$dst, (v4f32 immAllZerosV))]>;
1007def V_SET0_PD : PDI<0x57, MRMInitReg, (ops VR128:$dst),
1008 "xorpd $dst, $dst",
1009 [(set VR128:$dst, (v2f64 immAllZerosV))]>;
Evan Cheng386031a2006-03-24 07:29:27 +00001010
Evan Chenga0b3afb2006-03-27 07:00:16 +00001011def V_SETALLONES : PDI<0x76, MRMInitReg, (ops VR128:$dst),
1012 "pcmpeqd $dst, $dst",
1013 [(set VR128:$dst, (v2f64 immAllOnesV))]>;
1014
Evan Chengbc4832b2006-03-24 23:15:12 +00001015// Scalar to 128-bit vector with zero extension.
1016// Three operand (but two address) aliases.
1017let isTwoAddress = 1 in {
1018def MOVZSS128rr : SSI<0x10, MRMSrcReg, (ops VR128:$dst, VR128:$src1, FR32:$src2),
1019 "movss {$src2, $dst|$dst, $src2}", []>;
1020def MOVZSD128rr : SDI<0x10, MRMSrcReg, (ops VR128:$dst, VR128:$src1, FR64:$src2),
1021 "movsd {$src2, $dst|$dst, $src2}", []>;
1022def MOVZD128rr : PDI<0x6E, MRMSrcReg, (ops VR128:$dst, VR128:$src1, R32:$src2),
1023 "movd {$src2, $dst|$dst, $src2}", []>;
1024def MOVZQ128rr : I<0x7E, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR64:$src2),
1025 "movq {$src2, $dst|$dst, $src2}", []>;
1026}
Evan Cheng82521dd2006-03-21 07:09:35 +00001027
Evan Chengbc4832b2006-03-24 23:15:12 +00001028// Loading from memory automatically zeroing upper bits.
1029def MOVZSS128rm : SSI<0x10, MRMSrcMem, (ops VR128:$dst, f32mem:$src),
1030 "movss {$src, $dst|$dst, $src}",
Evan Cheng82521dd2006-03-21 07:09:35 +00001031 [(set VR128:$dst,
Evan Chengbc4832b2006-03-24 23:15:12 +00001032 (v4f32 (X86zexts2vec (loadf32 addr:$src))))]>;
1033def MOVZSD128rm : SDI<0x10, MRMSrcMem, (ops VR128:$dst, f64mem:$src),
1034 "movsd {$src, $dst|$dst, $src}",
1035 [(set VR128:$dst,
1036 (v2f64 (X86zexts2vec (loadf64 addr:$src))))]>;
1037def MOVZD128rm : PDI<0x6E, MRMSrcMem, (ops VR128:$dst, i32mem:$src),
1038 "movd {$src, $dst|$dst, $src}",
1039 [(set VR128:$dst,
1040 (v4i32 (X86zexts2vec (loadi32 addr:$src))))]>;
Evan Cheng48090aa2006-03-21 23:01:21 +00001041
1042//===----------------------------------------------------------------------===//
1043// Non-Instruction Patterns
1044//===----------------------------------------------------------------------===//
1045
1046// 128-bit vector undef's.
1047def : Pat<(v2f64 (undef)), (IMPLICIT_DEF_VR128)>, Requires<[HasSSE2]>;
1048def : Pat<(v16i8 (undef)), (IMPLICIT_DEF_VR128)>, Requires<[HasSSE2]>;
1049def : Pat<(v8i16 (undef)), (IMPLICIT_DEF_VR128)>, Requires<[HasSSE2]>;
1050def : Pat<(v4i32 (undef)), (IMPLICIT_DEF_VR128)>, Requires<[HasSSE2]>;
1051def : Pat<(v2i64 (undef)), (IMPLICIT_DEF_VR128)>, Requires<[HasSSE2]>;
1052
Evan Chengffea91e2006-03-26 09:53:12 +00001053// 128-bit vector all zero's.
1054def : Pat<(v16i8 immAllZerosV), (v16i8 (V_SET0_PI))>, Requires<[HasSSE2]>;
1055def : Pat<(v8i16 immAllZerosV), (v8i16 (V_SET0_PI))>, Requires<[HasSSE2]>;
1056def : Pat<(v4i32 immAllZerosV), (v4i32 (V_SET0_PI))>, Requires<[HasSSE2]>;
1057
Evan Chenga0b3afb2006-03-27 07:00:16 +00001058// 128-bit vector all one's.
1059def : Pat<(v16i8 immAllOnesV), (v16i8 (V_SETALLONES))>, Requires<[HasSSE2]>;
1060def : Pat<(v8i16 immAllOnesV), (v8i16 (V_SETALLONES))>, Requires<[HasSSE2]>;
1061def : Pat<(v4i32 immAllOnesV), (v4i32 (V_SETALLONES))>, Requires<[HasSSE2]>;
1062def : Pat<(v2i64 immAllOnesV), (v2i64 (V_SETALLONES))>, Requires<[HasSSE2]>;
1063def : Pat<(v4f32 immAllOnesV), (v4f32 (V_SETALLONES))>, Requires<[HasSSE1]>;
1064
Evan Chenga971f6f2006-03-23 01:57:24 +00001065// Load 128-bit integer vector values.
Evan Cheng24dc1f52006-03-23 07:44:07 +00001066def : Pat<(v16i8 (load addr:$src)), (MOVDQArm addr:$src)>,
Evan Chengffea91e2006-03-26 09:53:12 +00001067 Requires<[HasSSE2]>;
Evan Cheng24dc1f52006-03-23 07:44:07 +00001068def : Pat<(v8i16 (load addr:$src)), (MOVDQArm addr:$src)>,
Evan Chengffea91e2006-03-26 09:53:12 +00001069 Requires<[HasSSE2]>;
Evan Cheng24dc1f52006-03-23 07:44:07 +00001070def : Pat<(v4i32 (load addr:$src)), (MOVDQArm addr:$src)>,
Evan Chengffea91e2006-03-26 09:53:12 +00001071 Requires<[HasSSE2]>;
Evan Cheng24dc1f52006-03-23 07:44:07 +00001072def : Pat<(v2i64 (load addr:$src)), (MOVDQArm addr:$src)>,
Evan Chengffea91e2006-03-26 09:53:12 +00001073 Requires<[HasSSE2]>;
Evan Chenga971f6f2006-03-23 01:57:24 +00001074
Evan Cheng48090aa2006-03-21 23:01:21 +00001075// Store 128-bit integer vector values.
Evan Cheng24dc1f52006-03-23 07:44:07 +00001076def : Pat<(store (v16i8 VR128:$src), addr:$dst),
Evan Chengffea91e2006-03-26 09:53:12 +00001077 (MOVDQAmr addr:$dst, VR128:$src)>, Requires<[HasSSE2]>;
Evan Cheng24dc1f52006-03-23 07:44:07 +00001078def : Pat<(store (v8i16 VR128:$src), addr:$dst),
Evan Chengffea91e2006-03-26 09:53:12 +00001079 (MOVDQAmr addr:$dst, VR128:$src)>, Requires<[HasSSE2]>;
Evan Cheng24dc1f52006-03-23 07:44:07 +00001080def : Pat<(store (v4i32 VR128:$src), addr:$dst),
Evan Chengffea91e2006-03-26 09:53:12 +00001081 (MOVDQAmr addr:$dst, VR128:$src)>, Requires<[HasSSE2]>;
Evan Cheng24dc1f52006-03-23 07:44:07 +00001082def : Pat<(store (v2i64 VR128:$src), addr:$dst),
1083 (MOVDQAmr addr:$dst, VR128:$src)>, Requires<[HasSSE2]>;
Evan Cheng48090aa2006-03-21 23:01:21 +00001084
1085// Scalar to v8i16 / v16i8. The source may be a R32, but only the lower 8 or
1086// 16-bits matter.
1087def : Pat<(v8i16 (X86s2vec R32:$src)), (MOVD128rr R32:$src)>,
Evan Chengffea91e2006-03-26 09:53:12 +00001088 Requires<[HasSSE2]>;
Evan Cheng48090aa2006-03-21 23:01:21 +00001089def : Pat<(v16i8 (X86s2vec R32:$src)), (MOVD128rr R32:$src)>,
Evan Chengffea91e2006-03-26 09:53:12 +00001090 Requires<[HasSSE2]>;
Evan Cheng48090aa2006-03-21 23:01:21 +00001091
Evan Cheng2c0dbd02006-03-24 02:58:06 +00001092// bit_convert
Evan Chengffea91e2006-03-26 09:53:12 +00001093def : Pat<(v4i32 (bitconvert (v4f32 VR128:$src))), (v4i32 VR128:$src)>,
1094 Requires<[HasSSE2]>;
1095def : Pat<(v4f32 (bitconvert (v4i32 VR128:$src))), (v4f32 VR128:$src)>,
1096 Requires<[HasSSE2]>;
Evan Chengb9df0ca2006-03-22 02:53:00 +00001097
Evan Chengbc4832b2006-03-24 23:15:12 +00001098// Zeroing a VR128 then do a MOVS* to the lower bits.
1099def : Pat<(v2f64 (X86zexts2vec FR64:$src)),
Evan Chengffea91e2006-03-26 09:53:12 +00001100 (MOVZSD128rr (V_SET0_PD), FR64:$src)>, Requires<[HasSSE2]>;
Evan Chengbc4832b2006-03-24 23:15:12 +00001101def : Pat<(v4f32 (X86zexts2vec FR32:$src)),
Evan Chengffea91e2006-03-26 09:53:12 +00001102 (MOVZSS128rr (V_SET0_PS), FR32:$src)>, Requires<[HasSSE2]>;
Evan Chengbc4832b2006-03-24 23:15:12 +00001103def : Pat<(v2i64 (X86zexts2vec VR64:$src)),
Evan Chengffea91e2006-03-26 09:53:12 +00001104 (MOVZQ128rr (V_SET0_PI), VR64:$src)>, Requires<[HasSSE2]>;
Evan Chengbc4832b2006-03-24 23:15:12 +00001105def : Pat<(v4i32 (X86zexts2vec R32:$src)),
Evan Chengffea91e2006-03-26 09:53:12 +00001106 (MOVZD128rr (V_SET0_PI), R32:$src)>, Requires<[HasSSE2]>;
Evan Chengbc4832b2006-03-24 23:15:12 +00001107def : Pat<(v8i16 (X86zexts2vec R16:$src)),
Evan Chengffea91e2006-03-26 09:53:12 +00001108 (MOVZD128rr (V_SET0_PI), (MOVZX32rr16 R16:$src))>, Requires<[HasSSE2]>;
Evan Chengbc4832b2006-03-24 23:15:12 +00001109def : Pat<(v16i8 (X86zexts2vec R8:$src)),
Evan Chengffea91e2006-03-26 09:53:12 +00001110 (MOVZD128rr (V_SET0_PI), (MOVZX32rr8 R8:$src))>, Requires<[HasSSE2]>;
Evan Chengbc4832b2006-03-24 23:15:12 +00001111
Evan Chengb9df0ca2006-03-22 02:53:00 +00001112// Splat v4f32 / v4i32
Evan Cheng63d33002006-03-22 08:01:21 +00001113def : Pat<(vector_shuffle (v4f32 VR128:$src), (undef), SHUFP_splat_mask:$sm),
Evan Cheng1bffadd2006-03-22 19:16:21 +00001114 (v4f32 (SHUFPSrr VR128:$src, VR128:$src, SHUFP_splat_mask:$sm))>,
Evan Chengffea91e2006-03-26 09:53:12 +00001115 Requires<[HasSSE1]>;
Evan Cheng63d33002006-03-22 08:01:21 +00001116def : Pat<(vector_shuffle (v4i32 VR128:$src), (undef), SHUFP_splat_mask:$sm),
Evan Cheng1bffadd2006-03-22 19:16:21 +00001117 (v4i32 (SHUFPSrr VR128:$src, VR128:$src, SHUFP_splat_mask:$sm))>,
Evan Chengffea91e2006-03-26 09:53:12 +00001118 Requires<[HasSSE2]>;
Evan Chengb9df0ca2006-03-22 02:53:00 +00001119
1120// Splat v2f64 / v2i64
Evan Cheng1bffadd2006-03-22 19:16:21 +00001121def : Pat<(vector_shuffle (v2f64 VR128:$src), (undef), MOVLHPS_splat_mask:$sm),
Evan Chengffea91e2006-03-26 09:53:12 +00001122 (v2f64 (MOVLHPSrr VR128:$src, VR128:$src))>, Requires<[HasSSE2]>;
Evan Cheng1bffadd2006-03-22 19:16:21 +00001123def : Pat<(vector_shuffle (v2i64 VR128:$src), (undef), MOVLHPS_splat_mask:$sm),
Evan Chengffea91e2006-03-26 09:53:12 +00001124 (v2i64 (MOVLHPSrr VR128:$src, VR128:$src))>, Requires<[HasSSE2]>;
Evan Cheng63d33002006-03-22 08:01:21 +00001125
Evan Cheng0188ecb2006-03-22 18:59:22 +00001126// Shuffle v4f32 / v4i32, undef. These should only match if splat cases do not.
1127def : Pat<(vector_shuffle (v4f32 VR128:$src), (undef), PSHUFD_shuffle_mask:$sm),
Evan Cheng1bffadd2006-03-22 19:16:21 +00001128 (v4f32 (PSHUFDrr VR128:$src, PSHUFD_shuffle_mask:$sm))>,
Evan Chengffea91e2006-03-26 09:53:12 +00001129 Requires<[HasSSE2]>;
Evan Cheng0188ecb2006-03-22 18:59:22 +00001130def : Pat<(vector_shuffle (v4i32 VR128:$src), (undef), PSHUFD_shuffle_mask:$sm),
Evan Cheng1bffadd2006-03-22 19:16:21 +00001131 (v4i32 (PSHUFDrr VR128:$src, PSHUFD_shuffle_mask:$sm))>,
Evan Chengffea91e2006-03-26 09:53:12 +00001132 Requires<[HasSSE2]>;
Evan Cheng3b047f72006-03-23 02:36:37 +00001133
Evan Cheng2c0dbd02006-03-24 02:58:06 +00001134// Shuffle v2f64 / v2i64
1135def : Pat<(vector_shuffle (v2f64 VR128:$src1), (v2f64 VR128:$src2),
1136 MOVLHPSorUNPCKLPD_shuffle_mask:$sm),
Evan Chengffea91e2006-03-26 09:53:12 +00001137 (v2f64 (MOVLHPSrr VR128:$src1, VR128:$src2))>, Requires<[HasSSE2]>;
Evan Cheng2c0dbd02006-03-24 02:58:06 +00001138def : Pat<(vector_shuffle (v2f64 VR128:$src1), (v2f64 VR128:$src2),
1139 MOVHLPS_shuffle_mask:$sm),
Evan Chengffea91e2006-03-26 09:53:12 +00001140 (v2f64 (MOVHLPSrr VR128:$src1, VR128:$src2))>, Requires<[HasSSE2]>;
Evan Cheng2c0dbd02006-03-24 02:58:06 +00001141def : Pat<(vector_shuffle (v2f64 VR128:$src1), (v2f64 VR128:$src2),
1142 UNPCKHPD_shuffle_mask:$sm),
1143 (v2f64 (UNPCKHPDrr VR128:$src1, VR128:$src2))>, Requires<[HasSSE2]>;
1144def : Pat<(vector_shuffle (v2f64 VR128:$src1), (loadv2f64 addr:$src2),
1145 MOVLHPSorUNPCKLPD_shuffle_mask:$sm),
1146 (v2f64 (UNPCKLPDrm VR128:$src1, addr:$src2))>, Requires<[HasSSE2]>;
1147
1148def : Pat<(vector_shuffle (v2i64 VR128:$src1), (v2i64 VR128:$src2),
1149 MOVLHPSorUNPCKLPD_shuffle_mask:$sm),
Evan Chengffea91e2006-03-26 09:53:12 +00001150 (v2i64 (MOVLHPSrr VR128:$src1, VR128:$src2))>, Requires<[HasSSE2]>;
Evan Cheng2c0dbd02006-03-24 02:58:06 +00001151def : Pat<(vector_shuffle (v2i64 VR128:$src1), (v2i64 VR128:$src2),
1152 MOVHLPS_shuffle_mask:$sm),
Evan Chengffea91e2006-03-26 09:53:12 +00001153 (v2i64 (MOVHLPSrr VR128:$src1, VR128:$src2))>, Requires<[HasSSE2]>;
Evan Cheng2c0dbd02006-03-24 02:58:06 +00001154def : Pat<(vector_shuffle (v2i64 VR128:$src1), (v2i64 VR128:$src2),
1155 UNPCKHPD_shuffle_mask:$sm),
1156 (v2i64 (UNPCKHPDrr VR128:$src1, VR128:$src2))>, Requires<[HasSSE2]>;
1157def : Pat<(vector_shuffle (v2i64 VR128:$src1), (loadv2i64 addr:$src2),
1158 MOVLHPSorUNPCKLPD_shuffle_mask:$sm),
1159 (v2i64 (UNPCKLPDrm VR128:$src1, addr:$src2))>, Requires<[HasSSE2]>;