blob: cfe47c6d32c60f074b3f084db40a32df0f5aee47 [file] [log] [blame]
Scott Michel8b6b4202007-12-04 22:35:58 +00001//==- SPUInstrInfo.td - Describe the Cell SPU Instructions -*- tablegen -*-==//
2//
3// The LLVM Compiler Infrastructure
4//
Chris Lattner081ce942007-12-29 20:36:04 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Scott Michel8b6b4202007-12-04 22:35:58 +00007//
8//===----------------------------------------------------------------------===//
9// Cell SPU Instructions:
10//===----------------------------------------------------------------------===//
11
12//===----------------------------------------------------------------------===//
13// TODO Items (not urgent today, but would be nice, low priority)
14//
15// ANDBI, ORBI: SPU constructs a 4-byte constant for these instructions by
16// concatenating the byte argument b as "bbbb". Could recognize this bit pattern
17// in 16-bit and 32-bit constants and reduce instruction count.
18//===----------------------------------------------------------------------===//
19
20//===----------------------------------------------------------------------===//
21// Pseudo instructions:
22//===----------------------------------------------------------------------===//
23
24let hasCtrlDep = 1, Defs = [R1], Uses = [R1] in {
25 def ADJCALLSTACKDOWN : Pseudo<(outs), (ins u16imm:$amt),
26 "${:comment} ADJCALLSTACKDOWN",
27 [(callseq_start imm:$amt)]>;
28 def ADJCALLSTACKUP : Pseudo<(outs), (ins u16imm:$amt),
29 "${:comment} ADJCALLSTACKUP",
30 [(callseq_end imm:$amt)]>;
31}
32
33//===----------------------------------------------------------------------===//
34// DWARF debugging Pseudo Instructions
35//===----------------------------------------------------------------------===//
36
37def DWARF_LOC : Pseudo<(outs), (ins i32imm:$line, i32imm:$col, i32imm:$file),
38 "${:comment} .loc $file, $line, $col",
39 [(dwarf_loc (i32 imm:$line), (i32 imm:$col),
40 (i32 imm:$file))]>;
41
42//===----------------------------------------------------------------------===//
43// Loads:
44// NB: The ordering is actually important, since the instruction selection
45// will try each of the instructions in sequence, i.e., the D-form first with
46// the 10-bit displacement, then the A-form with the 16 bit displacement, and
47// finally the X-form with the register-register.
48//===----------------------------------------------------------------------===//
49
Chris Lattner1a1932c2008-01-06 23:38:27 +000050let isSimpleLoad = 1 in {
Scott Michelf9f42e62008-01-29 02:16:57 +000051 class LoadDFormVec<ValueType vectype>
52 : RI10Form<0b00101100, (outs VECREG:$rT), (ins memri10:$src),
53 "lqd\t$rT, $src",
54 LoadStore,
55 [(set (vectype VECREG:$rT), (load dform_addr:$src))]>
56 { }
Scott Michel8b6b4202007-12-04 22:35:58 +000057
Scott Michelf9f42e62008-01-29 02:16:57 +000058 class LoadDForm<RegisterClass rclass>
59 : RI10Form<0b00101100, (outs rclass:$rT), (ins memri10:$src),
60 "lqd\t$rT, $src",
61 LoadStore,
62 [(set rclass:$rT, (load dform_addr:$src))]>
63 { }
Scott Michel8b6b4202007-12-04 22:35:58 +000064
Scott Michelf9f42e62008-01-29 02:16:57 +000065 multiclass LoadDForms
66 {
67 def v16i8: LoadDFormVec<v16i8>;
68 def v8i16: LoadDFormVec<v8i16>;
69 def v4i32: LoadDFormVec<v4i32>;
70 def v2i64: LoadDFormVec<v2i64>;
71 def v4f32: LoadDFormVec<v4f32>;
72 def v2f64: LoadDFormVec<v2f64>;
Scott Michel8b6b4202007-12-04 22:35:58 +000073
Scott Michelf9f42e62008-01-29 02:16:57 +000074 def r128: LoadDForm<GPRC>;
75 def r64: LoadDForm<R64C>;
76 def r32: LoadDForm<R32C>;
77 def f32: LoadDForm<R32FP>;
78 def f64: LoadDForm<R64FP>;
79 def r16: LoadDForm<R16C>;
80 def r8: LoadDForm<R8C>;
81 }
Scott Michel8b6b4202007-12-04 22:35:58 +000082
Scott Michelf9f42e62008-01-29 02:16:57 +000083 class LoadAFormVec<ValueType vectype>
84 : RI16Form<0b100001100, (outs VECREG:$rT), (ins addr256k:$src),
85 "lqa\t$rT, $src",
86 LoadStore,
87 [(set (vectype VECREG:$rT), (load aform_addr:$src))]>
88 { }
Scott Michel8b6b4202007-12-04 22:35:58 +000089
Scott Michelf9f42e62008-01-29 02:16:57 +000090 class LoadAForm<RegisterClass rclass>
91 : RI16Form<0b100001100, (outs rclass:$rT), (ins addr256k:$src),
92 "lqa\t$rT, $src",
93 LoadStore,
94 [(set rclass:$rT, (load aform_addr:$src))]>
95 { }
Scott Michel8b6b4202007-12-04 22:35:58 +000096
Scott Michelf9f42e62008-01-29 02:16:57 +000097 multiclass LoadAForms
98 {
99 def v16i8: LoadAFormVec<v16i8>;
100 def v8i16: LoadAFormVec<v8i16>;
101 def v4i32: LoadAFormVec<v4i32>;
102 def v2i64: LoadAFormVec<v2i64>;
103 def v4f32: LoadAFormVec<v4f32>;
104 def v2f64: LoadAFormVec<v2f64>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000105
Scott Michelf9f42e62008-01-29 02:16:57 +0000106 def r128: LoadAForm<GPRC>;
107 def r64: LoadAForm<R64C>;
108 def r32: LoadAForm<R32C>;
109 def f32: LoadAForm<R32FP>;
110 def f64: LoadAForm<R64FP>;
111 def r16: LoadAForm<R16C>;
112 def r8: LoadAForm<R8C>;
113 }
Scott Michel8b6b4202007-12-04 22:35:58 +0000114
Scott Michelf9f42e62008-01-29 02:16:57 +0000115 class LoadXFormVec<ValueType vectype>
116 : RRForm<0b00100011100, (outs VECREG:$rT), (ins memrr:$src),
117 "lqx\t$rT, $src",
118 LoadStore,
119 [(set (vectype VECREG:$rT), (load xform_addr:$src))]>
120 { }
Scott Michel8b6b4202007-12-04 22:35:58 +0000121
Scott Michelf9f42e62008-01-29 02:16:57 +0000122 class LoadXForm<RegisterClass rclass>
123 : RRForm<0b00100011100, (outs rclass:$rT), (ins memrr:$src),
124 "lqx\t$rT, $src",
125 LoadStore,
126 [(set rclass:$rT, (load xform_addr:$src))]>
127 { }
Scott Michel8b6b4202007-12-04 22:35:58 +0000128
Scott Michelf9f42e62008-01-29 02:16:57 +0000129 multiclass LoadXForms
130 {
131 def v16i8: LoadXFormVec<v16i8>;
132 def v8i16: LoadXFormVec<v8i16>;
133 def v4i32: LoadXFormVec<v4i32>;
134 def v2i64: LoadXFormVec<v2i64>;
135 def v4f32: LoadXFormVec<v4f32>;
136 def v2f64: LoadXFormVec<v2f64>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000137
Scott Michelf9f42e62008-01-29 02:16:57 +0000138 def r128: LoadXForm<GPRC>;
139 def r64: LoadXForm<R64C>;
140 def r32: LoadXForm<R32C>;
141 def f32: LoadXForm<R32FP>;
142 def f64: LoadXForm<R64FP>;
143 def r16: LoadXForm<R16C>;
144 def r8: LoadXForm<R8C>;
145 }
Scott Michel8b6b4202007-12-04 22:35:58 +0000146
Scott Michelf9f42e62008-01-29 02:16:57 +0000147 defm LQA : LoadAForms;
148 defm LQD : LoadDForms;
149 defm LQX : LoadXForms;
Scott Michel438be252007-12-17 22:32:34 +0000150
Scott Michel8b6b4202007-12-04 22:35:58 +0000151/* Load quadword, PC relative: Not much use at this point in time.
Scott Michelf9f42e62008-01-29 02:16:57 +0000152 Might be of use later for relocatable code. It's effectively the
153 same as LQA, but uses PC-relative addressing.
Scott Michel8b6b4202007-12-04 22:35:58 +0000154 def LQR : RI16Form<0b111001100, (outs VECREG:$rT), (ins s16imm:$disp),
155 "lqr\t$rT, $disp", LoadStore,
156 [(set VECREG:$rT, (load iaddr:$disp))]>;
157 */
Scott Michel8b6b4202007-12-04 22:35:58 +0000158}
159
160//===----------------------------------------------------------------------===//
161// Stores:
162//===----------------------------------------------------------------------===//
Scott Michelf9f42e62008-01-29 02:16:57 +0000163class StoreDFormVec<ValueType vectype>
164 : RI10Form<0b00100100, (outs), (ins VECREG:$rT, memri10:$src),
165 "stqd\t$rT, $src",
166 LoadStore,
167 [(store (vectype VECREG:$rT), dform_addr:$src)]>
168{ }
Scott Michel8b6b4202007-12-04 22:35:58 +0000169
Scott Michelf9f42e62008-01-29 02:16:57 +0000170class StoreDForm<RegisterClass rclass>
171 : RI10Form<0b00100100, (outs), (ins rclass:$rT, memri10:$src),
172 "stqd\t$rT, $src",
173 LoadStore,
174 [(store rclass:$rT, dform_addr:$src)]>
175{ }
Scott Michel8b6b4202007-12-04 22:35:58 +0000176
Scott Michelf9f42e62008-01-29 02:16:57 +0000177multiclass StoreDForms
178{
179 def v16i8: StoreDFormVec<v16i8>;
180 def v8i16: StoreDFormVec<v8i16>;
181 def v4i32: StoreDFormVec<v4i32>;
182 def v2i64: StoreDFormVec<v2i64>;
183 def v4f32: StoreDFormVec<v4f32>;
184 def v2f64: StoreDFormVec<v2f64>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000185
Scott Michelf9f42e62008-01-29 02:16:57 +0000186 def r128: StoreDForm<GPRC>;
187 def r64: StoreDForm<R64C>;
188 def r32: StoreDForm<R32C>;
189 def f32: StoreDForm<R32FP>;
190 def f64: StoreDForm<R64FP>;
191 def r16: StoreDForm<R16C>;
192 def r8: StoreDForm<R8C>;
193}
Scott Michel8b6b4202007-12-04 22:35:58 +0000194
Scott Michelf9f42e62008-01-29 02:16:57 +0000195class StoreAFormVec<ValueType vectype>
196 : RI16Form<0b0010010, (outs), (ins VECREG:$rT, addr256k:$src),
Scott Michel5a6f17b2008-01-30 02:55:46 +0000197 "stqa\t$rT, $src",
198 LoadStore,
199 [(store (vectype VECREG:$rT), aform_addr:$src)]>
Scott Michelf9f42e62008-01-29 02:16:57 +0000200{ }
Scott Michel8b6b4202007-12-04 22:35:58 +0000201
Scott Michelf9f42e62008-01-29 02:16:57 +0000202class StoreAForm<RegisterClass rclass>
203 : RI16Form<0b001001, (outs), (ins rclass:$rT, addr256k:$src),
Scott Michel5a6f17b2008-01-30 02:55:46 +0000204 "stqa\t$rT, $src",
205 LoadStore,
206 [(store rclass:$rT, aform_addr:$src)]>
Scott Michelf9f42e62008-01-29 02:16:57 +0000207{ }
Scott Michel8b6b4202007-12-04 22:35:58 +0000208
Scott Michelf9f42e62008-01-29 02:16:57 +0000209multiclass StoreAForms
210{
211 def v16i8: StoreAFormVec<v16i8>;
212 def v8i16: StoreAFormVec<v8i16>;
213 def v4i32: StoreAFormVec<v4i32>;
214 def v2i64: StoreAFormVec<v2i64>;
215 def v4f32: StoreAFormVec<v4f32>;
216 def v2f64: StoreAFormVec<v2f64>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000217
Scott Michelf9f42e62008-01-29 02:16:57 +0000218 def r128: StoreAForm<GPRC>;
219 def r64: StoreAForm<R64C>;
220 def r32: StoreAForm<R32C>;
221 def f32: StoreAForm<R32FP>;
222 def f64: StoreAForm<R64FP>;
223 def r16: StoreAForm<R16C>;
224 def r8: StoreAForm<R8C>;
225}
Scott Michel8b6b4202007-12-04 22:35:58 +0000226
Scott Michelf9f42e62008-01-29 02:16:57 +0000227class StoreXFormVec<ValueType vectype>
228 : RRForm<0b00100100, (outs), (ins VECREG:$rT, memrr:$src),
Scott Michel5a6f17b2008-01-30 02:55:46 +0000229 "stqx\t$rT, $src",
230 LoadStore,
231 [(store (vectype VECREG:$rT), xform_addr:$src)]>
Scott Michelf9f42e62008-01-29 02:16:57 +0000232{ }
Scott Michel8b6b4202007-12-04 22:35:58 +0000233
Scott Michelf9f42e62008-01-29 02:16:57 +0000234class StoreXForm<RegisterClass rclass>
235 : RRForm<0b00100100, (outs), (ins rclass:$rT, memrr:$src),
Scott Michel5a6f17b2008-01-30 02:55:46 +0000236 "stqx\t$rT, $src",
237 LoadStore,
238 [(store rclass:$rT, xform_addr:$src)]>
Scott Michelf9f42e62008-01-29 02:16:57 +0000239{ }
Scott Michel8b6b4202007-12-04 22:35:58 +0000240
Scott Michelf9f42e62008-01-29 02:16:57 +0000241multiclass StoreXForms
242{
243 def v16i8: StoreXFormVec<v16i8>;
244 def v8i16: StoreXFormVec<v8i16>;
245 def v4i32: StoreXFormVec<v4i32>;
246 def v2i64: StoreXFormVec<v2i64>;
247 def v4f32: StoreXFormVec<v4f32>;
248 def v2f64: StoreXFormVec<v2f64>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000249
Scott Michelf9f42e62008-01-29 02:16:57 +0000250 def r128: StoreXForm<GPRC>;
251 def r64: StoreXForm<R64C>;
252 def r32: StoreXForm<R32C>;
253 def f32: StoreXForm<R32FP>;
254 def f64: StoreXForm<R64FP>;
255 def r16: StoreXForm<R16C>;
256 def r8: StoreXForm<R8C>;
257}
Scott Michel8b6b4202007-12-04 22:35:58 +0000258
Scott Michelf9f42e62008-01-29 02:16:57 +0000259defm STQD : StoreDForms;
260defm STQA : StoreAForms;
261defm STQX : StoreXForms;
Scott Michel8b6b4202007-12-04 22:35:58 +0000262
263/* Store quadword, PC relative: Not much use at this point in time. Might
Scott Michelf9f42e62008-01-29 02:16:57 +0000264 be useful for relocatable code.
Chris Lattneref8d6082008-01-06 06:44:58 +0000265def STQR : RI16Form<0b111000100, (outs), (ins VECREG:$rT, s16imm:$disp),
266 "stqr\t$rT, $disp", LoadStore,
267 [(store VECREG:$rT, iaddr:$disp)]>;
268*/
Scott Michel8b6b4202007-12-04 22:35:58 +0000269
270//===----------------------------------------------------------------------===//
271// Generate Controls for Insertion:
272//===----------------------------------------------------------------------===//
273
274def CBD :
275 RI7Form<0b10101111100, (outs VECREG:$rT), (ins memri7:$src),
276 "cbd\t$rT, $src", ShuffleOp,
277 [(set (v16i8 VECREG:$rT), (SPUvecinsmask dform2_addr:$src))]>;
278
279def CBX : RRForm<0b00101011100, (outs VECREG:$rT), (ins memrr:$src),
280 "cbx\t$rT, $src", ShuffleOp,
281 [(set (v16i8 VECREG:$rT), (SPUvecinsmask xform_addr:$src))]>;
282
283def CHD : RI7Form<0b10101111100, (outs VECREG:$rT), (ins memri7:$src),
284 "chd\t$rT, $src", ShuffleOp,
285 [(set (v8i16 VECREG:$rT), (SPUvecinsmask dform2_addr:$src))]>;
286
287def CHX : RRForm<0b10101011100, (outs VECREG:$rT), (ins memrr:$src),
288 "chx\t$rT, $src", ShuffleOp,
289 [(set (v8i16 VECREG:$rT), (SPUvecinsmask xform_addr:$src))]>;
290
291def CWD : RI7Form<0b01101111100, (outs VECREG:$rT), (ins memri7:$src),
292 "cwd\t$rT, $src", ShuffleOp,
293 [(set (v4i32 VECREG:$rT), (SPUvecinsmask dform2_addr:$src))]>;
294
295def CWX : RRForm<0b01101011100, (outs VECREG:$rT), (ins memrr:$src),
296 "cwx\t$rT, $src", ShuffleOp,
297 [(set (v4i32 VECREG:$rT), (SPUvecinsmask xform_addr:$src))]>;
298
299def CDD : RI7Form<0b11101111100, (outs VECREG:$rT), (ins memri7:$src),
300 "cdd\t$rT, $src", ShuffleOp,
301 [(set (v2i64 VECREG:$rT), (SPUvecinsmask dform2_addr:$src))]>;
302
303def CDX : RRForm<0b11101011100, (outs VECREG:$rT), (ins memrr:$src),
304 "cdx\t$rT, $src", ShuffleOp,
305 [(set (v2i64 VECREG:$rT), (SPUvecinsmask xform_addr:$src))]>;
306
307//===----------------------------------------------------------------------===//
308// Constant formation:
309//===----------------------------------------------------------------------===//
310
311def ILHv8i16:
312 RI16Form<0b110000010, (outs VECREG:$rT), (ins s16imm:$val),
313 "ilh\t$rT, $val", ImmLoad,
314 [(set (v8i16 VECREG:$rT), (v8i16 v8i16SExt16Imm:$val))]>;
315
316def ILHr16:
317 RI16Form<0b110000010, (outs R16C:$rT), (ins s16imm:$val),
318 "ilh\t$rT, $val", ImmLoad,
319 [(set R16C:$rT, immSExt16:$val)]>;
320
Scott Michel438be252007-12-17 22:32:34 +0000321// Cell SPU doesn't have a native 8-bit immediate load, but ILH works ("with
322// the right constant")
323def ILHr8:
324 RI16Form<0b110000010, (outs R8C:$rT), (ins s16imm_i8:$val),
325 "ilh\t$rT, $val", ImmLoad,
326 [(set R8C:$rT, immSExt8:$val)]>;
327
Scott Michel8b6b4202007-12-04 22:35:58 +0000328// IL does sign extension!
329def ILr64:
330 RI16Form<0b100000010, (outs R64C:$rT), (ins s16imm_i64:$val),
331 "il\t$rT, $val", ImmLoad,
332 [(set R64C:$rT, immSExt16:$val)]>;
333
334def ILv2i64:
335 RI16Form<0b100000010, (outs VECREG:$rT), (ins s16imm_i64:$val),
336 "il\t$rT, $val", ImmLoad,
337 [(set VECREG:$rT, (v2i64 v2i64SExt16Imm:$val))]>;
338
339def ILv4i32:
340 RI16Form<0b100000010, (outs VECREG:$rT), (ins s16imm:$val),
341 "il\t$rT, $val", ImmLoad,
342 [(set VECREG:$rT, (v4i32 v4i32SExt16Imm:$val))]>;
343
344def ILr32:
345 RI16Form<0b100000010, (outs R32C:$rT), (ins s16imm_i32:$val),
346 "il\t$rT, $val", ImmLoad,
347 [(set R32C:$rT, immSExt16:$val)]>;
348
349def ILf32:
350 RI16Form<0b100000010, (outs R32FP:$rT), (ins s16imm_f32:$val),
351 "il\t$rT, $val", ImmLoad,
Nate Begeman78125042008-02-14 18:43:04 +0000352 [(set R32FP:$rT, fpimmSExt16:$val)]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000353
354def ILf64:
355 RI16Form<0b100000010, (outs R64FP:$rT), (ins s16imm_f64:$val),
356 "il\t$rT, $val", ImmLoad,
Nate Begeman78125042008-02-14 18:43:04 +0000357 [(set R64FP:$rT, fpimmSExt16:$val)]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000358
359def ILHUv4i32:
360 RI16Form<0b010000010, (outs VECREG:$rT), (ins u16imm:$val),
361 "ilhu\t$rT, $val", ImmLoad,
362 [(set VECREG:$rT, (v4i32 immILHUvec:$val))]>;
363
364def ILHUr32:
365 RI16Form<0b010000010, (outs R32C:$rT), (ins u16imm:$val),
366 "ilhu\t$rT, $val", ImmLoad,
367 [(set R32C:$rT, hi16:$val)]>;
368
369// ILHUf32: Used to custom lower float constant loads
370def ILHUf32:
371 RI16Form<0b010000010, (outs R32FP:$rT), (ins f16imm:$val),
372 "ilhu\t$rT, $val", ImmLoad,
Nate Begeman78125042008-02-14 18:43:04 +0000373 [(set R32FP:$rT, hi16_f32:$val)]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000374
375// ILHUhi: Used for loading high portion of an address. Note the symbolHi
376// printer used for the operand.
Scott Michel97872d32008-02-23 18:41:37 +0000377def ILHUhi:
378 RI16Form<0b010000010, (outs R32C:$rT), (ins symbolHi:$val),
Scott Michel8b6b4202007-12-04 22:35:58 +0000379 "ilhu\t$rT, $val", ImmLoad,
380 [(set R32C:$rT, hi16:$val)]>;
381
382// Immediate load address (can also be used to load 18-bit unsigned constants,
383// see the zext 16->32 pattern)
Scott Michel97872d32008-02-23 18:41:37 +0000384class ILAInst<dag OOL, dag IOL, list<dag> pattern>:
385 RI18Form<0b1000010, OOL, IOL, "ila\t$rT, $val",
386 LoadNOP, pattern>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000387
Scott Michel97872d32008-02-23 18:41:37 +0000388multiclass ImmLoadAddress
389{
390 def v2i64: ILAInst<(outs VECREG:$rT), (ins u18imm:$val),
391 [(set (v2i64 VECREG:$rT), v2i64Uns18Imm:$val)]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000392
Scott Michel97872d32008-02-23 18:41:37 +0000393 def v4i32: ILAInst<(outs VECREG:$rT), (ins u18imm:$val),
394 [(set (v4i32 VECREG:$rT), v4i32Uns18Imm:$val)]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000395
Scott Michel97872d32008-02-23 18:41:37 +0000396 def r64: ILAInst<(outs R64C:$rT), (ins u18imm_i64:$val),
397 [(set R64C:$rT, imm18:$val)]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000398
Scott Michel97872d32008-02-23 18:41:37 +0000399 def r32: ILAInst<(outs R32C:$rT), (ins u18imm:$val),
400 [(set R32C:$rT, imm18:$val)]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000401
Scott Michel97872d32008-02-23 18:41:37 +0000402 def f32: ILAInst<(outs R32FP:$rT), (ins f18imm:$val),
403 [(set R32FP:$rT, fpimm18:$val)]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000404
Scott Michel97872d32008-02-23 18:41:37 +0000405 def f64: ILAInst<(outs R64FP:$rT), (ins f18imm_f64:$val),
406 [(set R64FP:$rT, fpimm18:$val)]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000407
Scott Michel97872d32008-02-23 18:41:37 +0000408 def lo: ILAInst<(outs R32C:$rT), (ins symbolLo:$val),
409 [(set R32C:$rT, imm18:$val)]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000410
Scott Michel97872d32008-02-23 18:41:37 +0000411 def lsa: ILAInst<(outs R32C:$rT), (ins symbolLSA:$val),
412 [/* no pattern */]>;
413}
414
415defm ILA : ImmLoadAddress;
Scott Michel8b6b4202007-12-04 22:35:58 +0000416
417// Immediate OR, Halfword Lower: The "other" part of loading large constants
418// into 32-bit registers. See the anonymous pattern Pat<(i32 imm:$imm), ...>
419// Note that these are really two operand instructions, but they're encoded
420// as three operands with the first two arguments tied-to each other.
421
422def IOHLvec:
423 RI16Form<0b100000110, (outs VECREG:$rT), (ins VECREG:$rS, u16imm:$val),
424 "iohl\t$rT, $val", ImmLoad,
425 [/* insert intrinsic here */]>,
426 RegConstraint<"$rS = $rT">,
427 NoEncode<"$rS">;
428
429def IOHLr32:
430 RI16Form<0b100000110, (outs R32C:$rT), (ins R32C:$rS, i32imm:$val),
431 "iohl\t$rT, $val", ImmLoad,
432 [/* insert intrinsic here */]>,
433 RegConstraint<"$rS = $rT">,
434 NoEncode<"$rS">;
435
436def IOHLf32:
437 RI16Form<0b100000110, (outs R32FP:$rT), (ins R32FP:$rS, f32imm:$val),
438 "iohl\t$rT, $val", ImmLoad,
439 [/* insert intrinsic here */]>,
440 RegConstraint<"$rS = $rT">,
441 NoEncode<"$rS">;
442
Scott Micheldbac4cf2008-01-11 02:53:15 +0000443def IOHLlo:
444 RI16Form<0b100000110, (outs R32C:$rT), (ins R32C:$rS, symbolLo:$val),
445 "iohl\t$rT, $val", ImmLoad,
446 [/* no pattern */]>,
447 RegConstraint<"$rS = $rT">,
448 NoEncode<"$rS">;
449
Scott Michel8b6b4202007-12-04 22:35:58 +0000450// Form select mask for bytes using immediate, used in conjunction with the
451// SELB instruction:
452
Scott Michelf9f42e62008-01-29 02:16:57 +0000453class FSMBIVec<ValueType vectype>
454 : RI16Form<0b101001100, (outs VECREG:$rT), (ins u16imm:$val),
Scott Michel5a6f17b2008-01-30 02:55:46 +0000455 "fsmbi\t$rT, $val",
456 SelectOp,
457 [(set (vectype VECREG:$rT), (SPUfsmbi immU16:$val))]>
Scott Michelf9f42e62008-01-29 02:16:57 +0000458{ }
Scott Michel8b6b4202007-12-04 22:35:58 +0000459
Scott Michel97872d32008-02-23 18:41:37 +0000460multiclass FormSelectMaskBytesImm
Scott Michelf9f42e62008-01-29 02:16:57 +0000461{
462 def v16i8: FSMBIVec<v16i8>;
463 def v8i16: FSMBIVec<v8i16>;
464 def v4i32: FSMBIVec<v4i32>;
465 def v2i64: FSMBIVec<v2i64>;
466}
Scott Michel8b6b4202007-12-04 22:35:58 +0000467
Scott Michel97872d32008-02-23 18:41:37 +0000468defm FSMBI : FormSelectMaskBytesImm;
469
470// fsmb: Form select mask for bytes. N.B. Input operand, $rA, is 16-bits
471def FSMB:
472 RRForm_1<0b01101101100, (outs VECREG:$rT), (ins R16C:$rA),
473 "fsmb\t$rT, $rA", SelectOp,
474 []>;
475
476// fsmh: Form select mask for halfwords. N.B., Input operand, $rA, is
477// only 8-bits wide (even though it's input as 16-bits here)
478def FSMH:
479 RRForm_1<0b10101101100, (outs VECREG:$rT), (ins R16C:$rA),
480 "fsmh\t$rT, $rA", SelectOp,
481 []>;
482
483// fsm: Form select mask for words. Like the other fsm* instructions,
484// only the lower 4 bits of $rA are significant.
485def FSM:
486 RRForm_1<0b00101101100, (outs VECREG:$rT), (ins R16C:$rA),
487 "fsm\t$rT, $rA", SelectOp,
488 []>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000489
490//===----------------------------------------------------------------------===//
491// Integer and Logical Operations:
492//===----------------------------------------------------------------------===//
493
494def AHv8i16:
495 RRForm<0b00010011000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
496 "ah\t$rT, $rA, $rB", IntegerOp,
497 [(set (v8i16 VECREG:$rT), (int_spu_si_ah VECREG:$rA, VECREG:$rB))]>;
498
499def : Pat<(add (v8i16 VECREG:$rA), (v8i16 VECREG:$rB)),
500 (AHv8i16 VECREG:$rA, VECREG:$rB)>;
501
Scott Michel8b6b4202007-12-04 22:35:58 +0000502def AHr16:
503 RRForm<0b00010011000, (outs R16C:$rT), (ins R16C:$rA, R16C:$rB),
504 "ah\t$rT, $rA, $rB", IntegerOp,
505 [(set R16C:$rT, (add R16C:$rA, R16C:$rB))]>;
506
507def AHIvec:
508 RI10Form<0b10111000, (outs VECREG:$rT), (ins VECREG:$rA, s10imm:$val),
509 "ahi\t$rT, $rA, $val", IntegerOp,
510 [(set (v8i16 VECREG:$rT), (add (v8i16 VECREG:$rA),
511 v8i16SExt10Imm:$val))]>;
512
Scott Michel97872d32008-02-23 18:41:37 +0000513def AHIr16:
514 RI10Form<0b10111000, (outs R16C:$rT), (ins R16C:$rA, s10imm:$val),
515 "ahi\t$rT, $rA, $val", IntegerOp,
516 [(set R16C:$rT, (add R16C:$rA, v8i16SExt10Imm:$val))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000517
Scott Michel97872d32008-02-23 18:41:37 +0000518def Avec:
519 RRForm<0b00000011000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
520 "a\t$rT, $rA, $rB", IntegerOp,
521 [(set (v4i32 VECREG:$rT), (add (v4i32 VECREG:$rA), (v4i32 VECREG:$rB)))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000522
523def : Pat<(add (v16i8 VECREG:$rA), (v16i8 VECREG:$rB)),
524 (Avec VECREG:$rA, VECREG:$rB)>;
525
Scott Michel97872d32008-02-23 18:41:37 +0000526def Ar32:
527 RRForm<0b00000011000, (outs R32C:$rT), (ins R32C:$rA, R32C:$rB),
528 "a\t$rT, $rA, $rB", IntegerOp,
529 [(set R32C:$rT, (add R32C:$rA, R32C:$rB))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000530
Scott Michel438be252007-12-17 22:32:34 +0000531def Ar8:
532 RRForm<0b00000011000, (outs R8C:$rT), (ins R8C:$rA, R8C:$rB),
533 "a\t$rT, $rA, $rB", IntegerOp,
534 [(set R8C:$rT, (add R8C:$rA, R8C:$rB))]>;
535
Scott Michel8b6b4202007-12-04 22:35:58 +0000536def AIvec:
537 RI10Form<0b00111000, (outs VECREG:$rT), (ins VECREG:$rA, s10imm:$val),
538 "ai\t$rT, $rA, $val", IntegerOp,
539 [(set (v4i32 VECREG:$rT), (add (v4i32 VECREG:$rA),
540 v4i32SExt10Imm:$val))]>;
541
Scott Michel438be252007-12-17 22:32:34 +0000542def AIr32:
543 RI10Form<0b00111000, (outs R32C:$rT), (ins R32C:$rA, s10imm_i32:$val),
544 "ai\t$rT, $rA, $val", IntegerOp,
545 [(set R32C:$rT, (add R32C:$rA, i32ImmSExt10:$val))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000546
Scott Michel438be252007-12-17 22:32:34 +0000547def SFHvec:
548 RRForm<0b00010010000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
549 "sfh\t$rT, $rA, $rB", IntegerOp,
550 [(set (v8i16 VECREG:$rT), (sub (v8i16 VECREG:$rA),
551 (v8i16 VECREG:$rB)))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000552
Scott Michel438be252007-12-17 22:32:34 +0000553def SFHr16:
554 RRForm<0b00010010000, (outs R16C:$rT), (ins R16C:$rA, R16C:$rB),
555 "sfh\t$rT, $rA, $rB", IntegerOp,
556 [(set R16C:$rT, (sub R16C:$rA, R16C:$rB))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000557
558def SFHIvec:
559 RI10Form<0b10110000, (outs VECREG:$rT), (ins VECREG:$rA, s10imm:$val),
560 "sfhi\t$rT, $rA, $val", IntegerOp,
561 [(set (v8i16 VECREG:$rT), (sub v8i16SExt10Imm:$val,
562 (v8i16 VECREG:$rA)))]>;
563
564def SFHIr16 : RI10Form<0b10110000, (outs R16C:$rT), (ins R16C:$rA, s10imm:$val),
565 "sfhi\t$rT, $rA, $val", IntegerOp,
566 [(set R16C:$rT, (sub i16ImmSExt10:$val, R16C:$rA))]>;
567
568def SFvec : RRForm<0b00000010000, (outs VECREG:$rT),
569 (ins VECREG:$rA, VECREG:$rB),
570 "sf\t$rT, $rA, $rB", IntegerOp,
571 [(set (v4i32 VECREG:$rT), (sub (v4i32 VECREG:$rA), (v4i32 VECREG:$rB)))]>;
572
573def SFr32 : RRForm<0b00000010000, (outs R32C:$rT), (ins R32C:$rA, R32C:$rB),
574 "sf\t$rT, $rA, $rB", IntegerOp,
575 [(set R32C:$rT, (sub R32C:$rA, R32C:$rB))]>;
576
577def SFIvec:
578 RI10Form<0b00110000, (outs VECREG:$rT), (ins VECREG:$rA, s10imm:$val),
579 "sfi\t$rT, $rA, $val", IntegerOp,
580 [(set (v4i32 VECREG:$rT), (sub v4i32SExt10Imm:$val,
581 (v4i32 VECREG:$rA)))]>;
582
583def SFIr32 : RI10Form<0b00110000, (outs R32C:$rT),
584 (ins R32C:$rA, s10imm_i32:$val),
585 "sfi\t$rT, $rA, $val", IntegerOp,
586 [(set R32C:$rT, (sub i32ImmSExt10:$val, R32C:$rA))]>;
587
588// ADDX: only available in vector form, doesn't match a pattern.
589def ADDXvec:
590 RRForm<0b00000010110, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB,
591 VECREG:$rCarry),
592 "addx\t$rT, $rA, $rB", IntegerOp,
593 []>,
594 RegConstraint<"$rCarry = $rT">,
595 NoEncode<"$rCarry">;
596
597// CG: only available in vector form, doesn't match a pattern.
598def CGvec:
599 RRForm<0b01000011000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB,
600 VECREG:$rCarry),
601 "cg\t$rT, $rA, $rB", IntegerOp,
602 []>,
603 RegConstraint<"$rCarry = $rT">,
604 NoEncode<"$rCarry">;
605
606// SFX: only available in vector form, doesn't match a pattern
607def SFXvec:
608 RRForm<0b10000010110, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB,
609 VECREG:$rCarry),
610 "sfx\t$rT, $rA, $rB", IntegerOp,
611 []>,
612 RegConstraint<"$rCarry = $rT">,
613 NoEncode<"$rCarry">;
614
615// BG: only available in vector form, doesn't match a pattern.
616def BGvec:
617 RRForm<0b01000010000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB,
618 VECREG:$rCarry),
619 "bg\t$rT, $rA, $rB", IntegerOp,
620 []>,
621 RegConstraint<"$rCarry = $rT">,
622 NoEncode<"$rCarry">;
623
624// BGX: only available in vector form, doesn't match a pattern.
625def BGXvec:
626 RRForm<0b11000010110, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB,
627 VECREG:$rCarry),
628 "bgx\t$rT, $rA, $rB", IntegerOp,
629 []>,
630 RegConstraint<"$rCarry = $rT">,
631 NoEncode<"$rCarry">;
632
633// Halfword multiply variants:
634// N.B: These can be used to build up larger quantities (16x16 -> 32)
635
636def MPYv8i16:
637 RRForm<0b00100011110, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
638 "mpy\t$rT, $rA, $rB", IntegerMulDiv,
639 [(set (v8i16 VECREG:$rT), (SPUmpy_v8i16 (v8i16 VECREG:$rA),
640 (v8i16 VECREG:$rB)))]>;
641
642def MPYr16:
643 RRForm<0b00100011110, (outs R16C:$rT), (ins R16C:$rA, R16C:$rB),
644 "mpy\t$rT, $rA, $rB", IntegerMulDiv,
645 [(set R16C:$rT, (mul R16C:$rA, R16C:$rB))]>;
646
647def MPYUv4i32:
648 RRForm<0b00110011110, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
649 "mpyu\t$rT, $rA, $rB", IntegerMulDiv,
650 [(set (v4i32 VECREG:$rT),
651 (SPUmpyu_v4i32 (v4i32 VECREG:$rA), (v4i32 VECREG:$rB)))]>;
652
653def MPYUr16:
654 RRForm<0b00110011110, (outs R32C:$rT), (ins R16C:$rA, R16C:$rB),
655 "mpyu\t$rT, $rA, $rB", IntegerMulDiv,
656 [(set R32C:$rT, (mul (zext R16C:$rA),
657 (zext R16C:$rB)))]>;
658
659def MPYUr32:
660 RRForm<0b00110011110, (outs R32C:$rT), (ins R32C:$rA, R32C:$rB),
661 "mpyu\t$rT, $rA, $rB", IntegerMulDiv,
662 [(set R32C:$rT, (SPUmpyu_i32 R32C:$rA, R32C:$rB))]>;
663
664// mpyi: multiply 16 x s10imm -> 32 result (custom lowering for 32 bit result,
665// this only produces the lower 16 bits)
666def MPYIvec:
667 RI10Form<0b00101110, (outs VECREG:$rT), (ins VECREG:$rA, s10imm:$val),
668 "mpyi\t$rT, $rA, $val", IntegerMulDiv,
669 [(set (v8i16 VECREG:$rT), (mul (v8i16 VECREG:$rA), v8i16SExt10Imm:$val))]>;
670
671def MPYIr16:
672 RI10Form<0b00101110, (outs R16C:$rT), (ins R16C:$rA, s10imm:$val),
673 "mpyi\t$rT, $rA, $val", IntegerMulDiv,
674 [(set R16C:$rT, (mul R16C:$rA, i16ImmSExt10:$val))]>;
675
676// mpyui: same issues as other multiplies, plus, this doesn't match a
677// pattern... but may be used during target DAG selection or lowering
678def MPYUIvec:
679 RI10Form<0b10101110, (outs VECREG:$rT), (ins VECREG:$rA, s10imm:$val),
680 "mpyui\t$rT, $rA, $val", IntegerMulDiv,
681 []>;
682
683def MPYUIr16:
684 RI10Form<0b10101110, (outs R16C:$rT), (ins R16C:$rA, s10imm:$val),
685 "mpyui\t$rT, $rA, $val", IntegerMulDiv,
686 []>;
687
688// mpya: 16 x 16 + 16 -> 32 bit result
689def MPYAvec:
690 RRRForm<0b0011, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB, VECREG:$rC),
691 "mpya\t$rT, $rA, $rB, $rC", IntegerMulDiv,
692 [(set (v4i32 VECREG:$rT), (add (v4i32 (bitconvert (mul (v8i16 VECREG:$rA),
693 (v8i16 VECREG:$rB)))),
694 (v4i32 VECREG:$rC)))]>;
695
696def MPYAr32:
697 RRRForm<0b0011, (outs R32C:$rT), (ins R16C:$rA, R16C:$rB, R32C:$rC),
698 "mpya\t$rT, $rA, $rB, $rC", IntegerMulDiv,
699 [(set R32C:$rT, (add (sext (mul R16C:$rA, R16C:$rB)),
700 R32C:$rC))]>;
701
702def : Pat<(add (mul (sext R16C:$rA), (sext R16C:$rB)), R32C:$rC),
703 (MPYAr32 R16C:$rA, R16C:$rB, R32C:$rC)>;
704
705def MPYAr32_sextinreg:
706 RRRForm<0b0011, (outs R32C:$rT), (ins R32C:$rA, R32C:$rB, R32C:$rC),
707 "mpya\t$rT, $rA, $rB, $rC", IntegerMulDiv,
708 [(set R32C:$rT, (add (mul (sext_inreg R32C:$rA, i16),
709 (sext_inreg R32C:$rB, i16)),
710 R32C:$rC))]>;
711
712//def MPYAr32:
713// RRRForm<0b0011, (outs R32C:$rT), (ins R16C:$rA, R16C:$rB, R32C:$rC),
714// "mpya\t$rT, $rA, $rB, $rC", IntegerMulDiv,
715// [(set R32C:$rT, (add (sext (mul R16C:$rA, R16C:$rB)),
716// R32C:$rC))]>;
717
718// mpyh: multiply high, used to synthesize 32-bit multiplies
719def MPYHv4i32:
720 RRForm<0b10100011110, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
721 "mpyh\t$rT, $rA, $rB", IntegerMulDiv,
722 [(set (v4i32 VECREG:$rT),
723 (SPUmpyh_v4i32 (v4i32 VECREG:$rA), (v4i32 VECREG:$rB)))]>;
724
725def MPYHr32:
726 RRForm<0b10100011110, (outs R32C:$rT), (ins R32C:$rA, R32C:$rB),
727 "mpyh\t$rT, $rA, $rB", IntegerMulDiv,
728 [(set R32C:$rT, (SPUmpyh_i32 R32C:$rA, R32C:$rB))]>;
729
730// mpys: multiply high and shift right (returns the top half of
731// a 16-bit multiply, sign extended to 32 bits.)
732def MPYSvec:
733 RRForm<0b11100011110, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
734 "mpys\t$rT, $rA, $rB", IntegerMulDiv,
735 []>;
736
737def MPYSr16:
738 RRForm<0b11100011110, (outs R32C:$rT), (ins R16C:$rA, R16C:$rB),
739 "mpys\t$rT, $rA, $rB", IntegerMulDiv,
740 []>;
741
742// mpyhh: multiply high-high (returns the 32-bit result from multiplying
743// the top 16 bits of the $rA, $rB)
744def MPYHHv8i16:
745 RRForm<0b01100011110, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
746 "mpyhh\t$rT, $rA, $rB", IntegerMulDiv,
747 [(set (v8i16 VECREG:$rT),
748 (SPUmpyhh_v8i16 (v8i16 VECREG:$rA), (v8i16 VECREG:$rB)))]>;
749
750def MPYHHr32:
751 RRForm<0b01100011110, (outs R32C:$rT), (ins R32C:$rA, R32C:$rB),
752 "mpyhh\t$rT, $rA, $rB", IntegerMulDiv,
753 []>;
754
755// mpyhha: Multiply high-high, add to $rT:
756def MPYHHAvec:
757 RRForm<0b01100010110, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
758 "mpyhha\t$rT, $rA, $rB", IntegerMulDiv,
759 []>;
760
761def MPYHHAr32:
762 RRForm<0b01100010110, (outs R32C:$rT), (ins R32C:$rA, R32C:$rB),
763 "mpyhha\t$rT, $rA, $rB", IntegerMulDiv,
764 []>;
765
766// mpyhhu: Multiply high-high, unsigned
767def MPYHHUvec:
768 RRForm<0b01110011110, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
769 "mpyhhu\t$rT, $rA, $rB", IntegerMulDiv,
770 []>;
771
772def MPYHHUr32:
773 RRForm<0b01110011110, (outs R32C:$rT), (ins R32C:$rA, R32C:$rB),
774 "mpyhhu\t$rT, $rA, $rB", IntegerMulDiv,
775 []>;
776
777// mpyhhau: Multiply high-high, unsigned
778def MPYHHAUvec:
779 RRForm<0b01110010110, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
780 "mpyhhau\t$rT, $rA, $rB", IntegerMulDiv,
781 []>;
782
783def MPYHHAUr32:
784 RRForm<0b01110010110, (outs R32C:$rT), (ins R32C:$rA, R32C:$rB),
785 "mpyhhau\t$rT, $rA, $rB", IntegerMulDiv,
786 []>;
787
788// clz: Count leading zeroes
789def CLZv4i32:
790 RRForm_1<0b10100101010, (outs VECREG:$rT), (ins VECREG:$rA),
791 "clz\t$rT, $rA", IntegerOp,
792 [/* intrinsic */]>;
793
794def CLZr32:
795 RRForm_1<0b10100101010, (outs R32C:$rT), (ins R32C:$rA),
796 "clz\t$rT, $rA", IntegerOp,
797 [(set R32C:$rT, (ctlz R32C:$rA))]>;
798
799// cntb: Count ones in bytes (aka "population count")
800// NOTE: This instruction is really a vector instruction, but the custom
801// lowering code uses it in unorthodox ways to support CTPOP for other
802// data types!
803def CNTBv16i8:
804 RRForm_1<0b00101101010, (outs VECREG:$rT), (ins VECREG:$rA),
805 "cntb\t$rT, $rA", IntegerOp,
806 [(set (v16i8 VECREG:$rT), (SPUcntb_v16i8 (v16i8 VECREG:$rA)))]>;
807
808def CNTBv8i16 :
809 RRForm_1<0b00101101010, (outs VECREG:$rT), (ins VECREG:$rA),
810 "cntb\t$rT, $rA", IntegerOp,
811 [(set (v8i16 VECREG:$rT), (SPUcntb_v8i16 (v8i16 VECREG:$rA)))]>;
812
813def CNTBv4i32 :
814 RRForm_1<0b00101101010, (outs VECREG:$rT), (ins VECREG:$rA),
815 "cntb\t$rT, $rA", IntegerOp,
816 [(set (v4i32 VECREG:$rT), (SPUcntb_v4i32 (v4i32 VECREG:$rA)))]>;
817
Scott Michel8b6b4202007-12-04 22:35:58 +0000818// gbb: Gather all low order bits from each byte in $rA into a single 16-bit
819// quantity stored into $rT
820def GBB:
821 RRForm_1<0b01001101100, (outs R16C:$rT), (ins VECREG:$rA),
822 "gbb\t$rT, $rA", GatherOp,
823 []>;
824
825// gbh: Gather all low order bits from each halfword in $rA into a single
826// 8-bit quantity stored in $rT
827def GBH:
828 RRForm_1<0b10001101100, (outs R16C:$rT), (ins VECREG:$rA),
829 "gbh\t$rT, $rA", GatherOp,
830 []>;
831
832// gb: Gather all low order bits from each word in $rA into a single
833// 4-bit quantity stored in $rT
834def GB:
835 RRForm_1<0b00001101100, (outs R16C:$rT), (ins VECREG:$rA),
836 "gb\t$rT, $rA", GatherOp,
837 []>;
838
839// avgb: average bytes
840def AVGB:
841 RRForm<0b11001011000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
842 "avgb\t$rT, $rA, $rB", ByteOp,
843 []>;
844
845// absdb: absolute difference of bytes
846def ABSDB:
847 RRForm<0b11001010000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
848 "absdb\t$rT, $rA, $rB", ByteOp,
849 []>;
850
851// sumb: sum bytes into halfwords
852def SUMB:
853 RRForm<0b11001010010, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
854 "sumb\t$rT, $rA, $rB", ByteOp,
855 []>;
856
857// Sign extension operations:
858def XSBHvec:
859 RRForm_1<0b01101101010, (outs VECREG:$rDst), (ins VECREG:$rSrc),
860 "xsbh\t$rDst, $rSrc", IntegerOp,
861 [(set (v8i16 VECREG:$rDst), (sext (v16i8 VECREG:$rSrc)))]>;
862
863// Ordinary form for XSBH
864def XSBHr16:
865 RRForm_1<0b01101101010, (outs R16C:$rDst), (ins R16C:$rSrc),
866 "xsbh\t$rDst, $rSrc", IntegerOp,
867 [(set R16C:$rDst, (sext_inreg R16C:$rSrc, i8))]>;
868
Scott Michel438be252007-12-17 22:32:34 +0000869def XSBHr8:
870 RRForm_1<0b01101101010, (outs R16C:$rDst), (ins R8C:$rSrc),
871 "xsbh\t$rDst, $rSrc", IntegerOp,
872 [(set R16C:$rDst, (sext R8C:$rSrc))]>;
873
Scott Michel8b6b4202007-12-04 22:35:58 +0000874// 32-bit form for XSBH: used to sign extend 8-bit quantities to 16-bit
875// quantities to 32-bit quantities via a 32-bit register (see the sext 8->32
876// pattern below). Intentionally doesn't match a pattern because we want the
877// sext 8->32 pattern to do the work for us, namely because we need the extra
878// XSHWr32.
879def XSBHr32:
880 RRForm_1<0b01101101010, (outs R32C:$rDst), (ins R32C:$rSrc),
881 "xsbh\t$rDst, $rSrc", IntegerOp,
882 [(set R32C:$rDst, (sext_inreg R32C:$rSrc, i8))]>;
883
884// Sign extend halfwords to words:
885def XSHWvec:
886 RRForm_1<0b01101101010, (outs VECREG:$rDest), (ins VECREG:$rSrc),
887 "xshw\t$rDest, $rSrc", IntegerOp,
888 [(set (v4i32 VECREG:$rDest), (sext (v8i16 VECREG:$rSrc)))]>;
889
890def XSHWr32:
891 RRForm_1<0b01101101010, (outs R32C:$rDst), (ins R32C:$rSrc),
892 "xshw\t$rDst, $rSrc", IntegerOp,
893 [(set R32C:$rDst, (sext_inreg R32C:$rSrc, i16))]>;
894
895def XSHWr16:
896 RRForm_1<0b01101101010, (outs R32C:$rDst), (ins R16C:$rSrc),
897 "xshw\t$rDst, $rSrc", IntegerOp,
898 [(set R32C:$rDst, (sext R16C:$rSrc))]>;
899
900def XSWDvec:
901 RRForm_1<0b01100101010, (outs VECREG:$rDst), (ins VECREG:$rSrc),
902 "xswd\t$rDst, $rSrc", IntegerOp,
903 [(set (v2i64 VECREG:$rDst), (sext (v4i32 VECREG:$rSrc)))]>;
904
905def XSWDr64:
906 RRForm_1<0b01100101010, (outs R64C:$rDst), (ins R64C:$rSrc),
907 "xswd\t$rDst, $rSrc", IntegerOp,
908 [(set R64C:$rDst, (sext_inreg R64C:$rSrc, i32))]>;
909
910def XSWDr32:
911 RRForm_1<0b01100101010, (outs R64C:$rDst), (ins R32C:$rSrc),
912 "xswd\t$rDst, $rSrc", IntegerOp,
913 [(set R64C:$rDst, (SPUsext32_to_64 R32C:$rSrc))]>;
914
915def : Pat<(sext R32C:$inp),
916 (XSWDr32 R32C:$inp)>;
917
918// AND operations
Scott Michel8b6b4202007-12-04 22:35:58 +0000919
Scott Michel97872d32008-02-23 18:41:37 +0000920class ANDInst<dag OOL, dag IOL, list<dag> pattern> :
921 RRForm<0b10000011000, OOL, IOL, "and\t$rT, $rA, $rB",
922 IntegerOp, pattern>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000923
Scott Michel97872d32008-02-23 18:41:37 +0000924class ANDVecInst<ValueType vectype>:
925 ANDInst<(outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
926 [(set (vectype VECREG:$rT), (and (vectype VECREG:$rA),
927 (vectype VECREG:$rB)))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000928
Scott Michel97872d32008-02-23 18:41:37 +0000929multiclass BitwiseAnd
930{
931 def v16i8: ANDVecInst<v16i8>;
932 def v8i16: ANDVecInst<v8i16>;
933 def v4i32: ANDVecInst<v4i32>;
934 def v2i64: ANDVecInst<v2i64>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000935
Scott Michel97872d32008-02-23 18:41:37 +0000936 def r64: ANDInst<(outs R64C:$rT), (ins R64C:$rA, R64C:$rB),
937 [(set R64C:$rT, (and R64C:$rA, R64C:$rB))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000938
Scott Michel97872d32008-02-23 18:41:37 +0000939 def r32: ANDInst<(outs R32C:$rT), (ins R32C:$rA, R32C:$rB),
940 [(set R32C:$rT, (and R32C:$rA, R32C:$rB))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000941
Scott Michel97872d32008-02-23 18:41:37 +0000942 def r16: ANDInst<(outs R16C:$rT), (ins R16C:$rA, R16C:$rB),
943 [(set R16C:$rT, (and R16C:$rA, R16C:$rB))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000944
Scott Michel97872d32008-02-23 18:41:37 +0000945 def r8: ANDInst<(outs R8C:$rT), (ins R8C:$rA, R8C:$rB),
946 [(set R8C:$rT, (and R8C:$rA, R8C:$rB))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000947
Scott Michel97872d32008-02-23 18:41:37 +0000948 //===---------------------------------------------
949 // Special instructions to perform the fabs instruction
950 def fabs32: ANDInst<(outs R32FP:$rT), (ins R32FP:$rA, R32C:$rB),
951 [/* Intentionally does not match a pattern */]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000952
Scott Michel97872d32008-02-23 18:41:37 +0000953 def fabs64: ANDInst<(outs R64FP:$rT), (ins R64FP:$rA, VECREG:$rB),
954 [/* Intentionally does not match a pattern */]>;
Scott Michel438be252007-12-17 22:32:34 +0000955
Scott Michel97872d32008-02-23 18:41:37 +0000956 // Could use v4i32, but won't for clarity
957 def fabsvec: ANDInst<(outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
958 [/* Intentionally does not match a pattern */]>;
959
960 //===---------------------------------------------
961
962 // Hacked form of AND to zero-extend 16-bit quantities to 32-bit
963 // quantities -- see 16->32 zext pattern.
964 //
965 // This pattern is somewhat artificial, since it might match some
966 // compiler generated pattern but it is unlikely to do so.
967
968 def i16i32: ANDInst<(outs R32C:$rT), (ins R16C:$rA, R32C:$rB),
969 [(set R32C:$rT, (and (zext R16C:$rA), R32C:$rB))]>;
970}
971
972defm AND : BitwiseAnd;
Scott Michel8b6b4202007-12-04 22:35:58 +0000973
974// N.B.: vnot_conv is one of those special target selection pattern fragments,
975// in which we expect there to be a bit_convert on the constant. Bear in mind
976// that llvm translates "not <reg>" to "xor <reg>, -1" (or in this case, a
977// constant -1 vector.)
Scott Michel8b6b4202007-12-04 22:35:58 +0000978
Scott Michel97872d32008-02-23 18:41:37 +0000979class ANDCInst<dag OOL, dag IOL, list<dag> pattern>:
980 RRForm<0b10000011010, OOL, IOL, "andc\t$rT, $rA, $rB",
981 IntegerOp, pattern>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000982
Scott Michel97872d32008-02-23 18:41:37 +0000983class ANDCVecInst<ValueType vectype>:
984 ANDCInst<(outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
985 [(set (vectype VECREG:$rT), (and (vectype VECREG:$rA),
986 (vnot (vectype VECREG:$rB))))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000987
Scott Michel97872d32008-02-23 18:41:37 +0000988class ANDCRegInst<RegisterClass rclass>:
989 ANDCInst<(outs rclass:$rT), (ins rclass:$rA, rclass:$rB),
990 [(set rclass:$rT, (and rclass:$rA, (not rclass:$rB)))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000991
Scott Michel97872d32008-02-23 18:41:37 +0000992multiclass AndComplement
993{
994 def v16i8: ANDCVecInst<v16i8>;
995 def v8i16: ANDCVecInst<v8i16>;
996 def v4i32: ANDCVecInst<v4i32>;
997 def v2i64: ANDCVecInst<v2i64>;
Scott Michel8b6b4202007-12-04 22:35:58 +0000998
Scott Michel97872d32008-02-23 18:41:37 +0000999 def r128: ANDCRegInst<GPRC>;
1000 def r64: ANDCRegInst<R64C>;
1001 def r32: ANDCRegInst<R32C>;
1002 def r16: ANDCRegInst<R16C>;
1003 def r8: ANDCRegInst<R8C>;
1004}
Scott Michel438be252007-12-17 22:32:34 +00001005
Scott Michel97872d32008-02-23 18:41:37 +00001006defm ANDC : AndComplement;
Scott Michel8b6b4202007-12-04 22:35:58 +00001007
Scott Michel97872d32008-02-23 18:41:37 +00001008class ANDBIInst<dag OOL, dag IOL, list<dag> pattern>:
1009 RI10Form<0b01101000, OOL, IOL, "andbi\t$rT, $rA, $val",
1010 IntegerOp, pattern>;
Scott Michel438be252007-12-17 22:32:34 +00001011
Scott Michel97872d32008-02-23 18:41:37 +00001012multiclass AndByteImm
1013{
1014 def v16i8: ANDBIInst<(outs VECREG:$rT), (ins VECREG:$rA, u10imm:$val),
1015 [(set (v16i8 VECREG:$rT),
1016 (and (v16i8 VECREG:$rA),
1017 (v16i8 v16i8U8Imm:$val)))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001018
Scott Michel97872d32008-02-23 18:41:37 +00001019 def r8: ANDBIInst<(outs R8C:$rT), (ins R8C:$rA, u10imm_i8:$val),
1020 [(set R8C:$rT, (and R8C:$rA, immU8:$val))]>;
1021}
Scott Michel438be252007-12-17 22:32:34 +00001022
Scott Michel97872d32008-02-23 18:41:37 +00001023defm ANDBI : AndByteImm;
Scott Michel8b6b4202007-12-04 22:35:58 +00001024
Scott Michel97872d32008-02-23 18:41:37 +00001025class ANDHIInst<dag OOL, dag IOL, list<dag> pattern> :
1026 RI10Form<0b10101000, OOL, IOL, "andhi\t$rT, $rA, $val",
1027 IntegerOp, pattern>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001028
Scott Michel97872d32008-02-23 18:41:37 +00001029multiclass AndHalfwordImm
1030{
1031 def v8i16: ANDHIInst<(outs VECREG:$rT), (ins VECREG:$rA, s10imm:$val),
1032 [(set (v8i16 VECREG:$rT),
1033 (and (v8i16 VECREG:$rA), v8i16SExt10Imm:$val))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001034
Scott Michel97872d32008-02-23 18:41:37 +00001035 def r16: ANDHIInst<(outs R16C:$rT), (ins R16C:$rA, u10imm:$val),
1036 [(set R16C:$rT, (and R16C:$rA, i16ImmUns10:$val))]>;
Scott Michel438be252007-12-17 22:32:34 +00001037
Scott Michel97872d32008-02-23 18:41:37 +00001038 // Zero-extend i8 to i16:
1039 def i8i16: ANDHIInst<(outs R16C:$rT), (ins R8C:$rA, u10imm:$val),
1040 [(set R16C:$rT, (and (zext R8C:$rA), i16ImmUns10:$val))]>;
1041}
Scott Michel8b6b4202007-12-04 22:35:58 +00001042
Scott Michel97872d32008-02-23 18:41:37 +00001043defm ANDHI : AndHalfwordImm;
1044
1045class ANDIInst<dag OOL, dag IOL, list<dag> pattern> :
1046 RI10Form<0b00101000, OOL, IOL, "andi\t$rT, $rA, $val",
1047 IntegerOp, pattern>;
1048
1049multiclass AndWordImm
1050{
1051 def v4i32: ANDIInst<(outs VECREG:$rT), (ins VECREG:$rA, s10imm:$val),
1052 [(set (v4i32 VECREG:$rT),
1053 (and (v4i32 VECREG:$rA), v4i32SExt10Imm:$val))]>;
1054
1055 def r32: ANDIInst<(outs R32C:$rT), (ins R32C:$rA, s10imm_i32:$val),
1056 [(set R32C:$rT, (and R32C:$rA, i32ImmSExt10:$val))]>;
1057
1058 // Hacked form of ANDI to zero-extend i8 quantities to i32. See the zext 8->32
1059 // pattern below.
1060 def i8i32: ANDIInst<(outs R32C:$rT), (ins R8C:$rA, s10imm_i32:$val),
1061 [(set R32C:$rT,
1062 (and (zext R8C:$rA), i32ImmSExt10:$val))]>;
1063
1064 // Hacked form of ANDI to zero-extend i16 quantities to i32. See the
1065 // zext 16->32 pattern below.
1066 //
1067 // Note that this pattern is somewhat artificial, since it might match
1068 // something the compiler generates but is unlikely to occur in practice.
1069 def i16i32: ANDIInst<(outs R32C:$rT), (ins R16C:$rA, s10imm_i32:$val),
1070 [(set R32C:$rT,
1071 (and (zext R16C:$rA), i32ImmSExt10:$val))]>;
1072}
1073
1074defm ANDI : AndWordImm;
1075
1076//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
Scott Michel8b6b4202007-12-04 22:35:58 +00001077// Bitwise OR group:
Scott Michel97872d32008-02-23 18:41:37 +00001078//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
1079
Scott Michel8b6b4202007-12-04 22:35:58 +00001080// Bitwise "or" (N.B.: These are also register-register copy instructions...)
Scott Michel97872d32008-02-23 18:41:37 +00001081class ORInst<dag OOL, dag IOL, list<dag> pattern>:
1082 RRForm<0b10000010000, OOL, IOL, "or\t$rT, $rA, $rB",
1083 IntegerOp, pattern>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001084
Scott Michel97872d32008-02-23 18:41:37 +00001085class ORVecInst<ValueType vectype>:
1086 ORInst<(outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
1087 [(set (vectype VECREG:$rT), (or (vectype VECREG:$rA),
1088 (vectype VECREG:$rB)))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001089
Scott Michel97872d32008-02-23 18:41:37 +00001090class ORRegInst<RegisterClass rclass>:
1091 ORInst<(outs rclass:$rT), (ins rclass:$rA, rclass:$rB),
1092 [(set rclass:$rT, (or rclass:$rA, rclass:$rB))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001093
Scott Michel97872d32008-02-23 18:41:37 +00001094class ORPromoteScalar<RegisterClass rclass>:
1095 ORInst<(outs VECREG:$rT), (ins rclass:$rA, rclass:$rB),
1096 [/* no pattern */]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001097
Scott Michel97872d32008-02-23 18:41:37 +00001098class ORExtractElt<RegisterClass rclass>:
1099 ORInst<(outs rclass:$rT), (ins VECREG:$rA, VECREG:$rB),
1100 [/* no pattern */]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001101
Scott Michel97872d32008-02-23 18:41:37 +00001102multiclass BitwiseOr
1103{
1104 def v16i8: ORVecInst<v16i8>;
1105 def v8i16: ORVecInst<v8i16>;
1106 def v4i32: ORVecInst<v4i32>;
1107 def v2i64: ORVecInst<v2i64>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001108
Scott Michel97872d32008-02-23 18:41:37 +00001109 def v4f32: ORInst<(outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
1110 [(set (v4f32 VECREG:$rT),
1111 (v4f32 (bitconvert (or (v4i32 VECREG:$rA),
1112 (v4i32 VECREG:$rB)))))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001113
Scott Michel97872d32008-02-23 18:41:37 +00001114 def v2f64: ORInst<(outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
1115 [(set (v2f64 VECREG:$rT),
1116 (v2f64 (bitconvert (or (v2i64 VECREG:$rA),
1117 (v2i64 VECREG:$rB)))))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001118
Scott Michel97872d32008-02-23 18:41:37 +00001119 def r64: ORRegInst<R64C>;
1120 def r32: ORRegInst<R32C>;
1121 def r16: ORRegInst<R16C>;
1122 def r8: ORRegInst<R8C>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001123
Scott Michel97872d32008-02-23 18:41:37 +00001124 // OR instructions used to copy f32 and f64 registers.
1125 def f32: ORInst<(outs R32FP:$rT), (ins R32FP:$rA, R32FP:$rB),
1126 [/* no pattern */]>;
Scott Michel438be252007-12-17 22:32:34 +00001127
Scott Michel97872d32008-02-23 18:41:37 +00001128 def f64: ORInst<(outs R64FP:$rT), (ins R64FP:$rA, R64FP:$rB),
1129 [/* no pattern */]>;
Scott Michel754d8662007-12-20 00:44:13 +00001130
Scott Michel97872d32008-02-23 18:41:37 +00001131 // scalar->vector promotion:
1132 def v16i8_i8: ORPromoteScalar<R8C>;
1133 def v8i16_i16: ORPromoteScalar<R16C>;
1134 def v4i32_i32: ORPromoteScalar<R32C>;
1135 def v2i64_i64: ORPromoteScalar<R64C>;
1136 def v4f32_f32: ORPromoteScalar<R32FP>;
1137 def v2f64_f64: ORPromoteScalar<R64FP>;
Scott Michel754d8662007-12-20 00:44:13 +00001138
Scott Michel97872d32008-02-23 18:41:37 +00001139 // extract element 0:
1140 def i8_v16i8: ORExtractElt<R8C>;
1141 def i16_v8i16: ORExtractElt<R16C>;
1142 def i32_v4i32: ORExtractElt<R32C>;
1143 def i64_v2i64: ORExtractElt<R64C>;
1144 def f32_v4f32: ORExtractElt<R32FP>;
1145 def f64_v2f64: ORExtractElt<R64FP>;
1146}
Scott Michel438be252007-12-17 22:32:34 +00001147
Scott Michel97872d32008-02-23 18:41:37 +00001148defm OR : BitwiseOr;
1149
1150// scalar->vector promotion patterns:
Scott Michel438be252007-12-17 22:32:34 +00001151def : Pat<(v16i8 (SPUpromote_scalar R8C:$rA)),
Scott Michel5a6f17b2008-01-30 02:55:46 +00001152 (ORv16i8_i8 R8C:$rA, R8C:$rA)>;
Scott Michel438be252007-12-17 22:32:34 +00001153
Scott Michel8b6b4202007-12-04 22:35:58 +00001154def : Pat<(v8i16 (SPUpromote_scalar R16C:$rA)),
1155 (ORv8i16_i16 R16C:$rA, R16C:$rA)>;
1156
Scott Michel8b6b4202007-12-04 22:35:58 +00001157def : Pat<(v4i32 (SPUpromote_scalar R32C:$rA)),
1158 (ORv4i32_i32 R32C:$rA, R32C:$rA)>;
1159
Scott Michel8b6b4202007-12-04 22:35:58 +00001160def : Pat<(v2i64 (SPUpromote_scalar R64C:$rA)),
1161 (ORv2i64_i64 R64C:$rA, R64C:$rA)>;
1162
Scott Michel8b6b4202007-12-04 22:35:58 +00001163def : Pat<(v4f32 (SPUpromote_scalar R32FP:$rA)),
1164 (ORv4f32_f32 R32FP:$rA, R32FP:$rA)>;
1165
Scott Michel8b6b4202007-12-04 22:35:58 +00001166def : Pat<(v2f64 (SPUpromote_scalar R64FP:$rA)),
1167 (ORv2f64_f64 R64FP:$rA, R64FP:$rA)>;
1168
1169// ORi*_v*: Used to extract vector element 0 (the preferred slot)
Scott Michel438be252007-12-17 22:32:34 +00001170
1171def : Pat<(SPUextract_elt0 (v16i8 VECREG:$rA)),
Scott Michel5a6f17b2008-01-30 02:55:46 +00001172 (ORi8_v16i8 VECREG:$rA, VECREG:$rA)>;
Scott Michel438be252007-12-17 22:32:34 +00001173
Scott Michel394e26d2008-01-17 20:38:41 +00001174def : Pat<(SPUextract_elt0_chained (v16i8 VECREG:$rA)),
Scott Michel5a6f17b2008-01-30 02:55:46 +00001175 (ORi8_v16i8 VECREG:$rA, VECREG:$rA)>;
Scott Michel394e26d2008-01-17 20:38:41 +00001176
Scott Michel8b6b4202007-12-04 22:35:58 +00001177def : Pat<(SPUextract_elt0 (v8i16 VECREG:$rA)),
1178 (ORi16_v8i16 VECREG:$rA, VECREG:$rA)>;
1179
1180def : Pat<(SPUextract_elt0_chained (v8i16 VECREG:$rA)),
1181 (ORi16_v8i16 VECREG:$rA, VECREG:$rA)>;
1182
Scott Michel8b6b4202007-12-04 22:35:58 +00001183def : Pat<(SPUextract_elt0 (v4i32 VECREG:$rA)),
1184 (ORi32_v4i32 VECREG:$rA, VECREG:$rA)>;
1185
1186def : Pat<(SPUextract_elt0_chained (v4i32 VECREG:$rA)),
1187 (ORi32_v4i32 VECREG:$rA, VECREG:$rA)>;
1188
Scott Michel8b6b4202007-12-04 22:35:58 +00001189def : Pat<(SPUextract_elt0 (v2i64 VECREG:$rA)),
1190 (ORi64_v2i64 VECREG:$rA, VECREG:$rA)>;
1191
1192def : Pat<(SPUextract_elt0_chained (v2i64 VECREG:$rA)),
1193 (ORi64_v2i64 VECREG:$rA, VECREG:$rA)>;
1194
Scott Michel8b6b4202007-12-04 22:35:58 +00001195def : Pat<(SPUextract_elt0 (v4f32 VECREG:$rA)),
1196 (ORf32_v4f32 VECREG:$rA, VECREG:$rA)>;
1197
1198def : Pat<(SPUextract_elt0_chained (v4f32 VECREG:$rA)),
1199 (ORf32_v4f32 VECREG:$rA, VECREG:$rA)>;
1200
Scott Michel8b6b4202007-12-04 22:35:58 +00001201def : Pat<(SPUextract_elt0 (v2f64 VECREG:$rA)),
1202 (ORf64_v2f64 VECREG:$rA, VECREG:$rA)>;
1203
1204def : Pat<(SPUextract_elt0_chained (v2f64 VECREG:$rA)),
1205 (ORf64_v2f64 VECREG:$rA, VECREG:$rA)>;
1206
Scott Michel97872d32008-02-23 18:41:37 +00001207// ORC: Bitwise "or" with complement (c = a | ~b)
Scott Michel8b6b4202007-12-04 22:35:58 +00001208
Scott Michel97872d32008-02-23 18:41:37 +00001209class ORCInst<dag OOL, dag IOL, list<dag> pattern>:
1210 RRForm<0b10010010000, OOL, IOL, "orc\t$rT, $rA, $rB",
1211 IntegerOp, pattern>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001212
Scott Michel97872d32008-02-23 18:41:37 +00001213class ORCVecInst<ValueType vectype>:
1214 ORCInst<(outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
1215 [(set (vectype VECREG:$rT), (or (vectype VECREG:$rA),
1216 (vnot (vectype VECREG:$rB))))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001217
Scott Michel97872d32008-02-23 18:41:37 +00001218class ORCRegInst<RegisterClass rclass>:
1219 ORCInst<(outs rclass:$rT), (ins rclass:$rA, rclass:$rB),
1220 [(set rclass:$rT, (or rclass:$rA, (not rclass:$rB)))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001221
Scott Michel97872d32008-02-23 18:41:37 +00001222multiclass BitwiseOrComplement
1223{
1224 def v16i8: ORCVecInst<v16i8>;
1225 def v8i16: ORCVecInst<v8i16>;
1226 def v4i32: ORCVecInst<v4i32>;
1227 def v2i64: ORCVecInst<v2i64>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001228
Scott Michel97872d32008-02-23 18:41:37 +00001229 def r64: ORCRegInst<R64C>;
1230 def r32: ORCRegInst<R32C>;
1231 def r16: ORCRegInst<R16C>;
1232 def r8: ORCRegInst<R8C>;
1233}
1234
1235defm ORC : BitwiseOrComplement;
Scott Michel438be252007-12-17 22:32:34 +00001236
Scott Michel8b6b4202007-12-04 22:35:58 +00001237// OR byte immediate
Scott Michel97872d32008-02-23 18:41:37 +00001238class ORBIInst<dag OOL, dag IOL, list<dag> pattern>:
1239 RI10Form<0b01100000, OOL, IOL, "orbi\t$rT, $rA, $val",
1240 IntegerOp, pattern>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001241
Scott Michel97872d32008-02-23 18:41:37 +00001242class ORBIVecInst<ValueType vectype, PatLeaf immpred>:
1243 ORBIInst<(outs VECREG:$rT), (ins VECREG:$rA, u10imm:$val),
1244 [(set (v16i8 VECREG:$rT), (or (vectype VECREG:$rA),
1245 (vectype immpred:$val)))]>;
1246
1247multiclass BitwiseOrByteImm
1248{
1249 def v16i8: ORBIVecInst<v16i8, v16i8U8Imm>;
1250
1251 def r8: ORBIInst<(outs R8C:$rT), (ins R8C:$rA, u10imm_i8:$val),
1252 [(set R8C:$rT, (or R8C:$rA, immU8:$val))]>;
1253}
1254
1255defm ORBI : BitwiseOrByteImm;
Scott Michel438be252007-12-17 22:32:34 +00001256
Scott Michel8b6b4202007-12-04 22:35:58 +00001257// OR halfword immediate
Scott Michel97872d32008-02-23 18:41:37 +00001258class ORHIInst<dag OOL, dag IOL, list<dag> pattern>:
1259 RI10Form<0b10100000, OOL, IOL, "orhi\t$rT, $rA, $val",
1260 IntegerOp, pattern>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001261
Scott Michel97872d32008-02-23 18:41:37 +00001262class ORHIVecInst<ValueType vectype, PatLeaf immpred>:
1263 ORHIInst<(outs VECREG:$rT), (ins VECREG:$rA, u10imm:$val),
1264 [(set (vectype VECREG:$rT), (or (vectype VECREG:$rA),
1265 immpred:$val))]>;
Scott Michel438be252007-12-17 22:32:34 +00001266
Scott Michel97872d32008-02-23 18:41:37 +00001267multiclass BitwiseOrHalfwordImm
1268{
1269 def v8i16: ORHIVecInst<v8i16, v8i16Uns10Imm>;
1270
1271 def r16: ORHIInst<(outs R16C:$rT), (ins R16C:$rA, u10imm:$val),
1272 [(set R16C:$rT, (or R16C:$rA, i16ImmUns10:$val))]>;
1273
1274 // Specialized ORHI form used to promote 8-bit registers to 16-bit
1275 def i8i16: ORHIInst<(outs R16C:$rT), (ins R8C:$rA, s10imm:$val),
1276 [(set R16C:$rT, (or (anyext R8C:$rA),
1277 i16ImmSExt10:$val))]>;
1278}
1279
1280defm ORHI : BitwiseOrHalfwordImm;
1281
1282class ORIInst<dag OOL, dag IOL, list<dag> pattern>:
1283 RI10Form<0b00100000, OOL, IOL, "ori\t$rT, $rA, $val",
1284 IntegerOp, pattern>;
1285
1286class ORIVecInst<ValueType vectype, PatLeaf immpred>:
1287 ORIInst<(outs VECREG:$rT), (ins VECREG:$rA, u10imm:$val),
1288 [(set (vectype VECREG:$rT), (or (vectype VECREG:$rA),
1289 immpred:$val))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001290
1291// Bitwise "or" with immediate
Scott Michel97872d32008-02-23 18:41:37 +00001292multiclass BitwiseOrImm
1293{
1294 def v4i32: ORIVecInst<v4i32, v4i32Uns10Imm>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001295
Scott Michel97872d32008-02-23 18:41:37 +00001296 def r32: ORIInst<(outs R32C:$rT), (ins R32C:$rA, u10imm_i32:$val),
1297 [(set R32C:$rT, (or R32C:$rA, i32ImmUns10:$val))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001298
Scott Michel97872d32008-02-23 18:41:37 +00001299 // i16i32: hacked version of the ori instruction to extend 16-bit quantities
1300 // to 32-bit quantities. used exclusively to match "anyext" conversions (vide
1301 // infra "anyext 16->32" pattern.)
1302 def i16i32: ORIInst<(outs R32C:$rT), (ins R16C:$rA, s10imm_i32:$val),
1303 [(set R32C:$rT, (or (anyext R16C:$rA),
1304 i32ImmSExt10:$val))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001305
Scott Michel97872d32008-02-23 18:41:37 +00001306 // i8i32: Hacked version of the ORI instruction to extend 16-bit quantities
1307 // to 32-bit quantities. Used exclusively to match "anyext" conversions (vide
1308 // infra "anyext 16->32" pattern.)
1309 def i8i32: ORIInst<(outs R32C:$rT), (ins R8C:$rA, s10imm_i32:$val),
1310 [(set R32C:$rT, (or (anyext R8C:$rA),
1311 i32ImmSExt10:$val))]>;
1312}
Scott Michel8b6b4202007-12-04 22:35:58 +00001313
Scott Michel97872d32008-02-23 18:41:37 +00001314defm ORI : BitwiseOrImm;
Scott Michel438be252007-12-17 22:32:34 +00001315
Scott Michel8b6b4202007-12-04 22:35:58 +00001316// ORX: "or" across the vector: or's $rA's word slots leaving the result in
1317// $rT[0], slots 1-3 are zeroed.
1318//
Scott Michel438be252007-12-17 22:32:34 +00001319// FIXME: Needs to match an intrinsic pattern.
Scott Michel8b6b4202007-12-04 22:35:58 +00001320def ORXv4i32:
1321 RRForm<0b10010010000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
1322 "orx\t$rT, $rA, $rB", IntegerOp,
1323 []>;
1324
Scott Michel438be252007-12-17 22:32:34 +00001325// XOR:
Scott Michel8b6b4202007-12-04 22:35:58 +00001326def XORv16i8:
1327 RRForm<0b10010010000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
1328 "xor\t$rT, $rA, $rB", IntegerOp,
1329 [(set (v16i8 VECREG:$rT), (xor (v16i8 VECREG:$rA), (v16i8 VECREG:$rB)))]>;
1330
1331def XORv8i16:
1332 RRForm<0b10010010000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
1333 "xor\t$rT, $rA, $rB", IntegerOp,
1334 [(set (v8i16 VECREG:$rT), (xor (v8i16 VECREG:$rA), (v8i16 VECREG:$rB)))]>;
1335
1336def XORv4i32:
1337 RRForm<0b10010010000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
1338 "xor\t$rT, $rA, $rB", IntegerOp,
1339 [(set (v4i32 VECREG:$rT), (xor (v4i32 VECREG:$rA), (v4i32 VECREG:$rB)))]>;
1340
1341def XORr32:
1342 RRForm<0b10010010000, (outs R32C:$rT), (ins R32C:$rA, R32C:$rB),
1343 "xor\t$rT, $rA, $rB", IntegerOp,
1344 [(set R32C:$rT, (xor R32C:$rA, R32C:$rB))]>;
1345
1346//==----------------------------------------------------------
1347// Special forms for floating point instructions.
1348// Bitwise ORs and ANDs don't make sense for normal floating
1349// point numbers. These operations (fneg and fabs), however,
1350// require bitwise logical ops to manipulate the sign bit.
1351def XORfneg32:
1352 RRForm<0b10010010000, (outs R32FP:$rT), (ins R32FP:$rA, R32C:$rB),
1353 "xor\t$rT, $rA, $rB", IntegerOp,
1354 [/* Intentionally does not match a pattern, see fneg32 */]>;
1355
1356// KLUDGY! Better way to do this without a VECREG? bitconvert?
1357// VECREG is assumed to contain two identical 64-bit masks, so
1358// it doesn't matter which word we select for the xor
1359def XORfneg64:
1360 RRForm<0b10010010000, (outs R64FP:$rT), (ins R64FP:$rA, VECREG:$rB),
1361 "xor\t$rT, $rA, $rB", IntegerOp,
1362 [/* Intentionally does not match a pattern, see fneg64 */]>;
1363
1364// Could use XORv4i32, but will use this for clarity
1365def XORfnegvec:
1366 RRForm<0b10010010000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
1367 "xor\t$rT, $rA, $rB", IntegerOp,
1368 [/* Intentionally does not match a pattern, see fneg{32,64} */]>;
1369
1370//==----------------------------------------------------------
1371
1372def XORr16:
1373 RRForm<0b10010010000, (outs R16C:$rT), (ins R16C:$rA, R16C:$rB),
1374 "xor\t$rT, $rA, $rB", IntegerOp,
1375 [(set R16C:$rT, (xor R16C:$rA, R16C:$rB))]>;
1376
Scott Michel438be252007-12-17 22:32:34 +00001377def XORr8:
1378 RRForm<0b10010010000, (outs R8C:$rT), (ins R8C:$rA, R8C:$rB),
1379 "xor\t$rT, $rA, $rB", IntegerOp,
1380 [(set R8C:$rT, (xor R8C:$rA, R8C:$rB))]>;
1381
Scott Michel97872d32008-02-23 18:41:37 +00001382class XORBIInst<dag OOL, dag IOL, list<dag> pattern>:
1383 RI10Form<0b01100000, OOL, IOL, "xorbi\t$rT, $rA, $val",
1384 IntegerOp, pattern>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001385
Scott Michel97872d32008-02-23 18:41:37 +00001386multiclass XorByteImm
1387{
1388 def v16i8:
1389 XORBIInst<(outs VECREG:$rT), (ins VECREG:$rA, u10imm:$val),
1390 [(set (v16i8 VECREG:$rT), (xor (v16i8 VECREG:$rA), v16i8U8Imm:$val))]>;
1391
1392 def r8:
1393 XORBIInst<(outs R8C:$rT), (ins R8C:$rA, u10imm_i8:$val),
1394 [(set R8C:$rT, (xor R8C:$rA, immU8:$val))]>;
1395}
1396
1397defm XORBI : XorByteImm;
Scott Michel438be252007-12-17 22:32:34 +00001398
Scott Michel8b6b4202007-12-04 22:35:58 +00001399def XORHIv8i16:
Scott Michel97872d32008-02-23 18:41:37 +00001400 RI10Form<0b10100000, (outs VECREG:$rT), (ins VECREG:$rA, u10imm:$val),
Scott Michel8b6b4202007-12-04 22:35:58 +00001401 "xorhi\t$rT, $rA, $val", IntegerOp,
1402 [(set (v8i16 VECREG:$rT), (xor (v8i16 VECREG:$rA),
1403 v8i16SExt10Imm:$val))]>;
1404
1405def XORHIr16:
1406 RI10Form<0b10100000, (outs R16C:$rT), (ins R16C:$rA, s10imm:$val),
1407 "xorhi\t$rT, $rA, $val", IntegerOp,
1408 [(set R16C:$rT, (xor R16C:$rA, i16ImmSExt10:$val))]>;
1409
1410def XORIv4i32:
Scott Michel97872d32008-02-23 18:41:37 +00001411 RI10Form<0b00100000, (outs VECREG:$rT), (ins VECREG:$rA, u10imm:$val),
Scott Michel8b6b4202007-12-04 22:35:58 +00001412 "xori\t$rT, $rA, $val", IntegerOp,
1413 [(set (v4i32 VECREG:$rT), (xor (v4i32 VECREG:$rA),
1414 v4i32SExt10Imm:$val))]>;
1415
1416def XORIr32:
1417 RI10Form<0b00100000, (outs R32C:$rT), (ins R32C:$rA, s10imm_i32:$val),
1418 "xori\t$rT, $rA, $val", IntegerOp,
1419 [(set R32C:$rT, (xor R32C:$rA, i32ImmSExt10:$val))]>;
1420
1421// NAND:
1422def NANDv16i8:
1423 RRForm<0b10010010000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
1424 "nand\t$rT, $rA, $rB", IntegerOp,
1425 [(set (v16i8 VECREG:$rT), (vnot (and (v16i8 VECREG:$rA),
1426 (v16i8 VECREG:$rB))))]>;
1427
1428def NANDv8i16:
1429 RRForm<0b10010010000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
1430 "nand\t$rT, $rA, $rB", IntegerOp,
1431 [(set (v8i16 VECREG:$rT), (vnot (and (v8i16 VECREG:$rA),
1432 (v8i16 VECREG:$rB))))]>;
1433
1434def NANDv4i32:
1435 RRForm<0b10010010000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
1436 "nand\t$rT, $rA, $rB", IntegerOp,
1437 [(set (v4i32 VECREG:$rT), (vnot (and (v4i32 VECREG:$rA),
1438 (v4i32 VECREG:$rB))))]>;
1439
1440def NANDr32:
1441 RRForm<0b10010010000, (outs R32C:$rT), (ins R32C:$rA, R32C:$rB),
1442 "nand\t$rT, $rA, $rB", IntegerOp,
1443 [(set R32C:$rT, (not (and R32C:$rA, R32C:$rB)))]>;
1444
1445def NANDr16:
1446 RRForm<0b10010010000, (outs R16C:$rT), (ins R16C:$rA, R16C:$rB),
1447 "nand\t$rT, $rA, $rB", IntegerOp,
1448 [(set R16C:$rT, (not (and R16C:$rA, R16C:$rB)))]>;
1449
Scott Michel438be252007-12-17 22:32:34 +00001450def NANDr8:
1451 RRForm<0b10010010000, (outs R8C:$rT), (ins R8C:$rA, R8C:$rB),
1452 "nand\t$rT, $rA, $rB", IntegerOp,
1453 [(set R8C:$rT, (not (and R8C:$rA, R8C:$rB)))]>;
1454
Scott Michel8b6b4202007-12-04 22:35:58 +00001455// NOR:
1456def NORv16i8:
1457 RRForm<0b10010010000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
1458 "nor\t$rT, $rA, $rB", IntegerOp,
1459 [(set (v16i8 VECREG:$rT), (vnot (or (v16i8 VECREG:$rA),
1460 (v16i8 VECREG:$rB))))]>;
1461
1462def NORv8i16:
1463 RRForm<0b10010010000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
1464 "nor\t$rT, $rA, $rB", IntegerOp,
1465 [(set (v8i16 VECREG:$rT), (vnot (or (v8i16 VECREG:$rA),
1466 (v8i16 VECREG:$rB))))]>;
1467
1468def NORv4i32:
1469 RRForm<0b10010010000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
1470 "nor\t$rT, $rA, $rB", IntegerOp,
1471 [(set (v4i32 VECREG:$rT), (vnot (or (v4i32 VECREG:$rA),
1472 (v4i32 VECREG:$rB))))]>;
1473
1474def NORr32:
1475 RRForm<0b10010010000, (outs R32C:$rT), (ins R32C:$rA, R32C:$rB),
1476 "nor\t$rT, $rA, $rB", IntegerOp,
1477 [(set R32C:$rT, (not (or R32C:$rA, R32C:$rB)))]>;
1478
1479def NORr16:
1480 RRForm<0b10010010000, (outs R16C:$rT), (ins R16C:$rA, R16C:$rB),
1481 "nor\t$rT, $rA, $rB", IntegerOp,
1482 [(set R16C:$rT, (not (or R16C:$rA, R16C:$rB)))]>;
1483
Scott Michel438be252007-12-17 22:32:34 +00001484def NORr8:
1485 RRForm<0b10010010000, (outs R8C:$rT), (ins R8C:$rA, R8C:$rB),
1486 "nor\t$rT, $rA, $rB", IntegerOp,
1487 [(set R8C:$rT, (not (or R8C:$rA, R8C:$rB)))]>;
1488
Scott Michel8b6b4202007-12-04 22:35:58 +00001489// EQV: Equivalence (1 for each same bit, otherwise 0)
1490def EQVv16i8:
1491 RRForm<0b10010010000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
1492 "eqv\t$rT, $rA, $rB", IntegerOp,
1493 [(set (v16i8 VECREG:$rT), (or (and (v16i8 VECREG:$rA),
1494 (v16i8 VECREG:$rB)),
1495 (and (vnot (v16i8 VECREG:$rA)),
1496 (vnot (v16i8 VECREG:$rB)))))]>;
1497
1498def : Pat<(xor (v16i8 VECREG:$rA), (vnot (v16i8 VECREG:$rB))),
1499 (EQVv16i8 VECREG:$rA, VECREG:$rB)>;
1500
1501def : Pat<(xor (vnot (v16i8 VECREG:$rA)), (v16i8 VECREG:$rB)),
1502 (EQVv16i8 VECREG:$rA, VECREG:$rB)>;
1503
1504def EQVv8i16:
1505 RRForm<0b10010010000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
1506 "eqv\t$rT, $rA, $rB", IntegerOp,
1507 [(set (v8i16 VECREG:$rT), (or (and (v8i16 VECREG:$rA),
1508 (v8i16 VECREG:$rB)),
1509 (and (vnot (v8i16 VECREG:$rA)),
1510 (vnot (v8i16 VECREG:$rB)))))]>;
1511
1512def : Pat<(xor (v8i16 VECREG:$rA), (vnot (v8i16 VECREG:$rB))),
1513 (EQVv8i16 VECREG:$rA, VECREG:$rB)>;
1514
1515def : Pat<(xor (vnot (v8i16 VECREG:$rA)), (v8i16 VECREG:$rB)),
1516 (EQVv8i16 VECREG:$rA, VECREG:$rB)>;
1517
1518def EQVv4i32:
1519 RRForm<0b10010010000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
1520 "eqv\t$rT, $rA, $rB", IntegerOp,
1521 [(set (v4i32 VECREG:$rT), (or (and (v4i32 VECREG:$rA),
1522 (v4i32 VECREG:$rB)),
1523 (and (vnot (v4i32 VECREG:$rA)),
1524 (vnot (v4i32 VECREG:$rB)))))]>;
1525
1526def : Pat<(xor (v4i32 VECREG:$rA), (vnot (v4i32 VECREG:$rB))),
1527 (EQVv4i32 VECREG:$rA, VECREG:$rB)>;
1528
1529def : Pat<(xor (vnot (v4i32 VECREG:$rA)), (v4i32 VECREG:$rB)),
1530 (EQVv4i32 VECREG:$rA, VECREG:$rB)>;
1531
1532def EQVr32:
1533 RRForm<0b10010010000, (outs R32C:$rT), (ins R32C:$rA, R32C:$rB),
1534 "eqv\t$rT, $rA, $rB", IntegerOp,
1535 [(set R32C:$rT, (or (and R32C:$rA, R32C:$rB),
1536 (and (not R32C:$rA), (not R32C:$rB))))]>;
1537
1538def : Pat<(xor R32C:$rA, (not R32C:$rB)),
1539 (EQVr32 R32C:$rA, R32C:$rB)>;
1540
1541def : Pat<(xor (not R32C:$rA), R32C:$rB),
1542 (EQVr32 R32C:$rA, R32C:$rB)>;
1543
1544def EQVr16:
1545 RRForm<0b10010010000, (outs R16C:$rT), (ins R16C:$rA, R16C:$rB),
1546 "eqv\t$rT, $rA, $rB", IntegerOp,
1547 [(set R16C:$rT, (or (and R16C:$rA, R16C:$rB),
1548 (and (not R16C:$rA), (not R16C:$rB))))]>;
1549
1550def : Pat<(xor R16C:$rA, (not R16C:$rB)),
1551 (EQVr16 R16C:$rA, R16C:$rB)>;
1552
1553def : Pat<(xor (not R16C:$rA), R16C:$rB),
1554 (EQVr16 R16C:$rA, R16C:$rB)>;
1555
Scott Michel438be252007-12-17 22:32:34 +00001556def EQVr8:
1557 RRForm<0b10010010000, (outs R8C:$rT), (ins R8C:$rA, R8C:$rB),
1558 "eqv\t$rT, $rA, $rB", IntegerOp,
1559 [(set R8C:$rT, (or (and R8C:$rA, R8C:$rB),
1560 (and (not R8C:$rA), (not R8C:$rB))))]>;
1561
1562def : Pat<(xor R8C:$rA, (not R8C:$rB)),
1563 (EQVr8 R8C:$rA, R8C:$rB)>;
1564
1565def : Pat<(xor (not R8C:$rA), R8C:$rB),
1566 (EQVr8 R8C:$rA, R8C:$rB)>;
1567
Scott Michel8b6b4202007-12-04 22:35:58 +00001568// gcc optimizes (p & q) | (~p & ~q) -> ~(p | q) | (p & q), so match that
1569// pattern also:
1570def : Pat<(or (vnot (or (v16i8 VECREG:$rA), (v16i8 VECREG:$rB))),
1571 (and (v16i8 VECREG:$rA), (v16i8 VECREG:$rB))),
1572 (EQVv16i8 VECREG:$rA, VECREG:$rB)>;
1573
1574def : Pat<(or (vnot (or (v8i16 VECREG:$rA), (v8i16 VECREG:$rB))),
1575 (and (v8i16 VECREG:$rA), (v8i16 VECREG:$rB))),
1576 (EQVv8i16 VECREG:$rA, VECREG:$rB)>;
1577
1578def : Pat<(or (vnot (or (v4i32 VECREG:$rA), (v4i32 VECREG:$rB))),
1579 (and (v4i32 VECREG:$rA), (v4i32 VECREG:$rB))),
1580 (EQVv4i32 VECREG:$rA, VECREG:$rB)>;
1581
1582def : Pat<(or (not (or R32C:$rA, R32C:$rB)), (and R32C:$rA, R32C:$rB)),
1583 (EQVr32 R32C:$rA, R32C:$rB)>;
1584
1585def : Pat<(or (not (or R16C:$rA, R16C:$rB)), (and R16C:$rA, R16C:$rB)),
1586 (EQVr16 R16C:$rA, R16C:$rB)>;
1587
Scott Michel438be252007-12-17 22:32:34 +00001588def : Pat<(or (not (or R8C:$rA, R8C:$rB)), (and R8C:$rA, R8C:$rB)),
1589 (EQVr8 R8C:$rA, R8C:$rB)>;
1590
Scott Michel8b6b4202007-12-04 22:35:58 +00001591// Select bits:
1592def SELBv16i8:
1593 RRRForm<0b1000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB, VECREG:$rC),
1594 "selb\t$rT, $rA, $rB, $rC", IntegerOp,
1595 [(set (v16i8 VECREG:$rT),
Scott Michel97872d32008-02-23 18:41:37 +00001596 (SPUselb (v16i8 VECREG:$rA), (v16i8 VECREG:$rB),
Scott Michel8b6b4202007-12-04 22:35:58 +00001597 (v16i8 VECREG:$rC)))]>;
1598
1599def : Pat<(or (and (v16i8 VECREG:$rA), (v16i8 VECREG:$rC)),
1600 (and (v16i8 VECREG:$rB), (vnot (v16i8 VECREG:$rC)))),
1601 (SELBv16i8 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1602
1603def : Pat<(or (and (v16i8 VECREG:$rC), (v16i8 VECREG:$rA)),
1604 (and (v16i8 VECREG:$rB), (vnot (v16i8 VECREG:$rC)))),
1605 (SELBv16i8 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1606
1607def : Pat<(or (and (v16i8 VECREG:$rA), (v16i8 VECREG:$rC)),
1608 (and (vnot (v16i8 VECREG:$rC)), (v16i8 VECREG:$rB))),
1609 (SELBv16i8 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1610
1611def : Pat<(or (and (v16i8 VECREG:$rC), (v16i8 VECREG:$rA)),
1612 (and (vnot (v16i8 VECREG:$rC)), (v16i8 VECREG:$rB))),
1613 (SELBv16i8 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1614
1615def : Pat<(or (and (v16i8 VECREG:$rA), (vnot (v16i8 VECREG:$rC))),
1616 (and (v16i8 VECREG:$rB), (v16i8 VECREG:$rC))),
1617 (SELBv16i8 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1618
1619def : Pat<(or (and (v16i8 VECREG:$rA), (vnot (v16i8 VECREG:$rC))),
1620 (and (v16i8 VECREG:$rC), (v16i8 VECREG:$rB))),
1621 (SELBv16i8 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1622
1623def : Pat<(or (and (vnot (v16i8 VECREG:$rC)), (v16i8 VECREG:$rA)),
1624 (and (v16i8 VECREG:$rB), (v16i8 VECREG:$rC))),
1625 (SELBv16i8 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1626
1627def : Pat<(or (and (vnot (v16i8 VECREG:$rC)), (v16i8 VECREG:$rA)),
1628 (and (v16i8 VECREG:$rC), (v16i8 VECREG:$rB))),
1629 (SELBv16i8 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1630
1631def : Pat<(or (and (v16i8 VECREG:$rA), (v16i8 VECREG:$rC)),
1632 (and (v16i8 VECREG:$rB), (vnot (v16i8 VECREG:$rC)))),
1633 (SELBv16i8 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1634
1635def : Pat<(or (and (v16i8 VECREG:$rC), (v16i8 VECREG:$rA)),
1636 (and (v16i8 VECREG:$rB), (vnot (v16i8 VECREG:$rC)))),
1637 (SELBv16i8 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1638
1639def : Pat<(or (and (v16i8 VECREG:$rA), (v16i8 VECREG:$rC)),
1640 (and (vnot (v16i8 VECREG:$rC)), (v16i8 VECREG:$rB))),
1641 (SELBv16i8 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1642
1643def : Pat<(or (and (v16i8 VECREG:$rC), (v16i8 VECREG:$rA)),
1644 (and (vnot (v16i8 VECREG:$rC)), (v16i8 VECREG:$rB))),
1645 (SELBv16i8 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1646
1647def : Pat<(or (and (v16i8 VECREG:$rA), (vnot (v16i8 VECREG:$rC))),
1648 (and (v16i8 VECREG:$rB), (v16i8 VECREG:$rC))),
1649 (SELBv16i8 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1650
1651def : Pat<(or (and (v16i8 VECREG:$rA), (vnot (v16i8 VECREG:$rC))),
1652 (and (v16i8 VECREG:$rC), (v16i8 VECREG:$rB))),
1653 (SELBv16i8 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1654
1655def : Pat<(or (and (vnot (v16i8 VECREG:$rC)), (v16i8 VECREG:$rA)),
1656 (and (v16i8 VECREG:$rB), (v16i8 VECREG:$rC))),
1657 (SELBv16i8 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1658
1659def : Pat<(or (and (vnot (v16i8 VECREG:$rC)), (v16i8 VECREG:$rA)),
1660 (and (v16i8 VECREG:$rC), (v16i8 VECREG:$rB))),
1661 (SELBv16i8 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1662
1663def SELBv8i16:
1664 RRRForm<0b1000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB, VECREG:$rC),
1665 "selb\t$rT, $rA, $rB, $rC", IntegerOp,
1666 [(set (v8i16 VECREG:$rT),
Scott Michel97872d32008-02-23 18:41:37 +00001667 (SPUselb (v8i16 VECREG:$rA), (v8i16 VECREG:$rB),
Scott Michel8b6b4202007-12-04 22:35:58 +00001668 (v8i16 VECREG:$rC)))]>;
1669
1670def : Pat<(or (and (v8i16 VECREG:$rA), (v8i16 VECREG:$rC)),
1671 (and (v8i16 VECREG:$rB), (vnot (v8i16 VECREG:$rC)))),
1672 (SELBv8i16 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1673
1674def : Pat<(or (and (v8i16 VECREG:$rC), (v8i16 VECREG:$rA)),
1675 (and (v8i16 VECREG:$rB), (vnot (v8i16 VECREG:$rC)))),
1676 (SELBv8i16 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1677
1678def : Pat<(or (and (v8i16 VECREG:$rA), (v8i16 VECREG:$rC)),
1679 (and (vnot (v8i16 VECREG:$rC)), (v8i16 VECREG:$rB))),
1680 (SELBv8i16 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1681
1682def : Pat<(or (and (v8i16 VECREG:$rC), (v8i16 VECREG:$rA)),
1683 (and (vnot (v8i16 VECREG:$rC)), (v8i16 VECREG:$rB))),
1684 (SELBv8i16 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1685
1686def : Pat<(or (and (v8i16 VECREG:$rA), (vnot (v8i16 VECREG:$rC))),
1687 (and (v8i16 VECREG:$rB), (v8i16 VECREG:$rC))),
1688 (SELBv8i16 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1689
1690def : Pat<(or (and (v8i16 VECREG:$rA), (vnot (v8i16 VECREG:$rC))),
1691 (and (v8i16 VECREG:$rC), (v8i16 VECREG:$rB))),
1692 (SELBv8i16 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1693
1694def : Pat<(or (and (vnot (v8i16 VECREG:$rC)), (v8i16 VECREG:$rA)),
1695 (and (v8i16 VECREG:$rB), (v8i16 VECREG:$rC))),
1696 (SELBv8i16 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1697
1698def : Pat<(or (and (vnot (v8i16 VECREG:$rC)), (v8i16 VECREG:$rA)),
1699 (and (v8i16 VECREG:$rC), (v8i16 VECREG:$rB))),
1700 (SELBv8i16 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1701
1702def : Pat<(or (and (v8i16 VECREG:$rA), (v8i16 VECREG:$rC)),
1703 (and (v8i16 VECREG:$rB), (vnot (v8i16 VECREG:$rC)))),
1704 (SELBv8i16 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1705
1706def : Pat<(or (and (v8i16 VECREG:$rC), (v8i16 VECREG:$rA)),
1707 (and (v8i16 VECREG:$rB), (vnot (v8i16 VECREG:$rC)))),
1708 (SELBv8i16 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1709
1710def : Pat<(or (and (v8i16 VECREG:$rA), (v8i16 VECREG:$rC)),
1711 (and (vnot (v8i16 VECREG:$rC)), (v8i16 VECREG:$rB))),
1712 (SELBv8i16 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1713
1714def : Pat<(or (and (v8i16 VECREG:$rC), (v8i16 VECREG:$rA)),
1715 (and (vnot (v8i16 VECREG:$rC)), (v8i16 VECREG:$rB))),
1716 (SELBv8i16 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1717
1718def : Pat<(or (and (v8i16 VECREG:$rA), (vnot (v8i16 VECREG:$rC))),
1719 (and (v8i16 VECREG:$rB), (v8i16 VECREG:$rC))),
1720 (SELBv8i16 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1721
1722def : Pat<(or (and (v8i16 VECREG:$rA), (vnot (v8i16 VECREG:$rC))),
1723 (and (v8i16 VECREG:$rC), (v8i16 VECREG:$rB))),
1724 (SELBv8i16 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1725
1726def : Pat<(or (and (vnot (v8i16 VECREG:$rC)), (v8i16 VECREG:$rA)),
1727 (and (v8i16 VECREG:$rB), (v8i16 VECREG:$rC))),
1728 (SELBv8i16 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1729
1730def : Pat<(or (and (vnot (v8i16 VECREG:$rC)), (v8i16 VECREG:$rA)),
1731 (and (v8i16 VECREG:$rC), (v8i16 VECREG:$rB))),
1732 (SELBv8i16 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1733
1734def SELBv4i32:
1735 RRRForm<0b1000, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB, VECREG:$rC),
1736 "selb\t$rT, $rA, $rB, $rC", IntegerOp,
1737 [(set (v4i32 VECREG:$rT),
Scott Michel97872d32008-02-23 18:41:37 +00001738 (SPUselb (v4i32 VECREG:$rA), (v4i32 VECREG:$rB),
Scott Michel8b6b4202007-12-04 22:35:58 +00001739 (v4i32 VECREG:$rC)))]>;
1740
1741def : Pat<(or (and (v4i32 VECREG:$rA), (v4i32 VECREG:$rC)),
1742 (and (v4i32 VECREG:$rB), (vnot (v4i32 VECREG:$rC)))),
1743 (SELBv4i32 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1744
1745def : Pat<(or (and (v4i32 VECREG:$rC), (v4i32 VECREG:$rA)),
1746 (and (v4i32 VECREG:$rB), (vnot (v4i32 VECREG:$rC)))),
1747 (SELBv4i32 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1748
1749def : Pat<(or (and (v4i32 VECREG:$rA), (v4i32 VECREG:$rC)),
1750 (and (vnot (v4i32 VECREG:$rC)), (v4i32 VECREG:$rB))),
1751 (SELBv4i32 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1752
1753def : Pat<(or (and (v4i32 VECREG:$rC), (v4i32 VECREG:$rA)),
1754 (and (vnot (v4i32 VECREG:$rC)), (v4i32 VECREG:$rB))),
1755 (SELBv4i32 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1756
1757def : Pat<(or (and (v4i32 VECREG:$rA), (vnot (v4i32 VECREG:$rC))),
1758 (and (v4i32 VECREG:$rB), (v4i32 VECREG:$rC))),
1759 (SELBv4i32 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1760
1761def : Pat<(or (and (v4i32 VECREG:$rA), (vnot (v4i32 VECREG:$rC))),
1762 (and (v4i32 VECREG:$rC), (v4i32 VECREG:$rB))),
1763 (SELBv4i32 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1764
1765def : Pat<(or (and (vnot (v4i32 VECREG:$rC)), (v4i32 VECREG:$rA)),
1766 (and (v4i32 VECREG:$rB), (v4i32 VECREG:$rC))),
1767 (SELBv4i32 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1768
1769def : Pat<(or (and (vnot (v4i32 VECREG:$rC)), (v4i32 VECREG:$rA)),
1770 (and (v4i32 VECREG:$rC), (v4i32 VECREG:$rB))),
1771 (SELBv4i32 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1772
1773def : Pat<(or (and (v4i32 VECREG:$rA), (v4i32 VECREG:$rC)),
1774 (and (v4i32 VECREG:$rB), (vnot (v4i32 VECREG:$rC)))),
1775 (SELBv4i32 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1776
1777def : Pat<(or (and (v4i32 VECREG:$rC), (v4i32 VECREG:$rA)),
1778 (and (v4i32 VECREG:$rB), (vnot (v4i32 VECREG:$rC)))),
1779 (SELBv4i32 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1780
1781def : Pat<(or (and (v4i32 VECREG:$rA), (v4i32 VECREG:$rC)),
1782 (and (vnot (v4i32 VECREG:$rC)), (v4i32 VECREG:$rB))),
1783 (SELBv4i32 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1784
1785def : Pat<(or (and (v4i32 VECREG:$rC), (v4i32 VECREG:$rA)),
1786 (and (vnot (v4i32 VECREG:$rC)), (v4i32 VECREG:$rB))),
1787 (SELBv4i32 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1788
1789def : Pat<(or (and (v4i32 VECREG:$rA), (vnot (v4i32 VECREG:$rC))),
1790 (and (v4i32 VECREG:$rB), (v4i32 VECREG:$rC))),
1791 (SELBv4i32 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1792
1793def : Pat<(or (and (v4i32 VECREG:$rA), (vnot (v4i32 VECREG:$rC))),
1794 (and (v4i32 VECREG:$rC), (v4i32 VECREG:$rB))),
1795 (SELBv4i32 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1796
1797def : Pat<(or (and (vnot (v4i32 VECREG:$rC)), (v4i32 VECREG:$rA)),
1798 (and (v4i32 VECREG:$rB), (v4i32 VECREG:$rC))),
1799 (SELBv4i32 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1800
1801def : Pat<(or (and (vnot (v4i32 VECREG:$rC)), (v4i32 VECREG:$rA)),
1802 (and (v4i32 VECREG:$rC), (v4i32 VECREG:$rB))),
1803 (SELBv4i32 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
1804
1805def SELBr32:
1806 RRRForm<0b1000, (outs R32C:$rT), (ins R32C:$rA, R32C:$rB, R32C:$rC),
1807 "selb\t$rT, $rA, $rB, $rC", IntegerOp,
1808 []>;
1809
1810// And the various patterns that can be matched... (all 8 of them :-)
1811def : Pat<(or (and R32C:$rA, R32C:$rC),
1812 (and R32C:$rB, (not R32C:$rC))),
1813 (SELBr32 R32C:$rA, R32C:$rB, R32C:$rC)>;
1814
1815def : Pat<(or (and R32C:$rC, R32C:$rA),
1816 (and R32C:$rB, (not R32C:$rC))),
1817 (SELBr32 R32C:$rA, R32C:$rB, R32C:$rC)>;
1818
1819def : Pat<(or (and R32C:$rA, R32C:$rC),
1820 (and (not R32C:$rC), R32C:$rB)),
1821 (SELBr32 R32C:$rA, R32C:$rB, R32C:$rC)>;
1822
1823def : Pat<(or (and R32C:$rC, R32C:$rA),
1824 (and (not R32C:$rC), R32C:$rB)),
1825 (SELBr32 R32C:$rA, R32C:$rB, R32C:$rC)>;
1826
1827def : Pat<(or (and R32C:$rA, (not R32C:$rC)),
1828 (and R32C:$rB, R32C:$rC)),
1829 (SELBr32 R32C:$rA, R32C:$rB, R32C:$rC)>;
1830
1831def : Pat<(or (and R32C:$rA, (not R32C:$rC)),
1832 (and R32C:$rC, R32C:$rB)),
1833 (SELBr32 R32C:$rA, R32C:$rB, R32C:$rC)>;
1834
1835def : Pat<(or (and (not R32C:$rC), R32C:$rA),
1836 (and R32C:$rB, R32C:$rC)),
1837 (SELBr32 R32C:$rA, R32C:$rB, R32C:$rC)>;
1838
1839def : Pat<(or (and (not R32C:$rC), R32C:$rA),
1840 (and R32C:$rC, R32C:$rB)),
1841 (SELBr32 R32C:$rA, R32C:$rB, R32C:$rC)>;
1842
1843def SELBr16:
1844 RRRForm<0b1000, (outs R16C:$rT), (ins R16C:$rA, R16C:$rB, R16C:$rC),
1845 "selb\t$rT, $rA, $rB, $rC", IntegerOp,
1846 []>;
1847
1848def : Pat<(or (and R16C:$rA, R16C:$rC),
1849 (and R16C:$rB, (not R16C:$rC))),
1850 (SELBr16 R16C:$rA, R16C:$rB, R16C:$rC)>;
1851
1852def : Pat<(or (and R16C:$rC, R16C:$rA),
1853 (and R16C:$rB, (not R16C:$rC))),
1854 (SELBr16 R16C:$rA, R16C:$rB, R16C:$rC)>;
1855
1856def : Pat<(or (and R16C:$rA, R16C:$rC),
1857 (and (not R16C:$rC), R16C:$rB)),
1858 (SELBr16 R16C:$rA, R16C:$rB, R16C:$rC)>;
1859
1860def : Pat<(or (and R16C:$rC, R16C:$rA),
1861 (and (not R16C:$rC), R16C:$rB)),
1862 (SELBr16 R16C:$rA, R16C:$rB, R16C:$rC)>;
1863
1864def : Pat<(or (and R16C:$rA, (not R16C:$rC)),
1865 (and R16C:$rB, R16C:$rC)),
1866 (SELBr16 R16C:$rA, R16C:$rB, R16C:$rC)>;
1867
1868def : Pat<(or (and R16C:$rA, (not R16C:$rC)),
1869 (and R16C:$rC, R16C:$rB)),
1870 (SELBr16 R16C:$rA, R16C:$rB, R16C:$rC)>;
1871
1872def : Pat<(or (and (not R16C:$rC), R16C:$rA),
1873 (and R16C:$rB, R16C:$rC)),
1874 (SELBr16 R16C:$rA, R16C:$rB, R16C:$rC)>;
1875
1876def : Pat<(or (and (not R16C:$rC), R16C:$rA),
1877 (and R16C:$rC, R16C:$rB)),
1878 (SELBr16 R16C:$rA, R16C:$rB, R16C:$rC)>;
Scott Michel438be252007-12-17 22:32:34 +00001879
1880def SELBr8:
1881 RRRForm<0b1000, (outs R8C:$rT), (ins R8C:$rA, R8C:$rB, R8C:$rC),
1882 "selb\t$rT, $rA, $rB, $rC", IntegerOp,
1883 []>;
1884
1885def : Pat<(or (and R8C:$rA, R8C:$rC),
1886 (and R8C:$rB, (not R8C:$rC))),
1887 (SELBr8 R8C:$rA, R8C:$rB, R8C:$rC)>;
1888
1889def : Pat<(or (and R8C:$rC, R8C:$rA),
1890 (and R8C:$rB, (not R8C:$rC))),
1891 (SELBr8 R8C:$rA, R8C:$rB, R8C:$rC)>;
1892
1893def : Pat<(or (and R8C:$rA, R8C:$rC),
1894 (and (not R8C:$rC), R8C:$rB)),
1895 (SELBr8 R8C:$rA, R8C:$rB, R8C:$rC)>;
1896
1897def : Pat<(or (and R8C:$rC, R8C:$rA),
1898 (and (not R8C:$rC), R8C:$rB)),
1899 (SELBr8 R8C:$rA, R8C:$rB, R8C:$rC)>;
1900
1901def : Pat<(or (and R8C:$rA, (not R8C:$rC)),
1902 (and R8C:$rB, R8C:$rC)),
1903 (SELBr8 R8C:$rA, R8C:$rB, R8C:$rC)>;
1904
1905def : Pat<(or (and R8C:$rA, (not R8C:$rC)),
1906 (and R8C:$rC, R8C:$rB)),
1907 (SELBr8 R8C:$rA, R8C:$rB, R8C:$rC)>;
1908
1909def : Pat<(or (and (not R8C:$rC), R8C:$rA),
1910 (and R8C:$rB, R8C:$rC)),
1911 (SELBr8 R8C:$rA, R8C:$rB, R8C:$rC)>;
1912
1913def : Pat<(or (and (not R8C:$rC), R8C:$rA),
1914 (and R8C:$rC, R8C:$rB)),
1915 (SELBr8 R8C:$rA, R8C:$rB, R8C:$rC)>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001916
1917//===----------------------------------------------------------------------===//
1918// Vector shuffle...
1919//===----------------------------------------------------------------------===//
Scott Michel8b6b4202007-12-04 22:35:58 +00001920// SPUshuffle is generated in LowerVECTOR_SHUFFLE and gets replaced with SHUFB.
1921// See the SPUshuffle SDNode operand above, which sets up the DAG pattern
1922// matcher to emit something when the LowerVECTOR_SHUFFLE generates a node with
1923// the SPUISD::SHUFB opcode.
Scott Michel97872d32008-02-23 18:41:37 +00001924//===----------------------------------------------------------------------===//
Scott Michel8b6b4202007-12-04 22:35:58 +00001925
Scott Michel97872d32008-02-23 18:41:37 +00001926class SHUFBInst<dag OOL, dag IOL, list<dag> pattern>:
1927 RRRForm<0b1000, OOL, IOL, "shufb\t$rT, $rA, $rB, $rC",
1928 IntegerOp, pattern>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001929
Scott Michel97872d32008-02-23 18:41:37 +00001930class SHUFBVecInst<ValueType vectype>:
1931 SHUFBInst<(outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB, VECREG:$rC),
1932 [(set (vectype VECREG:$rT), (SPUshuffle (vectype VECREG:$rA),
1933 (vectype VECREG:$rB),
1934 (vectype VECREG:$rC)))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001935
Scott Michel97872d32008-02-23 18:41:37 +00001936// It's this pattern that's probably the most useful, since SPUISelLowering
1937// methods create a v16i8 vector for $rC:
1938class SHUFBVecPat1<ValueType vectype, SPUInstr inst>:
1939 Pat<(SPUshuffle (vectype VECREG:$rA), (vectype VECREG:$rB),
1940 (v16i8 VECREG:$rC)),
1941 (inst VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
Scott Michel754d8662007-12-20 00:44:13 +00001942
Scott Michel97872d32008-02-23 18:41:37 +00001943multiclass ShuffleBytes
1944{
1945 def v16i8 : SHUFBVecInst<v16i8>;
1946 def v8i16 : SHUFBVecInst<v8i16>;
1947 def v4i32 : SHUFBVecInst<v4i32>;
1948 def v2i64 : SHUFBVecInst<v2i64>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001949
Scott Michel97872d32008-02-23 18:41:37 +00001950 def v4f32 : SHUFBVecInst<v4f32>;
1951 def v2f64 : SHUFBVecInst<v2f64>;
1952}
1953
1954defm SHUFB : ShuffleBytes;
1955
1956def : SHUFBVecPat1<v8i16, SHUFBv16i8>;
1957def : SHUFBVecPat1<v4i32, SHUFBv16i8>;
1958def : SHUFBVecPat1<v2i64, SHUFBv16i8>;
1959def : SHUFBVecPat1<v4f32, SHUFBv16i8>;
1960def : SHUFBVecPat1<v2f64, SHUFBv16i8>;
Scott Michel754d8662007-12-20 00:44:13 +00001961
Scott Michel8b6b4202007-12-04 22:35:58 +00001962//===----------------------------------------------------------------------===//
1963// Shift and rotate group:
1964//===----------------------------------------------------------------------===//
1965
Scott Michel97872d32008-02-23 18:41:37 +00001966class SHLHInst<dag OOL, dag IOL, list<dag> pattern>:
1967 RRForm<0b11111010000, OOL, IOL, "shlh\t$rT, $rA, $rB",
1968 RotateShift, pattern>;
1969
1970class SHLHVecInst<ValueType vectype>:
1971 SHLHInst<(outs VECREG:$rT), (ins VECREG:$rA, R16C:$rB),
1972 [(set (vectype VECREG:$rT),
1973 (SPUvec_shl (vectype VECREG:$rA), R16C:$rB))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001974
1975// $rB gets promoted to 32-bit register type when confronted with
1976// this llvm assembly code:
1977//
1978// define i16 @shlh_i16_1(i16 %arg1, i16 %arg2) {
1979// %A = shl i16 %arg1, %arg2
1980// ret i16 %A
1981// }
Scott Michel8b6b4202007-12-04 22:35:58 +00001982
Scott Michel97872d32008-02-23 18:41:37 +00001983multiclass ShiftLeftHalfword
1984{
1985 def v8i16: SHLHVecInst<v8i16>;
1986 def r16: SHLHInst<(outs R16C:$rT), (ins R16C:$rA, R16C:$rB),
1987 [(set R16C:$rT, (shl R16C:$rA, R16C:$rB))]>;
1988 def r16_r32: SHLHInst<(outs R16C:$rT), (ins R16C:$rA, R32C:$rB),
1989 [(set R16C:$rT, (shl R16C:$rA, R32C:$rB))]>;
1990}
Scott Michel8b6b4202007-12-04 22:35:58 +00001991
Scott Michel97872d32008-02-23 18:41:37 +00001992defm SHLH : ShiftLeftHalfword;
Scott Michel8b6b4202007-12-04 22:35:58 +00001993
Scott Michel97872d32008-02-23 18:41:37 +00001994//===----------------------------------------------------------------------===//
Scott Michel438be252007-12-17 22:32:34 +00001995
Scott Michel97872d32008-02-23 18:41:37 +00001996class SHLHIInst<dag OOL, dag IOL, list<dag> pattern>:
1997 RI7Form<0b11111010000, OOL, IOL, "shlhi\t$rT, $rA, $val",
1998 RotateShift, pattern>;
Scott Michel8b6b4202007-12-04 22:35:58 +00001999
Scott Michel97872d32008-02-23 18:41:37 +00002000class SHLHIVecInst<ValueType vectype>:
2001 SHLHIInst<(outs VECREG:$rT), (ins VECREG:$rA, u7imm:$val),
2002 [(set (vectype VECREG:$rT),
2003 (SPUvec_shl (vectype VECREG:$rA), (i16 uimm7:$val)))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002004
Scott Michel97872d32008-02-23 18:41:37 +00002005multiclass ShiftLeftHalfwordImm
2006{
2007 def v8i16: SHLHIVecInst<v8i16>;
2008 def r16: SHLHIInst<(outs R16C:$rT), (ins R16C:$rA, u7imm:$val),
2009 [(set R16C:$rT, (shl R16C:$rA, (i16 uimm7:$val)))]>;
2010}
2011
2012defm SHLHI : ShiftLeftHalfwordImm;
2013
2014def : Pat<(SPUvec_shl (v8i16 VECREG:$rA), (i32 uimm7:$val)),
2015 (SHLHIv8i16 VECREG:$rA, uimm7:$val)>;
2016
2017def : Pat<(shl R16C:$rA, (i32 uimm7:$val)),
Scott Michel438be252007-12-17 22:32:34 +00002018 (SHLHIr16 R16C:$rA, uimm7:$val)>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002019
Scott Michel97872d32008-02-23 18:41:37 +00002020//===----------------------------------------------------------------------===//
Scott Michel8b6b4202007-12-04 22:35:58 +00002021
Scott Michel97872d32008-02-23 18:41:37 +00002022class SHLInst<dag OOL, dag IOL, list<dag> pattern>:
2023 RRForm<0b11111010000, OOL, IOL, "shl\t$rT, $rA, $rB",
2024 RotateShift, pattern>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002025
Scott Michel97872d32008-02-23 18:41:37 +00002026multiclass ShiftLeftWord
2027{
2028 def v4i32:
2029 SHLInst<(outs VECREG:$rT), (ins VECREG:$rA, R16C:$rB),
2030 [(set (v4i32 VECREG:$rT),
2031 (SPUvec_shl (v4i32 VECREG:$rA), R16C:$rB))]>;
2032 def r32:
2033 SHLInst<(outs R32C:$rT), (ins R32C:$rA, R32C:$rB),
2034 [(set R32C:$rT, (shl R32C:$rA, R32C:$rB))]>;
2035}
Scott Michel8b6b4202007-12-04 22:35:58 +00002036
Scott Michel97872d32008-02-23 18:41:37 +00002037defm SHL: ShiftLeftWord;
Scott Michel438be252007-12-17 22:32:34 +00002038
Scott Michel97872d32008-02-23 18:41:37 +00002039//===----------------------------------------------------------------------===//
Scott Michel8b6b4202007-12-04 22:35:58 +00002040
Scott Michel97872d32008-02-23 18:41:37 +00002041class SHLIInst<dag OOL, dag IOL, list<dag> pattern>:
2042 RI7Form<0b11111010000, OOL, IOL, "shli\t$rT, $rA, $val",
2043 RotateShift, pattern>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002044
Scott Michel97872d32008-02-23 18:41:37 +00002045multiclass ShiftLeftWordImm
2046{
2047 def v4i32:
2048 SHLIInst<(outs VECREG:$rT), (ins VECREG:$rA, u7imm_i32:$val),
2049 [(set (v4i32 VECREG:$rT),
2050 (SPUvec_shl (v4i32 VECREG:$rA), (i32 uimm7:$val)))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002051
Scott Michel97872d32008-02-23 18:41:37 +00002052 def r32:
2053 SHLIInst<(outs R32C:$rT), (ins R32C:$rA, u7imm_i32:$val),
2054 [(set R32C:$rT, (shl R32C:$rA, (i32 uimm7:$val)))]>;
2055}
Scott Michel8b6b4202007-12-04 22:35:58 +00002056
Scott Michel97872d32008-02-23 18:41:37 +00002057defm SHLI : ShiftLeftWordImm;
Scott Michel438be252007-12-17 22:32:34 +00002058
Scott Michel97872d32008-02-23 18:41:37 +00002059//===----------------------------------------------------------------------===//
Scott Michel8b6b4202007-12-04 22:35:58 +00002060// SHLQBI vec form: Note that this will shift the entire vector (the 128-bit
2061// register) to the left. Vector form is here to ensure type correctness.
Scott Michel97872d32008-02-23 18:41:37 +00002062//
2063// The shift count is in the lowest 3 bits (29-31) of $rB, so only a bit shift
2064// of 7 bits is actually possible.
2065//
2066// Note also that SHLQBI/SHLQBII are used in conjunction with SHLQBY/SHLQBYI
2067// to shift i64 and i128. SHLQBI is the residual left over after shifting by
2068// bytes with SHLQBY.
Scott Michel8b6b4202007-12-04 22:35:58 +00002069
Scott Michel97872d32008-02-23 18:41:37 +00002070class SHLQBIInst<dag OOL, dag IOL, list<dag> pattern>:
2071 RRForm<0b11011011100, OOL, IOL, "shlqbi\t$rT, $rA, $rB",
2072 RotateShift, pattern>;
2073
2074class SHLQBIVecInst<ValueType vectype>:
2075 SHLQBIInst<(outs VECREG:$rT), (ins VECREG:$rA, R32C:$rB),
2076 [(set (vectype VECREG:$rT),
2077 (SPUshlquad_l_bits (vectype VECREG:$rA), R32C:$rB))]>;
2078
2079multiclass ShiftLeftQuadByBits
2080{
2081 def v16i8: SHLQBIVecInst<v16i8>;
2082 def v8i16: SHLQBIVecInst<v8i16>;
2083 def v4i32: SHLQBIVecInst<v4i32>;
2084 def v2i64: SHLQBIVecInst<v2i64>;
2085}
2086
2087defm SHLQBI : ShiftLeftQuadByBits;
2088
2089// See note above on SHLQBI. In this case, the predicate actually does then
2090// enforcement, whereas with SHLQBI, we have to "take it on faith."
2091class SHLQBIIInst<dag OOL, dag IOL, list<dag> pattern>:
2092 RI7Form<0b11011111100, OOL, IOL, "shlqbii\t$rT, $rA, $val",
2093 RotateShift, pattern>;
2094
2095class SHLQBIIVecInst<ValueType vectype>:
2096 SHLQBIIInst<(outs VECREG:$rT), (ins VECREG:$rA, u7imm_i32:$val),
2097 [(set (vectype VECREG:$rT),
2098 (SPUshlquad_l_bits (vectype VECREG:$rA), (i32 bitshift:$val)))]>;
2099
2100multiclass ShiftLeftQuadByBitsImm
2101{
2102 def v16i8 : SHLQBIIVecInst<v16i8>;
2103 def v8i16 : SHLQBIIVecInst<v8i16>;
2104 def v4i32 : SHLQBIIVecInst<v4i32>;
2105 def v2i64 : SHLQBIIVecInst<v2i64>;
2106}
2107
2108defm SHLQBII : ShiftLeftQuadByBitsImm;
Scott Michel8b6b4202007-12-04 22:35:58 +00002109
2110// SHLQBY, SHLQBYI vector forms: Shift the entire vector to the left by bytes,
Scott Michel97872d32008-02-23 18:41:37 +00002111// not by bits. See notes above on SHLQBI.
Scott Michel8b6b4202007-12-04 22:35:58 +00002112
Scott Michel97872d32008-02-23 18:41:37 +00002113class SHLQBYInst<dag OOL, dag IOL, list<dag> pattern>:
2114 RI7Form<0b11111011100, OOL, IOL, "shlqbyi\t$rT, $rA, $rB",
2115 RotateShift, pattern>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002116
Scott Michel97872d32008-02-23 18:41:37 +00002117class SHLQBYVecInst<ValueType vectype>:
2118 SHLQBYInst<(outs VECREG:$rT), (ins VECREG:$rA, R32C:$rB),
2119 [(set (vectype VECREG:$rT),
2120 (SPUshlquad_l_bytes (vectype VECREG:$rA), R32C:$rB))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002121
Scott Michel97872d32008-02-23 18:41:37 +00002122multiclass ShiftLeftQuadBytes
2123{
2124 def v16i8: SHLQBYVecInst<v16i8>;
2125 def v8i16: SHLQBYVecInst<v8i16>;
2126 def v4i32: SHLQBYVecInst<v4i32>;
2127 def v2i64: SHLQBYVecInst<v2i64>;
2128 def r128: SHLQBYInst<(outs GPRC:$rT), (ins GPRC:$rA, R32C:$rB),
2129 [(set GPRC:$rT, (SPUshlquad_l_bytes GPRC:$rA, R32C:$rB))]>;
2130}
Scott Michel8b6b4202007-12-04 22:35:58 +00002131
Scott Michel97872d32008-02-23 18:41:37 +00002132defm SHLQBY: ShiftLeftQuadBytes;
Scott Michel8b6b4202007-12-04 22:35:58 +00002133
Scott Michel97872d32008-02-23 18:41:37 +00002134class SHLQBYIInst<dag OOL, dag IOL, list<dag> pattern>:
2135 RI7Form<0b11111111100, OOL, IOL, "shlqbyi\t$rT, $rA, $val",
2136 RotateShift, pattern>;
Scott Michel438be252007-12-17 22:32:34 +00002137
Scott Michel97872d32008-02-23 18:41:37 +00002138class SHLQBYIVecInst<ValueType vectype>:
2139 SHLQBYIInst<(outs VECREG:$rT), (ins VECREG:$rA, u7imm_i32:$val),
2140 [(set (vectype VECREG:$rT),
2141 (SPUshlquad_l_bytes (vectype VECREG:$rA), (i32 uimm7:$val)))]>;
Scott Michel438be252007-12-17 22:32:34 +00002142
Scott Michel97872d32008-02-23 18:41:37 +00002143multiclass ShiftLeftQuadBytesImm
2144{
2145 def v16i8: SHLQBYIVecInst<v16i8>;
2146 def v8i16: SHLQBYIVecInst<v8i16>;
2147 def v4i32: SHLQBYIVecInst<v4i32>;
2148 def v2i64: SHLQBYIVecInst<v2i64>;
2149 def r128: SHLQBYIInst<(outs GPRC:$rT), (ins GPRC:$rA, u7imm_i32:$val),
2150 [(set GPRC:$rT,
2151 (SPUshlquad_l_bytes GPRC:$rA, (i32 uimm7:$val)))]>;
2152}
Scott Michel438be252007-12-17 22:32:34 +00002153
Scott Michel97872d32008-02-23 18:41:37 +00002154defm SHLQBYI : ShiftLeftQuadBytesImm;
Scott Michel438be252007-12-17 22:32:34 +00002155
Scott Michel97872d32008-02-23 18:41:37 +00002156// Special form for truncating i64 to i32:
2157def SHLQBYItrunc64: SHLQBYIInst<(outs R32C:$rT), (ins R64C:$rA, u7imm_i32:$val),
2158 [/* no pattern, see below */]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002159
Scott Michel97872d32008-02-23 18:41:37 +00002160def : Pat<(trunc R64C:$rSrc),
2161 (SHLQBYItrunc64 R64C:$rSrc, 4)>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002162
Scott Michel97872d32008-02-23 18:41:37 +00002163//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
2164// Rotate halfword:
2165//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
2166class ROTHInst<dag OOL, dag IOL, list<dag> pattern>:
2167 RRForm<0b00111010000, OOL, IOL, "roth\t$rT, $rA, $rB",
2168 RotateShift, pattern>;
2169
2170class ROTHVecInst<ValueType vectype>:
2171 ROTHInst<(outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
2172 [(set (vectype VECREG:$rT),
2173 (SPUvec_rotl VECREG:$rA, VECREG:$rB))]>;
2174
2175class ROTHRegInst<RegisterClass rclass>:
2176 ROTHInst<(outs rclass:$rT), (ins rclass:$rA, rclass:$rB),
2177 [(set rclass:$rT, (rotl rclass:$rA, rclass:$rB))]>;
2178
2179multiclass RotateLeftHalfword
2180{
2181 def v8i16: ROTHVecInst<v8i16>;
2182 def r16: ROTHRegInst<R16C>;
2183}
2184
2185defm ROTH: RotateLeftHalfword;
2186
2187def ROTHr16_r32: ROTHInst<(outs R16C:$rT), (ins R16C:$rA, R32C:$rB),
2188 [(set R16C:$rT, (rotl R16C:$rA, R32C:$rB))]>;
2189
2190//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
2191// Rotate halfword, immediate:
2192//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
2193class ROTHIInst<dag OOL, dag IOL, list<dag> pattern>:
2194 RI7Form<0b00111110000, OOL, IOL, "rothi\t$rT, $rA, $val",
2195 RotateShift, pattern>;
2196
2197class ROTHIVecInst<ValueType vectype>:
2198 ROTHIInst<(outs VECREG:$rT), (ins VECREG:$rA, u7imm:$val),
2199 [(set (vectype VECREG:$rT),
2200 (SPUvec_rotl VECREG:$rA, (i16 uimm7:$val)))]>;
2201
2202multiclass RotateLeftHalfwordImm
2203{
2204 def v8i16: ROTHIVecInst<v8i16>;
2205 def r16: ROTHIInst<(outs R16C:$rT), (ins R16C:$rA, u7imm:$val),
2206 [(set R16C:$rT, (rotl R16C:$rA, (i16 uimm7:$val)))]>;
2207 def r16_r32: ROTHIInst<(outs R16C:$rT), (ins R16C:$rA, u7imm_i32:$val),
2208 [(set R16C:$rT, (rotl R16C:$rA, (i32 uimm7:$val)))]>;
2209}
2210
2211defm ROTHI: RotateLeftHalfwordImm;
2212
2213def : Pat<(SPUvec_rotl VECREG:$rA, (i32 uimm7:$val)),
Scott Michel8b6b4202007-12-04 22:35:58 +00002214 (ROTHIv8i16 VECREG:$rA, imm:$val)>;
2215
Scott Michel97872d32008-02-23 18:41:37 +00002216//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
2217// Rotate word:
2218//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
Scott Michel8b6b4202007-12-04 22:35:58 +00002219
Scott Michel97872d32008-02-23 18:41:37 +00002220class ROTInst<dag OOL, dag IOL, list<dag> pattern>:
2221 RRForm<0b00011010000, OOL, IOL, "rot\t$rT, $rA, $rB",
2222 RotateShift, pattern>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002223
Scott Michel97872d32008-02-23 18:41:37 +00002224class ROTVecInst<ValueType vectype>:
2225 ROTInst<(outs VECREG:$rT), (ins VECREG:$rA, R32C:$rB),
2226 [(set (vectype VECREG:$rT),
2227 (SPUvec_rotl (vectype VECREG:$rA), R32C:$rB))]>;
Scott Michel438be252007-12-17 22:32:34 +00002228
Scott Michel97872d32008-02-23 18:41:37 +00002229class ROTRegInst<RegisterClass rclass>:
2230 ROTInst<(outs rclass:$rT), (ins rclass:$rA, R32C:$rB),
2231 [(set rclass:$rT,
2232 (rotl rclass:$rA, R32C:$rB))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002233
Scott Michel97872d32008-02-23 18:41:37 +00002234multiclass RotateLeftWord
2235{
2236 def v4i32: ROTVecInst<v4i32>;
2237 def r32: ROTRegInst<R32C>;
2238}
2239
2240defm ROT: RotateLeftWord;
Scott Michel8b6b4202007-12-04 22:35:58 +00002241
Scott Michel438be252007-12-17 22:32:34 +00002242// The rotate amount is in the same bits whether we've got an 8-bit, 16-bit or
2243// 32-bit register
2244def ROTr32_r16_anyext:
Scott Michel97872d32008-02-23 18:41:37 +00002245 ROTInst<(outs R32C:$rT), (ins R32C:$rA, R16C:$rB),
2246 [(set R32C:$rT, (rotl R32C:$rA, (i32 (anyext R16C:$rB))))]>;
Scott Michel438be252007-12-17 22:32:34 +00002247
2248def : Pat<(rotl R32C:$rA, (i32 (zext R16C:$rB))),
2249 (ROTr32_r16_anyext R32C:$rA, R16C:$rB)>;
2250
2251def : Pat<(rotl R32C:$rA, (i32 (sext R16C:$rB))),
2252 (ROTr32_r16_anyext R32C:$rA, R16C:$rB)>;
2253
2254def ROTr32_r8_anyext:
Scott Michel97872d32008-02-23 18:41:37 +00002255 ROTInst<(outs R32C:$rT), (ins R32C:$rA, R8C:$rB),
2256 [(set R32C:$rT, (rotl R32C:$rA, (i32 (anyext R8C:$rB))))]>;
Scott Michel438be252007-12-17 22:32:34 +00002257
2258def : Pat<(rotl R32C:$rA, (i32 (zext R8C:$rB))),
2259 (ROTr32_r8_anyext R32C:$rA, R8C:$rB)>;
2260
2261def : Pat<(rotl R32C:$rA, (i32 (sext R8C:$rB))),
2262 (ROTr32_r8_anyext R32C:$rA, R8C:$rB)>;
2263
Scott Michel97872d32008-02-23 18:41:37 +00002264//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
2265// Rotate word, immediate
2266//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
Scott Michel8b6b4202007-12-04 22:35:58 +00002267
Scott Michel97872d32008-02-23 18:41:37 +00002268class ROTIInst<dag OOL, dag IOL, list<dag> pattern>:
2269 RI7Form<0b00011110000, OOL, IOL, "roti\t$rT, $rA, $val",
2270 RotateShift, pattern>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002271
Scott Michel97872d32008-02-23 18:41:37 +00002272class ROTIVecInst<ValueType vectype, Operand optype, ValueType inttype, PatLeaf pred>:
2273 ROTIInst<(outs VECREG:$rT), (ins VECREG:$rA, optype:$val),
2274 [(set (vectype VECREG:$rT),
2275 (SPUvec_rotl (vectype VECREG:$rA), (inttype pred:$val)))]>;
Scott Michel438be252007-12-17 22:32:34 +00002276
Scott Michel97872d32008-02-23 18:41:37 +00002277class ROTIRegInst<RegisterClass rclass, Operand optype, ValueType inttype, PatLeaf pred>:
2278 ROTIInst<(outs rclass:$rT), (ins rclass:$rA, optype:$val),
2279 [(set rclass:$rT, (rotl rclass:$rA, (inttype pred:$val)))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002280
Scott Michel97872d32008-02-23 18:41:37 +00002281multiclass RotateLeftWordImm
2282{
2283 def v4i32: ROTIVecInst<v4i32, u7imm_i32, i32, uimm7>;
2284 def v4i32_i16: ROTIVecInst<v4i32, u7imm, i16, uimm7>;
2285 def v4i32_i8: ROTIVecInst<v4i32, u7imm_i8, i8, uimm7>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002286
Scott Michel97872d32008-02-23 18:41:37 +00002287 def r32: ROTIRegInst<R32C, u7imm_i32, i32, uimm7>;
2288 def r32_i16: ROTIRegInst<R32C, u7imm, i16, uimm7>;
2289 def r32_i8: ROTIRegInst<R32C, u7imm_i8, i8, uimm7>;
2290}
Scott Michel438be252007-12-17 22:32:34 +00002291
Scott Michel97872d32008-02-23 18:41:37 +00002292defm ROTI : RotateLeftWordImm;
2293
2294//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
2295// Rotate quad by byte (count)
2296//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
2297
2298class ROTQBYInst<dag OOL, dag IOL, list<dag> pattern>:
2299 RRForm<0b00111011100, OOL, IOL, "rotqby\t$rT, $rA, $rB",
2300 RotateShift, pattern>;
2301
2302class ROTQBYVecInst<ValueType vectype>:
2303 ROTQBYInst<(outs VECREG:$rT), (ins VECREG:$rA, R32C:$rB),
2304 [(set (vectype VECREG:$rT),
2305 (SPUrotbytes_left (vectype VECREG:$rA), R32C:$rB))]>;
2306
2307multiclass RotateQuadLeftByBytes
2308{
2309 def v16i8: ROTQBYVecInst<v16i8>;
2310 def v8i16: ROTQBYVecInst<v8i16>;
2311 def v4i32: ROTQBYVecInst<v4i32>;
2312 def v2i64: ROTQBYVecInst<v2i64>;
2313}
2314
2315defm ROTQBY: RotateQuadLeftByBytes;
Scott Michel8b6b4202007-12-04 22:35:58 +00002316
Scott Micheldbac4cf2008-01-11 02:53:15 +00002317def : Pat<(SPUrotbytes_left_chained (v16i8 VECREG:$rA), R32C:$rB),
Scott Michel97872d32008-02-23 18:41:37 +00002318 (ROTQBYv16i8 VECREG:$rA, R32C:$rB)>;
2319def : Pat<(SPUrotbytes_left_chained (v8i16 VECREG:$rA), R32C:$rB),
2320 (ROTQBYv8i16 VECREG:$rA, R32C:$rB)>;
2321def : Pat<(SPUrotbytes_left_chained (v4i32 VECREG:$rA), R32C:$rB),
2322 (ROTQBYv4i32 VECREG:$rA, R32C:$rB)>;
2323def : Pat<(SPUrotbytes_left_chained (v2i64 VECREG:$rA), R32C:$rB),
2324 (ROTQBYv2i64 VECREG:$rA, R32C:$rB)>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002325
Scott Michel97872d32008-02-23 18:41:37 +00002326//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
2327// Rotate quad by byte (count), immediate
2328//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
2329
2330class ROTQBYIInst<dag OOL, dag IOL, list<dag> pattern>:
2331 RI7Form<0b00111111100, OOL, IOL, "rotqbyi\t$rT, $rA, $val",
2332 RotateShift, pattern>;
2333
2334class ROTQBYIVecInst<ValueType vectype>:
2335 ROTQBYIInst<(outs VECREG:$rT), (ins VECREG:$rA, u7imm:$val),
2336 [(set (vectype VECREG:$rT),
2337 (SPUrotbytes_left (vectype VECREG:$rA), (i16 uimm7:$val)))]>;
2338
2339multiclass RotateQuadByBytesImm
2340{
2341 def v16i8: ROTQBYIVecInst<v16i8>;
2342 def v8i16: ROTQBYIVecInst<v8i16>;
2343 def v4i32: ROTQBYIVecInst<v4i32>;
2344 def v2i64: ROTQBYIVecInst<v2i64>;
2345}
2346
2347defm ROTQBYI: RotateQuadByBytesImm;
Scott Michel8b6b4202007-12-04 22:35:58 +00002348
2349def : Pat<(SPUrotbytes_left_chained (v16i8 VECREG:$rA), (i16 uimm7:$val)),
Scott Michel97872d32008-02-23 18:41:37 +00002350 (ROTQBYIv16i8 VECREG:$rA, uimm7:$val)>;
2351def : Pat<(SPUrotbytes_left_chained (v8i16 VECREG:$rA), (i16 uimm7:$val)),
2352 (ROTQBYIv8i16 VECREG:$rA, uimm7:$val)>;
2353def : Pat<(SPUrotbytes_left_chained (v4i32 VECREG:$rA), (i16 uimm7:$val)),
2354 (ROTQBYIv4i32 VECREG:$rA, uimm7:$val)>;
2355def : Pat<(SPUrotbytes_left_chained (v2i64 VECREG:$rA), (i16 uimm7:$val)),
2356 (ROTQBYIv2i64 VECREG:$rA, uimm7:$val)>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002357
2358// See ROTQBY note above.
2359def ROTQBYBIvec:
2360 RI7Form<0b00110011100, (outs VECREG:$rT), (ins VECREG:$rA, u7imm:$val),
2361 "rotqbybi\t$rT, $rA, $val", RotateShift,
2362 [/* intrinsic */]>;
2363
Scott Michel97872d32008-02-23 18:41:37 +00002364//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
Scott Michel8b6b4202007-12-04 22:35:58 +00002365// See ROTQBY note above.
2366//
2367// Assume that the user of this instruction knows to shift the rotate count
2368// into bit 29
Scott Michel97872d32008-02-23 18:41:37 +00002369//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
Scott Michel8b6b4202007-12-04 22:35:58 +00002370
Scott Michel97872d32008-02-23 18:41:37 +00002371class ROTQBIInst<dag OOL, dag IOL, list<dag> pattern>:
2372 RRForm<0b00011011100, OOL, IOL, "rotqbi\t$rT, $rA, $rB",
2373 RotateShift, pattern>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002374
Scott Michel97872d32008-02-23 18:41:37 +00002375class ROTQBIVecInst<ValueType vectype>:
2376 ROTQBIInst<(outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
2377 [/* no pattern yet */]>;
2378
2379class ROTQBIRegInst<RegisterClass rclass>:
2380 ROTQBIInst<(outs rclass:$rT), (ins rclass:$rA, rclass:$rB),
2381 [/* no pattern yet */]>;
2382
2383multiclass RotateQuadByBitCount
2384{
2385 def v16i8: ROTQBIVecInst<v16i8>;
2386 def v8i16: ROTQBIVecInst<v8i16>;
2387 def v4i32: ROTQBIVecInst<v4i32>;
2388 def v2i64: ROTQBIVecInst<v2i64>;
2389
2390 def r128: ROTQBIRegInst<GPRC>;
2391 def r64: ROTQBIRegInst<R64C>;
2392}
2393
2394defm ROTQBI: RotateQuadByBitCount;
2395
2396class ROTQBIIInst<dag OOL, dag IOL, list<dag> pattern>:
2397 RI7Form<0b00011111100, OOL, IOL, "rotqbii\t$rT, $rA, $val",
2398 RotateShift, pattern>;
2399
2400class ROTQBIIVecInst<ValueType vectype, Operand optype, ValueType inttype,
2401 PatLeaf pred>:
2402 ROTQBIIInst<(outs VECREG:$rT), (ins VECREG:$rA, optype:$val),
2403 [/* no pattern yet */]>;
2404
2405class ROTQBIIRegInst<RegisterClass rclass, Operand optype, ValueType inttype,
2406 PatLeaf pred>:
2407 ROTQBIIInst<(outs rclass:$rT), (ins rclass:$rA, optype:$val),
2408 [/* no pattern yet */]>;
2409
2410multiclass RotateQuadByBitCountImm
2411{
2412 def v16i8: ROTQBIIVecInst<v16i8, u7imm_i32, i32, uimm7>;
2413 def v8i16: ROTQBIIVecInst<v8i16, u7imm_i32, i32, uimm7>;
2414 def v4i32: ROTQBIIVecInst<v4i32, u7imm_i32, i32, uimm7>;
2415 def v2i64: ROTQBIIVecInst<v2i64, u7imm_i32, i32, uimm7>;
2416
2417 def r128: ROTQBIIRegInst<GPRC, u7imm_i32, i32, uimm7>;
2418 def r64: ROTQBIIRegInst<R64C, u7imm_i32, i32, uimm7>;
2419}
2420
2421defm ROTQBII : RotateQuadByBitCountImm;
2422
2423//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
Scott Michel8b6b4202007-12-04 22:35:58 +00002424// ROTHM v8i16 form:
2425// NOTE(1): No vector rotate is generated by the C/C++ frontend (today),
2426// so this only matches a synthetically generated/lowered code
2427// fragment.
2428// NOTE(2): $rB must be negated before the right rotate!
Scott Michel97872d32008-02-23 18:41:37 +00002429//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
Scott Michel8b6b4202007-12-04 22:35:58 +00002430
Scott Michel97872d32008-02-23 18:41:37 +00002431class ROTHMInst<dag OOL, dag IOL, list<dag> pattern>:
2432 RRForm<0b10111010000, OOL, IOL, "rothm\t$rT, $rA, $rB",
2433 RotateShift, pattern>;
2434
2435def ROTHMv8i16:
2436 ROTHMInst<(outs VECREG:$rT), (ins VECREG:$rA, R32C:$rB),
2437 [/* see patterns below - $rB must be negated */]>;
2438
2439def : Pat<(SPUvec_srl (v8i16 VECREG:$rA), R32C:$rB),
Scott Michel8b6b4202007-12-04 22:35:58 +00002440 (ROTHMv8i16 VECREG:$rA, (SFIr32 R32C:$rB, 0))>;
2441
Scott Michel97872d32008-02-23 18:41:37 +00002442def : Pat<(SPUvec_srl (v8i16 VECREG:$rA), R16C:$rB),
Scott Michel8b6b4202007-12-04 22:35:58 +00002443 (ROTHMv8i16 VECREG:$rA,
2444 (SFIr32 (XSHWr16 R16C:$rB), 0))>;
2445
Scott Michel97872d32008-02-23 18:41:37 +00002446def : Pat<(SPUvec_srl (v8i16 VECREG:$rA), R8C:$rB),
Scott Michel8b6b4202007-12-04 22:35:58 +00002447 (ROTHMv8i16 VECREG:$rA,
Scott Michel438be252007-12-17 22:32:34 +00002448 (SFIr32 (XSHWr16 (XSBHr8 R8C:$rB) ), 0))>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002449
2450// ROTHM r16 form: Rotate 16-bit quantity to right, zero fill at the left
2451// Note: This instruction doesn't match a pattern because rB must be negated
2452// for the instruction to work. Thus, the pattern below the instruction!
Scott Michel97872d32008-02-23 18:41:37 +00002453
Scott Michel8b6b4202007-12-04 22:35:58 +00002454def ROTHMr16:
Scott Michel97872d32008-02-23 18:41:37 +00002455 ROTHMInst<(outs R16C:$rT), (ins R16C:$rA, R32C:$rB),
2456 [/* see patterns below - $rB must be negated! */]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002457
2458def : Pat<(srl R16C:$rA, R32C:$rB),
2459 (ROTHMr16 R16C:$rA, (SFIr32 R32C:$rB, 0))>;
2460
2461def : Pat<(srl R16C:$rA, R16C:$rB),
2462 (ROTHMr16 R16C:$rA,
2463 (SFIr32 (XSHWr16 R16C:$rB), 0))>;
2464
Scott Michel438be252007-12-17 22:32:34 +00002465def : Pat<(srl R16C:$rA, R8C:$rB),
Scott Michel8b6b4202007-12-04 22:35:58 +00002466 (ROTHMr16 R16C:$rA,
Scott Michel438be252007-12-17 22:32:34 +00002467 (SFIr32 (XSHWr16 (XSBHr8 R8C:$rB) ), 0))>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002468
2469// ROTHMI v8i16 form: See the comment for ROTHM v8i16. The difference here is
2470// that the immediate can be complemented, so that the user doesn't have to
2471// worry about it.
Scott Michel8b6b4202007-12-04 22:35:58 +00002472
Scott Michel97872d32008-02-23 18:41:37 +00002473class ROTHMIInst<dag OOL, dag IOL, list<dag> pattern>:
2474 RI7Form<0b10111110000, OOL, IOL, "rothmi\t$rT, $rA, $val",
2475 RotateShift, pattern>;
2476
2477def ROTHMIv8i16:
2478 ROTHMIInst<(outs VECREG:$rT), (ins VECREG:$rA, rothNeg7imm:$val),
2479 [/* no pattern */]>;
2480
2481def : Pat<(SPUvec_srl (v8i16 VECREG:$rA), (i32 imm:$val)),
2482 (ROTHMIv8i16 VECREG:$rA, imm:$val)>;
2483
2484def: Pat<(SPUvec_srl (v8i16 VECREG:$rA), (i16 imm:$val)),
Scott Michel8b6b4202007-12-04 22:35:58 +00002485 (ROTHMIv8i16 VECREG:$rA, imm:$val)>;
Scott Michel438be252007-12-17 22:32:34 +00002486
Scott Michel97872d32008-02-23 18:41:37 +00002487def: Pat<(SPUvec_srl (v8i16 VECREG:$rA), (i8 imm:$val)),
Scott Michel5a6f17b2008-01-30 02:55:46 +00002488 (ROTHMIv8i16 VECREG:$rA, imm:$val)>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002489
2490def ROTHMIr16:
Scott Michel97872d32008-02-23 18:41:37 +00002491 ROTHMIInst<(outs R16C:$rT), (ins R16C:$rA, rothNeg7imm:$val),
2492 [/* no pattern */]>;
2493
2494def: Pat<(srl R16C:$rA, (i32 uimm7:$val)),
2495 (ROTHMIr16 R16C:$rA, uimm7:$val)>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002496
2497def: Pat<(srl R16C:$rA, (i16 uimm7:$val)),
2498 (ROTHMIr16 R16C:$rA, uimm7:$val)>;
2499
Scott Michel438be252007-12-17 22:32:34 +00002500def: Pat<(srl R16C:$rA, (i8 uimm7:$val)),
2501 (ROTHMIr16 R16C:$rA, uimm7:$val)>;
2502
Scott Michel8b6b4202007-12-04 22:35:58 +00002503// ROTM v4i32 form: See the ROTHM v8i16 comments.
Scott Michel97872d32008-02-23 18:41:37 +00002504class ROTMInst<dag OOL, dag IOL, list<dag> pattern>:
2505 RRForm<0b10011010000, OOL, IOL, "rotm\t$rT, $rA, $rB",
2506 RotateShift, pattern>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002507
Scott Michel97872d32008-02-23 18:41:37 +00002508def ROTMv4i32:
2509 ROTMInst<(outs VECREG:$rT), (ins VECREG:$rA, R32C:$rB),
2510 [/* see patterns below - $rB must be negated */]>;
2511
2512def : Pat<(SPUvec_srl VECREG:$rA, R32C:$rB),
Scott Michel8b6b4202007-12-04 22:35:58 +00002513 (ROTMv4i32 VECREG:$rA, (SFIr32 R32C:$rB, 0))>;
2514
Scott Michel97872d32008-02-23 18:41:37 +00002515def : Pat<(SPUvec_srl VECREG:$rA, R16C:$rB),
Scott Michel8b6b4202007-12-04 22:35:58 +00002516 (ROTMv4i32 VECREG:$rA,
2517 (SFIr32 (XSHWr16 R16C:$rB), 0))>;
2518
Scott Michel97872d32008-02-23 18:41:37 +00002519def : Pat<(SPUvec_srl VECREG:$rA, R8C:$rB),
Scott Michel8b6b4202007-12-04 22:35:58 +00002520 (ROTMv4i32 VECREG:$rA,
Scott Michel97872d32008-02-23 18:41:37 +00002521 (SFIr32 (XSHWr16 (XSBHr8 R8C:$rB)), 0))>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002522
2523def ROTMr32:
Scott Michel97872d32008-02-23 18:41:37 +00002524 ROTMInst<(outs R32C:$rT), (ins R32C:$rA, R32C:$rB),
2525 [/* see patterns below - $rB must be negated */]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002526
2527def : Pat<(srl R32C:$rA, R32C:$rB),
2528 (ROTMr32 R32C:$rA, (SFIr32 R32C:$rB, 0))>;
2529
2530def : Pat<(srl R32C:$rA, R16C:$rB),
2531 (ROTMr32 R32C:$rA,
2532 (SFIr32 (XSHWr16 R16C:$rB), 0))>;
2533
Scott Michel438be252007-12-17 22:32:34 +00002534def : Pat<(srl R32C:$rA, R8C:$rB),
2535 (ROTMr32 R32C:$rA,
2536 (SFIr32 (XSHWr16 (XSBHr8 R8C:$rB)), 0))>;
2537
Scott Michel8b6b4202007-12-04 22:35:58 +00002538// ROTMI v4i32 form: See the comment for ROTHM v8i16.
2539def ROTMIv4i32:
2540 RI7Form<0b10011110000, (outs VECREG:$rT), (ins VECREG:$rA, rotNeg7imm:$val),
2541 "rotmi\t$rT, $rA, $val", RotateShift,
2542 [(set (v4i32 VECREG:$rT),
Scott Michel97872d32008-02-23 18:41:37 +00002543 (SPUvec_srl VECREG:$rA, (i32 uimm7:$val)))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002544
Scott Michel97872d32008-02-23 18:41:37 +00002545def : Pat<(SPUvec_srl VECREG:$rA, (i16 uimm7:$val)),
Scott Michel8b6b4202007-12-04 22:35:58 +00002546 (ROTMIv4i32 VECREG:$rA, uimm7:$val)>;
Scott Michel438be252007-12-17 22:32:34 +00002547
Scott Michel97872d32008-02-23 18:41:37 +00002548def : Pat<(SPUvec_srl VECREG:$rA, (i8 uimm7:$val)),
Scott Michel438be252007-12-17 22:32:34 +00002549 (ROTMIv4i32 VECREG:$rA, uimm7:$val)>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002550
2551// ROTMI r32 form: know how to complement the immediate value.
2552def ROTMIr32:
2553 RI7Form<0b10011110000, (outs R32C:$rT), (ins R32C:$rA, rotNeg7imm:$val),
2554 "rotmi\t$rT, $rA, $val", RotateShift,
2555 [(set R32C:$rT, (srl R32C:$rA, (i32 uimm7:$val)))]>;
2556
2557def : Pat<(srl R32C:$rA, (i16 imm:$val)),
2558 (ROTMIr32 R32C:$rA, uimm7:$val)>;
2559
Scott Michel438be252007-12-17 22:32:34 +00002560def : Pat<(srl R32C:$rA, (i8 imm:$val)),
2561 (ROTMIr32 R32C:$rA, uimm7:$val)>;
2562
Scott Michel97872d32008-02-23 18:41:37 +00002563//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
Scott Michel8b6b4202007-12-04 22:35:58 +00002564// ROTQMBYvec: This is a vector form merely so that when used in an
2565// instruction pattern, type checking will succeed. This instruction assumes
Scott Michel97872d32008-02-23 18:41:37 +00002566// that the user knew to negate $rB.
2567//
2568// Using the SPUrotquad_rz_bytes target-specific DAG node, the patterns
2569// ensure that $rB is negated.
2570//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
Scott Michel8b6b4202007-12-04 22:35:58 +00002571
Scott Michel97872d32008-02-23 18:41:37 +00002572class ROTQMBYInst<dag OOL, dag IOL, list<dag> pattern>:
2573 RRForm<0b10111011100, OOL, IOL, "rotqmby\t$rT, $rA, $rB",
2574 RotateShift, pattern>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002575
Scott Michel97872d32008-02-23 18:41:37 +00002576class ROTQMBYVecInst<ValueType vectype>:
2577 ROTQMBYInst<(outs VECREG:$rT), (ins VECREG:$rA, R32C:$rB),
2578 [/* no pattern, $rB must be negated */]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002579
Scott Michel97872d32008-02-23 18:41:37 +00002580class ROTQMBYRegInst<RegisterClass rclass>:
2581 ROTQMBYInst<(outs rclass:$rT), (ins rclass:$rA, R32C:$rB),
2582 [(set rclass:$rT,
2583 (SPUrotquad_rz_bytes rclass:$rA, R32C:$rB))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002584
Scott Michel97872d32008-02-23 18:41:37 +00002585multiclass RotateQuadBytes
2586{
2587 def v16i8: ROTQMBYVecInst<v16i8>;
2588 def v8i16: ROTQMBYVecInst<v8i16>;
2589 def v4i32: ROTQMBYVecInst<v4i32>;
2590 def v2i64: ROTQMBYVecInst<v2i64>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002591
Scott Michel97872d32008-02-23 18:41:37 +00002592 def r128: ROTQMBYRegInst<GPRC>;
2593 def r64: ROTQMBYRegInst<R64C>;
2594}
2595
2596defm ROTQMBY : RotateQuadBytes;
2597
2598def : Pat<(SPUrotquad_rz_bytes (v16i8 VECREG:$rA), R32C:$rB),
2599 (ROTQMBYv16i8 VECREG:$rA, (SFIr32 R32C:$rB, 0))>;
2600def : Pat<(SPUrotquad_rz_bytes (v8i16 VECREG:$rA), R32C:$rB),
2601 (ROTQMBYv8i16 VECREG:$rA, (SFIr32 R32C:$rB, 0))>;
2602def : Pat<(SPUrotquad_rz_bytes (v4i32 VECREG:$rA), R32C:$rB),
2603 (ROTQMBYv4i32 VECREG:$rA, (SFIr32 R32C:$rB, 0))>;
2604def : Pat<(SPUrotquad_rz_bytes (v2i64 VECREG:$rA), R32C:$rB),
2605 (ROTQMBYv2i64 VECREG:$rA, (SFIr32 R32C:$rB, 0))>;
2606def : Pat<(SPUrotquad_rz_bytes GPRC:$rA, R32C:$rB),
2607 (ROTQMBYr128 GPRC:$rA, (SFIr32 R32C:$rB, 0))>;
2608def : Pat<(SPUrotquad_rz_bytes R64C:$rA, R32C:$rB),
2609 (ROTQMBYr64 R64C:$rA, (SFIr32 R32C:$rB, 0))>;
2610
2611class ROTQMBYIInst<dag OOL, dag IOL, list<dag> pattern>:
2612 RI7Form<0b10111111100, OOL, IOL, "rotqmbyi\t$rT, $rA, $val",
2613 RotateShift, pattern>;
2614
2615class ROTQMBYIVecInst<ValueType vectype>:
2616 ROTQMBYIInst<(outs VECREG:$rT), (ins VECREG:$rA, rotNeg7imm:$val),
2617 [(set (vectype VECREG:$rT),
2618 (SPUrotquad_rz_bytes (vectype VECREG:$rA), (i32 uimm7:$val)))]>;
2619
2620class ROTQMBYIRegInst<RegisterClass rclass, Operand optype, ValueType inttype, PatLeaf pred>:
2621 ROTQMBYIInst<(outs rclass:$rT), (ins rclass:$rA, optype:$val),
2622 [(set rclass:$rT,
2623 (SPUrotquad_rz_bytes rclass:$rA, (inttype pred:$val)))]>;
2624
2625multiclass RotateQuadBytesImm
2626{
2627 def v16i8: ROTQMBYIVecInst<v16i8>;
2628 def v8i16: ROTQMBYIVecInst<v8i16>;
2629 def v4i32: ROTQMBYIVecInst<v4i32>;
2630 def v2i64: ROTQMBYIVecInst<v2i64>;
2631
2632 def r128: ROTQMBYIRegInst<GPRC, rotNeg7imm, i32, uimm7>;
2633 def r64: ROTQMBYIRegInst<R64C, rotNeg7imm, i32, uimm7>;
2634}
2635
2636defm ROTQMBYI : RotateQuadBytesImm;
2637
2638
2639//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
2640// Rotate right and mask by bit count
2641//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
2642
2643class ROTQMBYBIInst<dag OOL, dag IOL, list<dag> pattern>:
2644 RRForm<0b10110011100, OOL, IOL, "rotqmbybi\t$rT, $rA, $rB",
2645 RotateShift, pattern>;
2646
2647class ROTQMBYBIVecInst<ValueType vectype>:
2648 ROTQMBYBIInst<(outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
2649 [/* no pattern, intrinsic? */]>;
2650
2651multiclass RotateMaskQuadByBitCount
2652{
2653 def v16i8: ROTQMBYBIVecInst<v16i8>;
2654 def v8i16: ROTQMBYBIVecInst<v8i16>;
2655 def v4i32: ROTQMBYBIVecInst<v4i32>;
2656 def v2i64: ROTQMBYBIVecInst<v2i64>;
2657}
2658
2659defm ROTQMBYBI: RotateMaskQuadByBitCount;
2660
2661//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
2662// Rotate quad and mask by bits
2663// Note that the rotate amount has to be negated
2664//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
2665
2666class ROTQMBIInst<dag OOL, dag IOL, list<dag> pattern>:
2667 RRForm<0b10011011100, OOL, IOL, "rotqmbi\t$rT, $rA, $rB",
2668 RotateShift, pattern>;
2669
2670class ROTQMBIVecInst<ValueType vectype>:
2671 ROTQMBIInst<(outs VECREG:$rT), (ins VECREG:$rA, R32C:$rB),
2672 [/* no pattern */]>;
2673
2674class ROTQMBIRegInst<RegisterClass rclass>:
2675 ROTQMBIInst<(outs rclass:$rT), (ins rclass:$rA, R32C:$rB),
2676 [/* no pattern */]>;
2677
2678multiclass RotateMaskQuadByBits
2679{
2680 def v16i8: ROTQMBIVecInst<v16i8>;
2681 def v8i16: ROTQMBIVecInst<v8i16>;
2682 def v4i32: ROTQMBIVecInst<v4i32>;
2683 def v2i64: ROTQMBIVecInst<v2i64>;
2684
2685 def r128: ROTQMBIRegInst<GPRC>;
2686 def r64: ROTQMBIRegInst<R64C>;
2687}
2688
2689defm ROTQMBI: RotateMaskQuadByBits;
2690
2691def : Pat<(SPUrotquad_rz_bits (v16i8 VECREG:$rA), R32C:$rB),
2692 (ROTQMBIv16i8 VECREG:$rA, (SFIr32 R32C:$rB, 0))>;
2693def : Pat<(SPUrotquad_rz_bits (v8i16 VECREG:$rA), R32C:$rB),
2694 (ROTQMBIv8i16 VECREG:$rA, (SFIr32 R32C:$rB, 0))>;
2695def : Pat<(SPUrotquad_rz_bits (v4i32 VECREG:$rA), R32C:$rB),
2696 (ROTQMBIv4i32 VECREG:$rA, (SFIr32 R32C:$rB, 0))>;
2697def : Pat<(SPUrotquad_rz_bits (v2i64 VECREG:$rA), R32C:$rB),
2698 (ROTQMBIv2i64 VECREG:$rA, (SFIr32 R32C:$rB, 0))>;
2699def : Pat<(SPUrotquad_rz_bits GPRC:$rA, R32C:$rB),
2700 (ROTQMBIr128 GPRC:$rA, (SFIr32 R32C:$rB, 0))>;
2701def : Pat<(SPUrotquad_rz_bits R64C:$rA, R32C:$rB),
2702 (ROTQMBIr64 R64C:$rA, (SFIr32 R32C:$rB, 0))>;
2703
2704//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
2705// Rotate quad and mask by bits, immediate
2706//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
2707
2708class ROTQMBIIInst<dag OOL, dag IOL, list<dag> pattern>:
2709 RI7Form<0b10011111100, OOL, IOL, "rotqmbii\t$rT, $rA, $val",
2710 RotateShift, pattern>;
2711
2712class ROTQMBIIVecInst<ValueType vectype>:
2713 ROTQMBIIInst<(outs VECREG:$rT), (ins VECREG:$rA, rotNeg7imm:$val),
2714 [(set (vectype VECREG:$rT),
2715 (SPUrotquad_rz_bits (vectype VECREG:$rA), (i32 uimm7:$val)))]>;
2716
2717class ROTQMBIIRegInst<RegisterClass rclass>:
2718 ROTQMBIIInst<(outs rclass:$rT), (ins rclass:$rA, rotNeg7imm:$val),
2719 [(set rclass:$rT,
2720 (SPUrotquad_rz_bits rclass:$rA, (i32 uimm7:$val)))]>;
2721
2722multiclass RotateMaskQuadByBitsImm
2723{
2724 def v16i8: ROTQMBIIVecInst<v16i8>;
2725 def v8i16: ROTQMBIIVecInst<v8i16>;
2726 def v4i32: ROTQMBIIVecInst<v4i32>;
2727 def v2i64: ROTQMBIIVecInst<v2i64>;
2728
2729 def r128: ROTQMBIIRegInst<GPRC>;
2730 def r64: ROTQMBIIRegInst<R64C>;
2731}
2732
2733defm ROTQMBII: RotateMaskQuadByBitsImm;
2734
2735//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
2736//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
Scott Michel8b6b4202007-12-04 22:35:58 +00002737
2738def ROTMAHv8i16:
2739 RRForm<0b01111010000, (outs VECREG:$rT), (ins VECREG:$rA, R32C:$rB),
2740 "rotmah\t$rT, $rA, $rB", RotateShift,
2741 [/* see patterns below - $rB must be negated */]>;
2742
Scott Michel97872d32008-02-23 18:41:37 +00002743def : Pat<(SPUvec_sra VECREG:$rA, R32C:$rB),
Scott Michel8b6b4202007-12-04 22:35:58 +00002744 (ROTMAHv8i16 VECREG:$rA, (SFIr32 R32C:$rB, 0))>;
2745
Scott Michel97872d32008-02-23 18:41:37 +00002746def : Pat<(SPUvec_sra VECREG:$rA, R16C:$rB),
Scott Michel8b6b4202007-12-04 22:35:58 +00002747 (ROTMAHv8i16 VECREG:$rA,
2748 (SFIr32 (XSHWr16 R16C:$rB), 0))>;
2749
Scott Michel97872d32008-02-23 18:41:37 +00002750def : Pat<(SPUvec_sra VECREG:$rA, R8C:$rB),
Scott Michel438be252007-12-17 22:32:34 +00002751 (ROTMAHv8i16 VECREG:$rA,
2752 (SFIr32 (XSHWr16 (XSBHr8 R8C:$rB)), 0))>;
2753
Scott Michel8b6b4202007-12-04 22:35:58 +00002754def ROTMAHr16:
2755 RRForm<0b01111010000, (outs R16C:$rT), (ins R16C:$rA, R32C:$rB),
2756 "rotmah\t$rT, $rA, $rB", RotateShift,
2757 [/* see patterns below - $rB must be negated */]>;
2758
2759def : Pat<(sra R16C:$rA, R32C:$rB),
2760 (ROTMAHr16 R16C:$rA, (SFIr32 R32C:$rB, 0))>;
2761
2762def : Pat<(sra R16C:$rA, R16C:$rB),
2763 (ROTMAHr16 R16C:$rA,
2764 (SFIr32 (XSHWr16 R16C:$rB), 0))>;
2765
Scott Michel438be252007-12-17 22:32:34 +00002766def : Pat<(sra R16C:$rA, R8C:$rB),
2767 (ROTMAHr16 R16C:$rA,
2768 (SFIr32 (XSHWr16 (XSBHr8 R8C:$rB)), 0))>;
2769
Scott Michel8b6b4202007-12-04 22:35:58 +00002770def ROTMAHIv8i16:
2771 RRForm<0b01111110000, (outs VECREG:$rT), (ins VECREG:$rA, rothNeg7imm:$val),
2772 "rotmahi\t$rT, $rA, $val", RotateShift,
2773 [(set (v8i16 VECREG:$rT),
Scott Michel97872d32008-02-23 18:41:37 +00002774 (SPUvec_sra (v8i16 VECREG:$rA), (i32 uimm7:$val)))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002775
Scott Michel97872d32008-02-23 18:41:37 +00002776def : Pat<(SPUvec_sra (v8i16 VECREG:$rA), (i16 uimm7:$val)),
Scott Michel8b6b4202007-12-04 22:35:58 +00002777 (ROTMAHIv8i16 (v8i16 VECREG:$rA), (i32 uimm7:$val))>;
2778
Scott Michel97872d32008-02-23 18:41:37 +00002779def : Pat<(SPUvec_sra (v8i16 VECREG:$rA), (i8 uimm7:$val)),
Scott Michel438be252007-12-17 22:32:34 +00002780 (ROTMAHIv8i16 (v8i16 VECREG:$rA), (i32 uimm7:$val))>;
2781
Scott Michel8b6b4202007-12-04 22:35:58 +00002782def ROTMAHIr16:
2783 RRForm<0b01111110000, (outs R16C:$rT), (ins R16C:$rA, rothNeg7imm_i16:$val),
2784 "rotmahi\t$rT, $rA, $val", RotateShift,
2785 [(set R16C:$rT, (sra R16C:$rA, (i16 uimm7:$val)))]>;
2786
2787def : Pat<(sra R16C:$rA, (i32 imm:$val)),
2788 (ROTMAHIr16 R16C:$rA, uimm7:$val)>;
2789
Scott Michel438be252007-12-17 22:32:34 +00002790def : Pat<(sra R16C:$rA, (i8 imm:$val)),
2791 (ROTMAHIr16 R16C:$rA, uimm7:$val)>;
2792
Scott Michel8b6b4202007-12-04 22:35:58 +00002793def ROTMAv4i32:
2794 RRForm<0b01011010000, (outs VECREG:$rT), (ins VECREG:$rA, R32C:$rB),
2795 "rotma\t$rT, $rA, $rB", RotateShift,
2796 [/* see patterns below - $rB must be negated */]>;
2797
Scott Michel97872d32008-02-23 18:41:37 +00002798def : Pat<(SPUvec_sra VECREG:$rA, R32C:$rB),
Scott Michel8b6b4202007-12-04 22:35:58 +00002799 (ROTMAv4i32 (v4i32 VECREG:$rA), (SFIr32 R32C:$rB, 0))>;
2800
Scott Michel97872d32008-02-23 18:41:37 +00002801def : Pat<(SPUvec_sra VECREG:$rA, R16C:$rB),
Scott Michel8b6b4202007-12-04 22:35:58 +00002802 (ROTMAv4i32 (v4i32 VECREG:$rA),
2803 (SFIr32 (XSHWr16 R16C:$rB), 0))>;
2804
Scott Michel97872d32008-02-23 18:41:37 +00002805def : Pat<(SPUvec_sra VECREG:$rA, R8C:$rB),
Scott Michel438be252007-12-17 22:32:34 +00002806 (ROTMAv4i32 (v4i32 VECREG:$rA),
2807 (SFIr32 (XSHWr16 (XSBHr8 R8C:$rB)), 0))>;
2808
Scott Michel8b6b4202007-12-04 22:35:58 +00002809def ROTMAr32:
2810 RRForm<0b01011010000, (outs R32C:$rT), (ins R32C:$rA, R32C:$rB),
2811 "rotma\t$rT, $rA, $rB", RotateShift,
2812 [/* see patterns below - $rB must be negated */]>;
2813
2814def : Pat<(sra R32C:$rA, R32C:$rB),
2815 (ROTMAr32 R32C:$rA, (SFIr32 R32C:$rB, 0))>;
2816
2817def : Pat<(sra R32C:$rA, R16C:$rB),
2818 (ROTMAr32 R32C:$rA,
2819 (SFIr32 (XSHWr16 R16C:$rB), 0))>;
2820
Scott Michel438be252007-12-17 22:32:34 +00002821def : Pat<(sra R32C:$rA, R8C:$rB),
2822 (ROTMAr32 R32C:$rA,
2823 (SFIr32 (XSHWr16 (XSBHr8 R8C:$rB)), 0))>;
2824
Scott Michel8b6b4202007-12-04 22:35:58 +00002825def ROTMAIv4i32:
2826 RRForm<0b01011110000, (outs VECREG:$rT), (ins VECREG:$rA, rotNeg7imm:$val),
2827 "rotmai\t$rT, $rA, $val", RotateShift,
2828 [(set (v4i32 VECREG:$rT),
Scott Michel97872d32008-02-23 18:41:37 +00002829 (SPUvec_sra VECREG:$rA, (i32 uimm7:$val)))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002830
Scott Michel97872d32008-02-23 18:41:37 +00002831def : Pat<(SPUvec_sra VECREG:$rA, (i16 uimm7:$val)),
Scott Michel8b6b4202007-12-04 22:35:58 +00002832 (ROTMAIv4i32 VECREG:$rA, uimm7:$val)>;
2833
2834def ROTMAIr32:
2835 RRForm<0b01011110000, (outs R32C:$rT), (ins R32C:$rA, rotNeg7imm:$val),
2836 "rotmai\t$rT, $rA, $val", RotateShift,
2837 [(set R32C:$rT, (sra R32C:$rA, (i32 uimm7:$val)))]>;
2838
2839def : Pat<(sra R32C:$rA, (i16 uimm7:$val)),
2840 (ROTMAIr32 R32C:$rA, uimm7:$val)>;
2841
Scott Michel438be252007-12-17 22:32:34 +00002842def : Pat<(sra R32C:$rA, (i8 uimm7:$val)),
2843 (ROTMAIr32 R32C:$rA, uimm7:$val)>;
2844
Scott Michel8b6b4202007-12-04 22:35:58 +00002845//===----------------------------------------------------------------------===//
2846// Branch and conditionals:
2847//===----------------------------------------------------------------------===//
2848
2849let isTerminator = 1, isBarrier = 1 in {
2850 // Halt If Equal (r32 preferred slot only, no vector form)
2851 def HEQr32:
2852 RRForm_3<0b00011011110, (outs), (ins R32C:$rA, R32C:$rB),
2853 "heq\t$rA, $rB", BranchResolv,
2854 [/* no pattern to match */]>;
2855
2856 def HEQIr32 :
2857 RI10Form_2<0b11111110, (outs), (ins R32C:$rA, s10imm:$val),
2858 "heqi\t$rA, $val", BranchResolv,
2859 [/* no pattern to match */]>;
2860
2861 // HGT/HGTI: These instructions use signed arithmetic for the comparison,
2862 // contrasting with HLGT/HLGTI, which use unsigned comparison:
2863 def HGTr32:
2864 RRForm_3<0b00011010010, (outs), (ins R32C:$rA, R32C:$rB),
2865 "hgt\t$rA, $rB", BranchResolv,
2866 [/* no pattern to match */]>;
2867
2868 def HGTIr32:
2869 RI10Form_2<0b11110010, (outs), (ins R32C:$rA, s10imm:$val),
2870 "hgti\t$rA, $val", BranchResolv,
2871 [/* no pattern to match */]>;
2872
2873 def HLGTr32:
2874 RRForm_3<0b00011011010, (outs), (ins R32C:$rA, R32C:$rB),
2875 "hlgt\t$rA, $rB", BranchResolv,
2876 [/* no pattern to match */]>;
2877
2878 def HLGTIr32:
2879 RI10Form_2<0b11111010, (outs), (ins R32C:$rA, s10imm:$val),
2880 "hlgti\t$rA, $val", BranchResolv,
2881 [/* no pattern to match */]>;
2882}
2883
Scott Michel97872d32008-02-23 18:41:37 +00002884//------------------------------------------------------------------------
Scott Michel8b6b4202007-12-04 22:35:58 +00002885// Comparison operators:
Scott Michel97872d32008-02-23 18:41:37 +00002886//------------------------------------------------------------------------
Scott Michel8b6b4202007-12-04 22:35:58 +00002887
Scott Michel97872d32008-02-23 18:41:37 +00002888class CEQBInst<dag OOL, dag IOL, list<dag> pattern> :
2889 RRForm<0b00001011110, OOL, IOL, "ceqb\t$rT, $rA, $rB",
2890 ByteOp, pattern>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002891
Scott Michel97872d32008-02-23 18:41:37 +00002892multiclass CmpEqualByte
2893{
2894 def v16i8 :
2895 CEQBInst<(outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
2896 [(set (v16i8 VECREG:$rT), (seteq (v8i16 VECREG:$rA),
2897 (v8i16 VECREG:$rB)))]>;
Scott Michel438be252007-12-17 22:32:34 +00002898
Scott Michel97872d32008-02-23 18:41:37 +00002899 def r8 :
2900 CEQBInst<(outs R8C:$rT), (ins R8C:$rA, R8C:$rB),
2901 [(set R8C:$rT, (seteq R8C:$rA, R8C:$rB))]>;
2902}
Scott Michel8b6b4202007-12-04 22:35:58 +00002903
Scott Michel97872d32008-02-23 18:41:37 +00002904class CEQBIInst<dag OOL, dag IOL, list<dag> pattern> :
2905 RI10Form<0b01111110, OOL, IOL, "ceqbi\t$rT, $rA, $val",
2906 ByteOp, pattern>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002907
Scott Michel97872d32008-02-23 18:41:37 +00002908multiclass CmpEqualByteImm
2909{
2910 def v16i8 :
2911 CEQBIInst<(outs VECREG:$rT), (ins VECREG:$rA, s10imm_i8:$val),
2912 [(set (v16i8 VECREG:$rT), (seteq (v16i8 VECREG:$rA),
2913 v16i8SExt8Imm:$val))]>;
2914 def r8:
2915 CEQBIInst<(outs R8C:$rT), (ins R8C:$rA, s10imm_i8:$val),
2916 [(set R8C:$rT, (seteq R8C:$rA, immSExt8:$val))]>;
2917}
Scott Michel8b6b4202007-12-04 22:35:58 +00002918
Scott Michel97872d32008-02-23 18:41:37 +00002919class CEQHInst<dag OOL, dag IOL, list<dag> pattern> :
2920 RRForm<0b00010011110, OOL, IOL, "ceqh\t$rT, $rA, $rB",
2921 ByteOp, pattern>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002922
Scott Michel97872d32008-02-23 18:41:37 +00002923multiclass CmpEqualHalfword
2924{
2925 def v8i16 : CEQHInst<(outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
2926 [(set (v8i16 VECREG:$rT), (seteq (v8i16 VECREG:$rA),
2927 (v8i16 VECREG:$rB)))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002928
Scott Michel97872d32008-02-23 18:41:37 +00002929 def r16 : CEQHInst<(outs R16C:$rT), (ins R16C:$rA, R16C:$rB),
2930 [(set R16C:$rT, (seteq R16C:$rA, R16C:$rB))]>;
2931}
Scott Michel8b6b4202007-12-04 22:35:58 +00002932
Scott Michel97872d32008-02-23 18:41:37 +00002933class CEQHIInst<dag OOL, dag IOL, list<dag> pattern> :
2934 RI10Form<0b10111110, OOL, IOL, "ceqhi\t$rT, $rA, $val",
2935 ByteOp, pattern>;
Scott Michel8b6b4202007-12-04 22:35:58 +00002936
Scott Michel97872d32008-02-23 18:41:37 +00002937multiclass CmpEqualHalfwordImm
2938{
2939 def v8i16 : CEQHIInst<(outs VECREG:$rT), (ins VECREG:$rA, s10imm:$val),
2940 [(set (v8i16 VECREG:$rT),
2941 (seteq (v8i16 VECREG:$rA),
2942 (v8i16 v8i16SExt10Imm:$val)))]>;
2943 def r16 : CEQHIInst<(outs R16C:$rT), (ins R16C:$rA, s10imm:$val),
2944 [(set R16C:$rT, (seteq R16C:$rA, i16ImmSExt10:$val))]>;
2945}
Scott Michel8b6b4202007-12-04 22:35:58 +00002946
Scott Michel97872d32008-02-23 18:41:37 +00002947class CEQInst<dag OOL, dag IOL, list<dag> pattern> :
2948 RRForm<0b00000011110, OOL, IOL, "ceq\t$rT, $rA, $rB",
2949 ByteOp, pattern>;
2950
2951multiclass CmpEqualWord
2952{
2953 def v4i32 : CEQInst<(outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
2954 [(set (v4i32 VECREG:$rT),
2955 (seteq (v4i32 VECREG:$rA), (v4i32 VECREG:$rB)))]>;
2956
2957 def r32 : CEQInst<(outs R32C:$rT), (ins R32C:$rA, R32C:$rB),
2958 [(set R32C:$rT, (seteq R32C:$rA, R32C:$rB))]>;
2959}
2960
2961class CEQIInst<dag OOL, dag IOL, list<dag> pattern> :
2962 RI10Form<0b00111110, OOL, IOL, "ceqi\t$rT, $rA, $val",
2963 ByteOp, pattern>;
2964
2965multiclass CmpEqualWordImm
2966{
2967 def v4i32 : CEQIInst<(outs VECREG:$rT), (ins VECREG:$rA, s10imm:$val),
2968 [(set (v4i32 VECREG:$rT),
2969 (seteq (v4i32 VECREG:$rA),
2970 (v4i32 v4i32SExt16Imm:$val)))]>;
2971
2972 def r32: CEQIInst<(outs R32C:$rT), (ins R32C:$rA, s10imm_i32:$val),
2973 [(set R32C:$rT, (seteq R32C:$rA, i32ImmSExt10:$val))]>;
2974}
2975
2976class CGTBInst<dag OOL, dag IOL, list<dag> pattern> :
2977 RRForm<0b00001010010, OOL, IOL, "cgtb\t$rT, $rA, $rB",
2978 ByteOp, pattern>;
2979
2980multiclass CmpGtrByte
2981{
2982 def v16i8 :
2983 CGTBInst<(outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
2984 [(set (v16i8 VECREG:$rT), (setgt (v8i16 VECREG:$rA),
2985 (v8i16 VECREG:$rB)))]>;
2986
2987 def r8 :
2988 CGTBInst<(outs R8C:$rT), (ins R8C:$rA, R8C:$rB),
2989 [(set R8C:$rT, (setgt R8C:$rA, R8C:$rB))]>;
2990}
2991
2992class CGTBIInst<dag OOL, dag IOL, list<dag> pattern> :
2993 RI10Form<0b01110010, OOL, IOL, "cgtbi\t$rT, $rA, $val",
2994 ByteOp, pattern>;
2995
2996multiclass CmpGtrByteImm
2997{
2998 def v16i8 :
2999 CGTBIInst<(outs VECREG:$rT), (ins VECREG:$rA, s10imm_i8:$val),
3000 [(set (v16i8 VECREG:$rT), (setgt (v16i8 VECREG:$rA),
3001 v16i8SExt8Imm:$val))]>;
3002 def r8:
3003 CGTBIInst<(outs R8C:$rT), (ins R8C:$rA, s10imm_i8:$val),
3004 [(set R8C:$rT, (setgt R8C:$rA, immSExt8:$val))]>;
3005}
3006
3007class CGTHInst<dag OOL, dag IOL, list<dag> pattern> :
3008 RRForm<0b00010010010, OOL, IOL, "cgth\t$rT, $rA, $rB",
3009 ByteOp, pattern>;
3010
3011multiclass CmpGtrHalfword
3012{
3013 def v8i16 : CGTHInst<(outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
3014 [(set (v8i16 VECREG:$rT), (setgt (v8i16 VECREG:$rA),
3015 (v8i16 VECREG:$rB)))]>;
3016
3017 def r16 : CGTHInst<(outs R16C:$rT), (ins R16C:$rA, R16C:$rB),
3018 [(set R16C:$rT, (setgt R16C:$rA, R16C:$rB))]>;
3019}
3020
3021class CGTHIInst<dag OOL, dag IOL, list<dag> pattern> :
3022 RI10Form<0b10110010, OOL, IOL, "cgthi\t$rT, $rA, $val",
3023 ByteOp, pattern>;
3024
3025multiclass CmpGtrHalfwordImm
3026{
3027 def v8i16 : CGTHIInst<(outs VECREG:$rT), (ins VECREG:$rA, s10imm:$val),
3028 [(set (v8i16 VECREG:$rT),
3029 (setgt (v8i16 VECREG:$rA),
3030 (v8i16 v8i16SExt10Imm:$val)))]>;
3031 def r16 : CGTHIInst<(outs R16C:$rT), (ins R16C:$rA, s10imm:$val),
3032 [(set R16C:$rT, (setgt R16C:$rA, i16ImmSExt10:$val))]>;
3033}
3034
3035class CGTInst<dag OOL, dag IOL, list<dag> pattern> :
3036 RRForm<0b00000010010, OOL, IOL, "cgt\t$rT, $rA, $rB",
3037 ByteOp, pattern>;
3038
3039multiclass CmpGtrWord
3040{
3041 def v4i32 : CGTInst<(outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
3042 [(set (v4i32 VECREG:$rT),
3043 (setgt (v4i32 VECREG:$rA), (v4i32 VECREG:$rB)))]>;
3044
3045 def r32 : CGTInst<(outs R32C:$rT), (ins R32C:$rA, R32C:$rB),
3046 [(set R32C:$rT, (setgt R32C:$rA, R32C:$rB))]>;
3047}
3048
3049class CGTIInst<dag OOL, dag IOL, list<dag> pattern> :
3050 RI10Form<0b00110010, OOL, IOL, "cgti\t$rT, $rA, $val",
3051 ByteOp, pattern>;
3052
3053multiclass CmpGtrWordImm
3054{
3055 def v4i32 : CGTIInst<(outs VECREG:$rT), (ins VECREG:$rA, s10imm:$val),
3056 [(set (v4i32 VECREG:$rT),
3057 (setgt (v4i32 VECREG:$rA),
3058 (v4i32 v4i32SExt16Imm:$val)))]>;
3059
3060 def r32: CGTIInst<(outs R32C:$rT), (ins R32C:$rA, s10imm_i32:$val),
3061 [(set R32C:$rT, (setgt R32C:$rA, i32ImmSExt10:$val))]>;
3062}
3063
3064class CLGTBInst<dag OOL, dag IOL, list<dag> pattern> :
3065 RRForm<0b00001011010, OOL, IOL, "cgtb\t$rT, $rA, $rB",
3066 ByteOp, pattern>;
3067
3068multiclass CmpLGtrByte
3069{
3070 def v16i8 :
3071 CLGTBInst<(outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
3072 [(set (v16i8 VECREG:$rT), (setugt (v8i16 VECREG:$rA),
3073 (v8i16 VECREG:$rB)))]>;
3074
3075 def r8 :
3076 CLGTBInst<(outs R8C:$rT), (ins R8C:$rA, R8C:$rB),
3077 [(set R8C:$rT, (setugt R8C:$rA, R8C:$rB))]>;
3078}
3079
3080class CLGTBIInst<dag OOL, dag IOL, list<dag> pattern> :
3081 RI10Form<0b01111010, OOL, IOL, "cgtbi\t$rT, $rA, $val",
3082 ByteOp, pattern>;
3083
3084multiclass CmpLGtrByteImm
3085{
3086 def v16i8 :
3087 CLGTBIInst<(outs VECREG:$rT), (ins VECREG:$rA, s10imm_i8:$val),
3088 [(set (v16i8 VECREG:$rT), (setugt (v16i8 VECREG:$rA),
3089 v16i8SExt8Imm:$val))]>;
3090 def r8:
3091 CLGTBIInst<(outs R8C:$rT), (ins R8C:$rA, s10imm_i8:$val),
3092 [(set R8C:$rT, (setugt R8C:$rA, immSExt8:$val))]>;
3093}
3094
3095class CLGTHInst<dag OOL, dag IOL, list<dag> pattern> :
3096 RRForm<0b00010011010, OOL, IOL, "cgth\t$rT, $rA, $rB",
3097 ByteOp, pattern>;
3098
3099multiclass CmpLGtrHalfword
3100{
3101 def v8i16 : CLGTHInst<(outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
3102 [(set (v8i16 VECREG:$rT), (setugt (v8i16 VECREG:$rA),
3103 (v8i16 VECREG:$rB)))]>;
3104
3105 def r16 : CLGTHInst<(outs R16C:$rT), (ins R16C:$rA, R16C:$rB),
3106 [(set R16C:$rT, (setugt R16C:$rA, R16C:$rB))]>;
3107}
3108
3109class CLGTHIInst<dag OOL, dag IOL, list<dag> pattern> :
3110 RI10Form<0b10111010, OOL, IOL, "cgthi\t$rT, $rA, $val",
3111 ByteOp, pattern>;
3112
3113multiclass CmpLGtrHalfwordImm
3114{
3115 def v8i16 : CLGTHIInst<(outs VECREG:$rT), (ins VECREG:$rA, s10imm:$val),
3116 [(set (v8i16 VECREG:$rT),
3117 (setugt (v8i16 VECREG:$rA),
3118 (v8i16 v8i16SExt10Imm:$val)))]>;
3119 def r16 : CLGTHIInst<(outs R16C:$rT), (ins R16C:$rA, s10imm:$val),
3120 [(set R16C:$rT, (setugt R16C:$rA, i16ImmSExt10:$val))]>;
3121}
3122
3123class CLGTInst<dag OOL, dag IOL, list<dag> pattern> :
3124 RRForm<0b00000011010, OOL, IOL, "cgt\t$rT, $rA, $rB",
3125 ByteOp, pattern>;
3126
3127multiclass CmpLGtrWord
3128{
3129 def v4i32 : CLGTInst<(outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
3130 [(set (v4i32 VECREG:$rT),
3131 (setugt (v4i32 VECREG:$rA), (v4i32 VECREG:$rB)))]>;
3132
3133 def r32 : CLGTInst<(outs R32C:$rT), (ins R32C:$rA, R32C:$rB),
3134 [(set R32C:$rT, (setugt R32C:$rA, R32C:$rB))]>;
3135}
3136
3137class CLGTIInst<dag OOL, dag IOL, list<dag> pattern> :
3138 RI10Form<0b00111010, OOL, IOL, "cgti\t$rT, $rA, $val",
3139 ByteOp, pattern>;
3140
3141multiclass CmpLGtrWordImm
3142{
3143 def v4i32 : CLGTIInst<(outs VECREG:$rT), (ins VECREG:$rA, s10imm:$val),
3144 [(set (v4i32 VECREG:$rT),
3145 (setugt (v4i32 VECREG:$rA),
3146 (v4i32 v4i32SExt16Imm:$val)))]>;
3147
3148 def r32: CLGTIInst<(outs R32C:$rT), (ins R32C:$rA, s10imm_i32:$val),
3149 [(set R32C:$rT, (setugt R32C:$rA, i32ImmSExt10:$val))]>;
3150}
3151
3152defm CEQB : CmpEqualByte;
3153defm CEQBI : CmpEqualByteImm;
3154defm CEQH : CmpEqualHalfword;
3155defm CEQHI : CmpEqualHalfwordImm;
3156defm CEQ : CmpEqualWord;
3157defm CEQI : CmpEqualWordImm;
3158defm CGTB : CmpGtrByte;
3159defm CGTBI : CmpGtrByteImm;
3160defm CGTH : CmpGtrHalfword;
3161defm CGTHI : CmpGtrHalfwordImm;
3162defm CGT : CmpGtrWord;
3163defm CGTI : CmpGtrWordImm;
3164defm CLGTB : CmpLGtrByte;
3165defm CLGTBI : CmpLGtrByteImm;
3166defm CLGTH : CmpLGtrHalfword;
3167defm CLGTHI : CmpLGtrHalfwordImm;
3168defm CLGT : CmpLGtrWord;
3169defm CLGTI : CmpLGtrWordImm;
3170
3171// For SETCC primitives not supported above (setlt, setle, setge, etc.)
3172// define a pattern to generate the right code, as a binary operator
3173// (in a manner of speaking.)
3174
3175class SETCCNegCond<PatFrag cond, RegisterClass rclass, dag pattern>:
3176 Pat<(cond rclass:$rA, rclass:$rB), pattern>;
3177
3178class SETCCBinOpReg<PatFrag cond, RegisterClass rclass,
3179 SPUInstr binop, SPUInstr cmpOp1, SPUInstr cmpOp2>:
3180 Pat<(cond rclass:$rA, rclass:$rB),
3181 (binop (cmpOp1 rclass:$rA, rclass:$rB),
3182 (cmpOp2 rclass:$rA, rclass:$rB))>;
3183
3184class SETCCBinOpImm<PatFrag cond, RegisterClass rclass, PatLeaf immpred,
3185 ValueType immtype,
3186 SPUInstr binop, SPUInstr cmpOp1, SPUInstr cmpOp2>:
3187 Pat<(cond rclass:$rA, (immtype immpred:$imm)),
3188 (binop (cmpOp1 rclass:$rA, (immtype immpred:$imm)),
3189 (cmpOp2 rclass:$rA, (immtype immpred:$imm)))>;
3190
3191def CGTEQBr8: SETCCBinOpReg<setge, R8C, ORr8, CGTBr8, CEQBr8>;
3192def CGTEQBIr8: SETCCBinOpImm<setge, R8C, immSExt8, i8, ORr8, CGTBIr8, CEQBIr8>;
3193def CLTBr8: SETCCBinOpReg<setlt, R8C, NORr8, CGTBr8, CEQBr8>;
3194def CLTBIr8: SETCCBinOpImm<setlt, R8C, immSExt8, i8, NORr8, CGTBIr8, CEQBIr8>;
3195def CLTEQr8: Pat<(setle R8C:$rA, R8C:$rB),
3196 (XORBIr8 (CGTBIr8 R8C:$rA, R8C:$rB), 0xff)>;
3197def CLTEQIr8: Pat<(setle R8C:$rA, immU8:$imm),
3198 (XORBIr8 (CGTBIr8 R8C:$rA, immU8:$imm), 0xff)>;
3199
3200def CGTEQHr16: SETCCBinOpReg<setge, R16C, ORr16, CGTHr16, CEQHr16>;
3201def CGTEQHIr16: SETCCBinOpImm<setge, R16C, i16ImmUns10, i16,
3202 ORr16, CGTHIr16, CEQHIr16>;
3203def CLTEQr16: Pat<(setle R16C:$rA, R16C:$rB),
3204 (XORHIr16 (CGTHIr16 R16C:$rA, R16C:$rB), 0xffff)>;
3205def CLTEQIr16: Pat<(setle R16C:$rA, i16ImmUns10:$imm),
3206 (XORHIr16 (CGTHIr16 R16C:$rA, i16ImmSExt10:$imm), 0xffff)>;
3207
3208
3209def CGTEQHr32: SETCCBinOpReg<setge, R32C, ORr32, CGTr32, CEQr32>;
3210def CGTEQHIr32: SETCCBinOpImm<setge, R32C, i32ImmUns10, i32,
3211 ORr32, CGTIr32, CEQIr32>;
3212def CLTEQr32: Pat<(setle R32C:$rA, R32C:$rB),
3213 (XORIr32 (CGTIr32 R32C:$rA, R32C:$rB), 0xffffffff)>;
3214def CLTEQIr32: Pat<(setle R32C:$rA, i32ImmUns10:$imm),
3215 (XORIr32 (CGTIr32 R32C:$rA, i32ImmSExt10:$imm), 0xffffffff)>;
3216
3217def CLGTEQBr8: SETCCBinOpReg<setuge, R8C, ORr8, CLGTBr8, CEQBr8>;
3218def CLGTEQBIr8: SETCCBinOpImm<setuge, R8C, immSExt8, i8, ORr8, CLGTBIr8, CEQBIr8>;
3219def CLLTBr8: SETCCBinOpReg<setult, R8C, NORr8, CLGTBr8, CEQBr8>;
3220def CLLTBIr8: SETCCBinOpImm<setult, R8C, immSExt8, i8, NORr8, CLGTBIr8, CEQBIr8>;
3221def CLLTEQr8: Pat<(setule R8C:$rA, R8C:$rB),
3222 (XORBIr8 (CLGTBIr8 R8C:$rA, R8C:$rB), 0xff)>;
3223def CLLTEQIr8: Pat<(setule R8C:$rA, immU8:$imm),
3224 (XORBIr8 (CLGTBIr8 R8C:$rA, immU8:$imm), 0xff)>;
3225
3226def CLGTEQHr16: SETCCBinOpReg<setuge, R16C, ORr16, CLGTHr16, CEQHr16>;
3227def CLGTEQHIr16: SETCCBinOpImm<setuge, R16C, i16ImmUns10, i16,
3228 ORr16, CLGTHIr16, CEQHIr16>;
3229def CLLTEQr16: Pat<(setule R16C:$rA, R16C:$rB),
3230 (XORHIr16 (CLGTHIr16 R16C:$rA, R16C:$rB), 0xffff)>;
3231def CLLTEQIr16: Pat<(setule R16C:$rA, i16ImmUns10:$imm),
3232 (XORHIr16 (CLGTHIr16 R16C:$rA, i16ImmSExt10:$imm), 0xffff)>;
3233
3234
3235def CLGTEQHr32: SETCCBinOpReg<setuge, R32C, ORr32, CLGTr32, CEQr32>;
3236def CLGTEQHIr32: SETCCBinOpImm<setuge, R32C, i32ImmUns10, i32,
3237 ORr32, CLGTIr32, CEQIr32>;
3238def CLLTEQr32: Pat<(setule R32C:$rA, R32C:$rB),
3239 (XORIr32 (CLGTIr32 R32C:$rA, R32C:$rB), 0xffffffff)>;
3240def CLLTEQIr32: Pat<(setule R32C:$rA, i32ImmUns10:$imm),
3241 (XORIr32 (CLGTIr32 R32C:$rA, i32ImmSExt10:$imm), 0xffffffff)>;
3242
3243//-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~-~
Scott Michel8b6b4202007-12-04 22:35:58 +00003244
3245let isCall = 1,
3246 // All calls clobber the non-callee-saved registers:
3247 Defs = [R0, R1, R2, R3, R4, R5, R6, R7, R8, R9,
3248 R10,R11,R12,R13,R14,R15,R16,R17,R18,R19,
3249 R20,R21,R22,R23,R24,R25,R26,R27,R28,R29,
3250 R30,R31,R32,R33,R34,R35,R36,R37,R38,R39,
3251 R40,R41,R42,R43,R44,R45,R46,R47,R48,R49,
3252 R50,R51,R52,R53,R54,R55,R56,R57,R58,R59,
3253 R60,R61,R62,R63,R64,R65,R66,R67,R68,R69,
3254 R70,R71,R72,R73,R74,R75,R76,R77,R78,R79],
3255 // All of these instructions use $lr (aka $0)
3256 Uses = [R0] in {
3257 // Branch relative and set link: Used if we actually know that the target
3258 // is within [-32768, 32767] bytes of the target
3259 def BRSL:
3260 BranchSetLink<0b011001100, (outs), (ins relcalltarget:$func, variable_ops),
3261 "brsl\t$$lr, $func",
3262 [(SPUcall (SPUpcrel tglobaladdr:$func, 0))]>;
3263
3264 // Branch absolute and set link: Used if we actually know that the target
3265 // is an absolute address
3266 def BRASL:
3267 BranchSetLink<0b011001100, (outs), (ins calltarget:$func, variable_ops),
3268 "brasl\t$$lr, $func",
Scott Micheldbac4cf2008-01-11 02:53:15 +00003269 [(SPUcall (SPUaform tglobaladdr:$func, 0))]>;
Scott Michel8b6b4202007-12-04 22:35:58 +00003270
3271 // Branch indirect and set link if external data. These instructions are not
3272 // actually generated, matched by an intrinsic:
3273 def BISLED_00: BISLEDForm<0b11, "bisled\t$$lr, $func", [/* empty pattern */]>;
3274 def BISLED_E0: BISLEDForm<0b10, "bisled\t$$lr, $func", [/* empty pattern */]>;
3275 def BISLED_0D: BISLEDForm<0b01, "bisled\t$$lr, $func", [/* empty pattern */]>;
3276 def BISLED_ED: BISLEDForm<0b00, "bisled\t$$lr, $func", [/* empty pattern */]>;
3277
3278 // Branch indirect and set link. This is the "X-form" address version of a
3279 // function call
3280 def BISL:
3281 BIForm<0b10010101100, "bisl\t$$lr, $func", [(SPUcall R32C:$func)]>;
3282}
3283
3284// Unconditional branches:
3285let isBranch = 1, isTerminator = 1, hasCtrlDep = 1, isBarrier = 1 in {
3286 def BR :
3287 UncondBranch<0b001001100, (outs), (ins brtarget:$dest),
3288 "br\t$dest",
3289 [(br bb:$dest)]>;
3290
3291 // Unconditional, absolute address branch
3292 def BRA:
3293 UncondBranch<0b001100000, (outs), (ins brtarget:$dest),
3294 "bra\t$dest",
3295 [/* no pattern */]>;
3296
3297 // Indirect branch
3298 def BI:
3299 BIForm<0b00010101100, "bi\t$func", [(brind R32C:$func)]>;
3300
3301 // Various branches:
3302 def BRNZ:
3303 RI16Form<0b010000100, (outs), (ins R32C:$rCond, brtarget:$dest),
3304 "brnz\t$rCond,$dest",
3305 BranchResolv,
3306 [(brcond R32C:$rCond, bb:$dest)]>;
3307
3308 def BRZ:
3309 RI16Form<0b000000100, (outs), (ins R32C:$rT, brtarget:$dest),
3310 "brz\t$rT,$dest",
3311 BranchResolv,
3312 [/* no pattern */]>;
3313
3314 def BRHNZ:
3315 RI16Form<0b011000100, (outs), (ins R16C:$rCond, brtarget:$dest),
3316 "brhnz\t$rCond,$dest",
3317 BranchResolv,
3318 [(brcond R16C:$rCond, bb:$dest)]>;
3319
3320 def BRHZ:
3321 RI16Form<0b001000100, (outs), (ins R16C:$rT, brtarget:$dest),
3322 "brhz\t$rT,$dest",
3323 BranchResolv,
3324 [/* no pattern */]>;
3325
3326/*
3327 def BINZ:
3328 BICondForm<0b10010100100, "binz\t$rA, $func",
3329 [(SPUbinz R32C:$rA, R32C:$func)]>;
3330
3331 def BIZ:
3332 BICondForm<0b00010100100, "biz\t$rA, $func",
3333 [(SPUbiz R32C:$rA, R32C:$func)]>;
3334*/
3335}
3336
Scott Michel394e26d2008-01-17 20:38:41 +00003337//===----------------------------------------------------------------------===//
Scott Michelf9f42e62008-01-29 02:16:57 +00003338// setcc and brcond patterns:
Scott Michel394e26d2008-01-17 20:38:41 +00003339//===----------------------------------------------------------------------===//
Scott Michelf9f42e62008-01-29 02:16:57 +00003340
Scott Michel8b6b4202007-12-04 22:35:58 +00003341def : Pat<(brcond (i16 (seteq R16C:$rA, 0)), bb:$dest),
3342 (BRHZ R16C:$rA, bb:$dest)>;
Scott Michelf9f42e62008-01-29 02:16:57 +00003343def : Pat<(brcond (i16 (setne R16C:$rA, 0)), bb:$dest),
3344 (BRHNZ R16C:$rA, bb:$dest)>;
Scott Michel97872d32008-02-23 18:41:37 +00003345
3346def : Pat<(brcond (i32 (seteq R32C:$rA, 0)), bb:$dest),
3347 (BRZ R32C:$rA, bb:$dest)>;
Scott Michel8b6b4202007-12-04 22:35:58 +00003348def : Pat<(brcond (i32 (setne R32C:$rA, 0)), bb:$dest),
Scott Michel394e26d2008-01-17 20:38:41 +00003349 (BRNZ R32C:$rA, bb:$dest)>;
Scott Michel8b6b4202007-12-04 22:35:58 +00003350
Scott Michel97872d32008-02-23 18:41:37 +00003351multiclass BranchCondEQ<PatFrag cond, SPUInstr brinst16, SPUInstr brinst32>
3352{
3353 def r16imm: Pat<(brcond (i16 (cond R16C:$rA, i16ImmSExt10:$val)), bb:$dest),
3354 (brinst16 (CEQHIr16 R16C:$rA, i16ImmSExt10:$val), bb:$dest)>;
Scott Michelf9f42e62008-01-29 02:16:57 +00003355
Scott Michel97872d32008-02-23 18:41:37 +00003356 def r16 : Pat<(brcond (i16 (cond R16C:$rA, R16C:$rB)), bb:$dest),
3357 (brinst16 (CEQHr16 R16C:$rA, R16:$rB), bb:$dest)>;
3358
3359 def r32imm : Pat<(brcond (i32 (cond R32C:$rA, i32ImmSExt10:$val)), bb:$dest),
3360 (brinst32 (CEQIr32 R32C:$rA, i32ImmSExt10:$val), bb:$dest)>;
3361
3362 def r32 : Pat<(brcond (i32 (cond R32C:$rA, R32C:$rB)), bb:$dest),
3363 (brinst32 (CEQr32 R32C:$rA, R32C:$rB), bb:$dest)>;
3364}
3365
3366defm BRCONDeq : BranchCondEQ<seteq, BRHZ, BRZ>;
3367defm BRCONDne : BranchCondEQ<setne, BRHNZ, BRNZ>;
3368
3369multiclass BranchCondLGT<PatFrag cond, SPUInstr brinst16, SPUInstr brinst32>
3370{
3371 def r16imm : Pat<(brcond (i16 (cond R16C:$rA, i16ImmSExt10:$val)), bb:$dest),
3372 (brinst16 (CLGTHIr16 R16C:$rA, i16ImmSExt10:$val), bb:$dest)>;
3373
3374 def r16 : Pat<(brcond (i16 (cond R16C:$rA, R16C:$rB)), bb:$dest),
3375 (brinst16 (CLGTHr16 R16C:$rA, R16:$rB), bb:$dest)>;
3376
3377 def r32imm : Pat<(brcond (i32 (cond R32C:$rA, i32ImmSExt10:$val)), bb:$dest),
3378 (brinst32 (CLGTIr32 R32C:$rA, i32ImmSExt10:$val), bb:$dest)>;
3379
3380 def r32 : Pat<(brcond (i32 (cond R32C:$rA, R32C:$rB)), bb:$dest),
3381 (brinst32 (CLGTr32 R32C:$rA, R32C:$rB), bb:$dest)>;
3382}
3383
3384defm BRCONDugt : BranchCondLGT<setugt, BRHNZ, BRNZ>;
3385defm BRCONDule : BranchCondLGT<setule, BRHZ, BRZ>;
3386
3387multiclass BranchCondLGTEQ<PatFrag cond, SPUInstr orinst16, SPUInstr brinst16,
3388 SPUInstr orinst32, SPUInstr brinst32>
3389{
3390 def r16imm: Pat<(brcond (i16 (cond R16C:$rA, i16ImmSExt10:$val)), bb:$dest),
3391 (brinst16 (orinst16 (CLGTHIr16 R16C:$rA, i16ImmSExt10:$val),
3392 (CEQHIr16 R16C:$rA, i16ImmSExt10:$val)),
3393 bb:$dest)>;
3394
3395 def r16: Pat<(brcond (i16 (cond R16C:$rA, R16C:$rB)), bb:$dest),
3396 (brinst16 (orinst16 (CLGTHr16 R16C:$rA, R16:$rB),
3397 (CEQHr16 R16C:$rA, R16:$rB)),
3398 bb:$dest)>;
3399
3400 def r32imm : Pat<(brcond (i32 (cond R32C:$rA, i32ImmSExt10:$val)), bb:$dest),
3401 (brinst32 (orinst32 (CLGTIr32 R32C:$rA, i32ImmSExt10:$val),
3402 (CEQIr32 R32C:$rA, i32ImmSExt10:$val)),
3403 bb:$dest)>;
3404
3405 def r32 : Pat<(brcond (i32 (cond R32C:$rA, R32C:$rB)), bb:$dest),
3406 (brinst32 (orinst32 (CLGTr32 R32C:$rA, R32C:$rB),
3407 (CEQr32 R32C:$rA, R32C:$rB)),
3408 bb:$dest)>;
3409}
3410
3411defm BRCONDuge : BranchCondLGTEQ<setuge, ORr16, BRHNZ, ORr32, BRNZ>;
3412defm BRCONDult : BranchCondLGTEQ<setult, ORr16, BRHZ, ORr32, BRZ>;
3413
3414multiclass BranchCondGT<PatFrag cond, SPUInstr brinst16, SPUInstr brinst32>
3415{
3416 def r16imm : Pat<(brcond (i16 (cond R16C:$rA, i16ImmSExt10:$val)), bb:$dest),
3417 (brinst16 (CGTHIr16 R16C:$rA, i16ImmSExt10:$val), bb:$dest)>;
3418
3419 def r16 : Pat<(brcond (i16 (cond R16C:$rA, R16C:$rB)), bb:$dest),
3420 (brinst16 (CGTHr16 R16C:$rA, R16:$rB), bb:$dest)>;
3421
3422 def r32imm : Pat<(brcond (i32 (cond R32C:$rA, i32ImmSExt10:$val)), bb:$dest),
3423 (brinst32 (CGTIr32 R32C:$rA, i32ImmSExt10:$val), bb:$dest)>;
3424
3425 def r32 : Pat<(brcond (i32 (cond R32C:$rA, R32C:$rB)), bb:$dest),
3426 (brinst32 (CGTr32 R32C:$rA, R32C:$rB), bb:$dest)>;
3427}
3428
3429defm BRCONDgt : BranchCondGT<setgt, BRHNZ, BRNZ>;
3430defm BRCONDle : BranchCondGT<setle, BRHZ, BRZ>;
3431
3432multiclass BranchCondGTEQ<PatFrag cond, SPUInstr orinst16, SPUInstr brinst16,
3433 SPUInstr orinst32, SPUInstr brinst32>
3434{
3435 def r16imm: Pat<(brcond (i16 (cond R16C:$rA, i16ImmSExt10:$val)), bb:$dest),
3436 (brinst16 (orinst16 (CGTHIr16 R16C:$rA, i16ImmSExt10:$val),
3437 (CEQHIr16 R16C:$rA, i16ImmSExt10:$val)),
3438 bb:$dest)>;
3439
3440 def r16: Pat<(brcond (i16 (cond R16C:$rA, R16C:$rB)), bb:$dest),
3441 (brinst16 (orinst16 (CGTHr16 R16C:$rA, R16:$rB),
3442 (CEQHr16 R16C:$rA, R16:$rB)),
3443 bb:$dest)>;
3444
3445 def r32imm : Pat<(brcond (i32 (cond R32C:$rA, i32ImmSExt10:$val)), bb:$dest),
3446 (brinst32 (orinst32 (CGTIr32 R32C:$rA, i32ImmSExt10:$val),
3447 (CEQIr32 R32C:$rA, i32ImmSExt10:$val)),
3448 bb:$dest)>;
3449
3450 def r32 : Pat<(brcond (i32 (cond R32C:$rA, R32C:$rB)), bb:$dest),
3451 (brinst32 (orinst32 (CGTr32 R32C:$rA, R32C:$rB),
3452 (CEQr32 R32C:$rA, R32C:$rB)),
3453 bb:$dest)>;
3454}
3455
3456defm BRCONDge : BranchCondGTEQ<setge, ORr16, BRHNZ, ORr32, BRNZ>;
3457defm BRCONDlt : BranchCondGTEQ<setlt, ORr16, BRHZ, ORr32, BRZ>;
Scott Michelf9f42e62008-01-29 02:16:57 +00003458
Scott Michel8b6b4202007-12-04 22:35:58 +00003459let isTerminator = 1, isBarrier = 1 in {
3460 let isReturn = 1 in {
3461 def RET:
3462 RETForm<"bi\t$$lr", [(retflag)]>;
3463 }
3464}
3465
3466//===----------------------------------------------------------------------===//
Scott Michel8b6b4202007-12-04 22:35:58 +00003467// Single precision floating point instructions
3468//===----------------------------------------------------------------------===//
3469
3470def FAv4f32:
3471 RRForm<0b00100011010, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
3472 "fa\t$rT, $rA, $rB", SPrecFP,
3473 [(set (v4f32 VECREG:$rT), (fadd (v4f32 VECREG:$rA), (v4f32 VECREG:$rB)))]>;
3474
3475def FAf32 :
3476 RRForm<0b00100011010, (outs R32FP:$rT), (ins R32FP:$rA, R32FP:$rB),
3477 "fa\t$rT, $rA, $rB", SPrecFP,
3478 [(set R32FP:$rT, (fadd R32FP:$rA, R32FP:$rB))]>;
3479
3480def FSv4f32:
3481 RRForm<0b00100011010, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
3482 "fs\t$rT, $rA, $rB", SPrecFP,
3483 [(set (v4f32 VECREG:$rT), (fsub (v4f32 VECREG:$rA), (v4f32 VECREG:$rB)))]>;
3484
3485def FSf32 :
3486 RRForm<0b10100011010, (outs R32FP:$rT), (ins R32FP:$rA, R32FP:$rB),
3487 "fs\t$rT, $rA, $rB", SPrecFP,
3488 [(set R32FP:$rT, (fsub R32FP:$rA, R32FP:$rB))]>;
3489
3490// Floating point reciprocal estimate
3491def FREv4f32 :
3492 RRForm_1<0b00011101100, (outs VECREG:$rT), (ins VECREG:$rA),
3493 "frest\t$rT, $rA", SPrecFP,
3494 [(set (v4f32 VECREG:$rT), (SPUreciprocalEst (v4f32 VECREG:$rA)))]>;
3495
3496def FREf32 :
3497 RRForm_1<0b00011101100, (outs R32FP:$rT), (ins R32FP:$rA),
3498 "frest\t$rT, $rA", SPrecFP,
3499 [(set R32FP:$rT, (SPUreciprocalEst R32FP:$rA))]>;
3500
3501// Floating point interpolate (used in conjunction with reciprocal estimate)
3502def FIv4f32 :
3503 RRForm<0b00101011110, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
3504 "fi\t$rT, $rA, $rB", SPrecFP,
3505 [(set (v4f32 VECREG:$rT), (SPUinterpolate (v4f32 VECREG:$rA),
3506 (v4f32 VECREG:$rB)))]>;
3507
3508def FIf32 :
3509 RRForm<0b00101011110, (outs R32FP:$rT), (ins R32FP:$rA, R32FP:$rB),
3510 "fi\t$rT, $rA, $rB", SPrecFP,
3511 [(set R32FP:$rT, (SPUinterpolate R32FP:$rA, R32FP:$rB))]>;
3512
3513// Floating Compare Equal
3514def FCEQf32 :
3515 RRForm<0b01000011110, (outs R32C:$rT), (ins R32FP:$rA, R32FP:$rB),
3516 "fceq\t$rT, $rA, $rB", SPrecFP,
3517 [(set R32C:$rT, (setoeq R32FP:$rA, R32FP:$rB))]>;
3518
3519def FCMEQf32 :
3520 RRForm<0b01010011110, (outs R32C:$rT), (ins R32FP:$rA, R32FP:$rB),
3521 "fcmeq\t$rT, $rA, $rB", SPrecFP,
3522 [(set R32C:$rT, (setoeq (fabs R32FP:$rA), (fabs R32FP:$rB)))]>;
3523
3524def FCGTf32 :
3525 RRForm<0b01000011010, (outs R32C:$rT), (ins R32FP:$rA, R32FP:$rB),
3526 "fcgt\t$rT, $rA, $rB", SPrecFP,
3527 [(set R32C:$rT, (setogt R32FP:$rA, R32FP:$rB))]>;
3528
3529def FCMGTf32 :
3530 RRForm<0b01010011010, (outs R32C:$rT), (ins R32FP:$rA, R32FP:$rB),
3531 "fcmgt\t$rT, $rA, $rB", SPrecFP,
3532 [(set R32C:$rT, (setogt (fabs R32FP:$rA), (fabs R32FP:$rB)))]>;
3533
3534// FP Status and Control Register Write
3535// Why isn't rT a don't care in the ISA?
3536// Should we create a special RRForm_3 for this guy and zero out the rT?
3537def FSCRWf32 :
3538 RRForm_1<0b01011101110, (outs R32FP:$rT), (ins R32FP:$rA),
3539 "fscrwr\t$rA", SPrecFP,
3540 [/* This instruction requires an intrinsic. Note: rT is unused. */]>;
3541
3542// FP Status and Control Register Read
3543def FSCRRf32 :
3544 RRForm_2<0b01011101110, (outs R32FP:$rT), (ins),
3545 "fscrrd\t$rT", SPrecFP,
3546 [/* This instruction requires an intrinsic */]>;
3547
3548// llvm instruction space
3549// How do these map onto cell instructions?
3550// fdiv rA rB
3551// frest rC rB # c = 1/b (both lines)
3552// fi rC rB rC
3553// fm rD rA rC # d = a * 1/b
3554// fnms rB rD rB rA # b = - (d * b - a) --should == 0 in a perfect world
3555// fma rB rB rC rD # b = b * c + d
3556// = -(d *b -a) * c + d
3557// = a * c - c ( a *b *c - a)
3558
3559// fcopysign (???)
3560
3561// Library calls:
3562// These llvm instructions will actually map to library calls.
3563// All that's needed, then, is to check that the appropriate library is
3564// imported and do a brsl to the proper function name.
3565// frem # fmod(x, y): x - (x/y) * y
3566// (Note: fmod(double, double), fmodf(float,float)
3567// fsqrt?
3568// fsin?
3569// fcos?
3570// Unimplemented SPU instruction space
3571// floating reciprocal absolute square root estimate (frsqest)
3572
3573// The following are probably just intrinsics
3574// status and control register write
3575// status and control register read
3576
3577//--------------------------------------
3578// Floating point multiply instructions
3579//--------------------------------------
3580
3581def FMv4f32:
3582 RRForm<0b00100011010, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
3583 "fm\t$rT, $rA, $rB", SPrecFP,
3584 [(set (v4f32 VECREG:$rT), (fmul (v4f32 VECREG:$rA),
3585 (v4f32 VECREG:$rB)))]>;
3586
3587def FMf32 :
3588 RRForm<0b01100011010, (outs R32FP:$rT), (ins R32FP:$rA, R32FP:$rB),
3589 "fm\t$rT, $rA, $rB", SPrecFP,
3590 [(set R32FP:$rT, (fmul R32FP:$rA, R32FP:$rB))]>;
3591
3592// Floating point multiply and add
3593// e.g. d = c + (a * b)
3594def FMAv4f32:
3595 RRRForm<0b0111, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB, VECREG:$rC),
3596 "fma\t$rT, $rA, $rB, $rC", SPrecFP,
3597 [(set (v4f32 VECREG:$rT),
3598 (fadd (v4f32 VECREG:$rC),
3599 (fmul (v4f32 VECREG:$rA), (v4f32 VECREG:$rB))))]>;
3600
3601def FMAf32:
3602 RRRForm<0b0111, (outs R32FP:$rT), (ins R32FP:$rA, R32FP:$rB, R32FP:$rC),
3603 "fma\t$rT, $rA, $rB, $rC", SPrecFP,
3604 [(set R32FP:$rT, (fadd R32FP:$rC, (fmul R32FP:$rA, R32FP:$rB)))]>;
3605
3606// FP multiply and subtract
3607// Subtracts value in rC from product
3608// res = a * b - c
3609def FMSv4f32 :
3610 RRRForm<0b0111, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB, VECREG:$rC),
3611 "fms\t$rT, $rA, $rB, $rC", SPrecFP,
3612 [(set (v4f32 VECREG:$rT),
3613 (fsub (fmul (v4f32 VECREG:$rA), (v4f32 VECREG:$rB)),
3614 (v4f32 VECREG:$rC)))]>;
3615
3616def FMSf32 :
3617 RRRForm<0b0111, (outs R32FP:$rT), (ins R32FP:$rA, R32FP:$rB, R32FP:$rC),
3618 "fms\t$rT, $rA, $rB, $rC", SPrecFP,
3619 [(set R32FP:$rT,
3620 (fsub (fmul R32FP:$rA, R32FP:$rB), R32FP:$rC))]>;
3621
3622// Floating Negative Mulitply and Subtract
3623// Subtracts product from value in rC
3624// res = fneg(fms a b c)
3625// = - (a * b - c)
3626// = c - a * b
3627// NOTE: subtraction order
3628// fsub a b = a - b
3629// fs a b = b - a?
3630def FNMSf32 :
3631 RRRForm<0b1101, (outs R32FP:$rT), (ins R32FP:$rA, R32FP:$rB, R32FP:$rC),
3632 "fnms\t$rT, $rA, $rB, $rC", SPrecFP,
3633 [(set R32FP:$rT, (fsub R32FP:$rC, (fmul R32FP:$rA, R32FP:$rB)))]>;
3634
3635def FNMSv4f32 :
3636 RRRForm<0b1101, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB, VECREG:$rC),
3637 "fnms\t$rT, $rA, $rB, $rC", SPrecFP,
3638 [(set (v4f32 VECREG:$rT),
3639 (fsub (v4f32 VECREG:$rC),
3640 (fmul (v4f32 VECREG:$rA),
3641 (v4f32 VECREG:$rB))))]>;
3642
3643//--------------------------------------
3644// Floating Point Conversions
3645// Signed conversions:
3646def CSiFv4f32:
3647 CVTIntFPForm<0b0101101110, (outs VECREG:$rT), (ins VECREG:$rA),
3648 "csflt\t$rT, $rA, 0", SPrecFP,
3649 [(set (v4f32 VECREG:$rT), (sint_to_fp (v4i32 VECREG:$rA)))]>;
3650
3651// Convert signed integer to floating point
3652def CSiFf32 :
3653 CVTIntFPForm<0b0101101110, (outs R32FP:$rT), (ins R32C:$rA),
3654 "csflt\t$rT, $rA, 0", SPrecFP,
3655 [(set R32FP:$rT, (sint_to_fp R32C:$rA))]>;
3656
3657// Convert unsigned into to float
3658def CUiFv4f32 :
3659 CVTIntFPForm<0b1101101110, (outs VECREG:$rT), (ins VECREG:$rA),
3660 "cuflt\t$rT, $rA, 0", SPrecFP,
3661 [(set (v4f32 VECREG:$rT), (uint_to_fp (v4i32 VECREG:$rA)))]>;
3662
3663def CUiFf32 :
3664 CVTIntFPForm<0b1101101110, (outs R32FP:$rT), (ins R32C:$rA),
3665 "cuflt\t$rT, $rA, 0", SPrecFP,
3666 [(set R32FP:$rT, (uint_to_fp R32C:$rA))]>;
3667
3668// Convert float to unsigned int
3669// Assume that scale = 0
3670
3671def CFUiv4f32 :
3672 CVTIntFPForm<0b1101101110, (outs VECREG:$rT), (ins VECREG:$rA),
3673 "cfltu\t$rT, $rA, 0", SPrecFP,
3674 [(set (v4i32 VECREG:$rT), (fp_to_uint (v4f32 VECREG:$rA)))]>;
3675
3676def CFUif32 :
3677 CVTIntFPForm<0b1101101110, (outs R32C:$rT), (ins R32FP:$rA),
3678 "cfltu\t$rT, $rA, 0", SPrecFP,
3679 [(set R32C:$rT, (fp_to_uint R32FP:$rA))]>;
3680
3681// Convert float to signed int
3682// Assume that scale = 0
3683
3684def CFSiv4f32 :
3685 CVTIntFPForm<0b1101101110, (outs VECREG:$rT), (ins VECREG:$rA),
3686 "cflts\t$rT, $rA, 0", SPrecFP,
3687 [(set (v4i32 VECREG:$rT), (fp_to_sint (v4f32 VECREG:$rA)))]>;
3688
3689def CFSif32 :
3690 CVTIntFPForm<0b1101101110, (outs R32C:$rT), (ins R32FP:$rA),
3691 "cflts\t$rT, $rA, 0", SPrecFP,
3692 [(set R32C:$rT, (fp_to_sint R32FP:$rA))]>;
3693
3694//===----------------------------------------------------------------------==//
3695// Single<->Double precision conversions
3696//===----------------------------------------------------------------------==//
3697
3698// NOTE: We use "vec" name suffix here to avoid confusion (e.g. input is a
3699// v4f32, output is v2f64--which goes in the name?)
3700
3701// Floating point extend single to double
3702// NOTE: Not sure if passing in v4f32 to FESDvec is correct since it
3703// operates on two double-word slots (i.e. 1st and 3rd fp numbers
3704// are ignored).
3705def FESDvec :
3706 RRForm_1<0b00011101110, (outs VECREG:$rT), (ins VECREG:$rA),
3707 "fesd\t$rT, $rA", SPrecFP,
3708 [(set (v2f64 VECREG:$rT), (fextend (v4f32 VECREG:$rA)))]>;
3709
3710def FESDf32 :
3711 RRForm_1<0b00011101110, (outs R64FP:$rT), (ins R32FP:$rA),
3712 "fesd\t$rT, $rA", SPrecFP,
3713 [(set R64FP:$rT, (fextend R32FP:$rA))]>;
3714
3715// Floating point round double to single
3716//def FRDSvec :
3717// RRForm_1<0b10011101110, (outs VECREG:$rT), (ins VECREG:$rA),
3718// "frds\t$rT, $rA,", SPrecFP,
3719// [(set (v4f32 R32FP:$rT), (fround (v2f64 R64FP:$rA)))]>;
3720
3721def FRDSf64 :
3722 RRForm_1<0b10011101110, (outs R32FP:$rT), (ins R64FP:$rA),
3723 "frds\t$rT, $rA", SPrecFP,
3724 [(set R32FP:$rT, (fround R64FP:$rA))]>;
3725
3726//ToDo include anyextend?
3727
3728//===----------------------------------------------------------------------==//
3729// Double precision floating point instructions
3730//===----------------------------------------------------------------------==//
3731def FAf64 :
3732 RRForm<0b00110011010, (outs R64FP:$rT), (ins R64FP:$rA, R64FP:$rB),
3733 "dfa\t$rT, $rA, $rB", DPrecFP,
3734 [(set R64FP:$rT, (fadd R64FP:$rA, R64FP:$rB))]>;
3735
3736def FAv2f64 :
3737 RRForm<0b00110011010, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
3738 "dfa\t$rT, $rA, $rB", DPrecFP,
3739 [(set (v2f64 VECREG:$rT), (fadd (v2f64 VECREG:$rA), (v2f64 VECREG:$rB)))]>;
3740
3741def FSf64 :
3742 RRForm<0b10100011010, (outs R64FP:$rT), (ins R64FP:$rA, R64FP:$rB),
3743 "dfs\t$rT, $rA, $rB", DPrecFP,
3744 [(set R64FP:$rT, (fsub R64FP:$rA, R64FP:$rB))]>;
3745
3746def FSv2f64 :
3747 RRForm<0b10100011010, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
3748 "dfs\t$rT, $rA, $rB", DPrecFP,
3749 [(set (v2f64 VECREG:$rT),
3750 (fsub (v2f64 VECREG:$rA), (v2f64 VECREG:$rB)))]>;
3751
3752def FMf64 :
3753 RRForm<0b01100011010, (outs R64FP:$rT), (ins R64FP:$rA, R64FP:$rB),
3754 "dfm\t$rT, $rA, $rB", DPrecFP,
3755 [(set R64FP:$rT, (fmul R64FP:$rA, R64FP:$rB))]>;
3756
3757def FMv2f64:
3758 RRForm<0b00100011010, (outs VECREG:$rT), (ins VECREG:$rA, VECREG:$rB),
3759 "dfm\t$rT, $rA, $rB", DPrecFP,
3760 [(set (v2f64 VECREG:$rT),
3761 (fmul (v2f64 VECREG:$rA), (v2f64 VECREG:$rB)))]>;
3762
3763def FMAf64:
3764 RRForm<0b00111010110, (outs R64FP:$rT),
3765 (ins R64FP:$rA, R64FP:$rB, R64FP:$rC),
3766 "dfma\t$rT, $rA, $rB", DPrecFP,
3767 [(set R64FP:$rT, (fadd R64FP:$rC, (fmul R64FP:$rA, R64FP:$rB)))]>,
3768 RegConstraint<"$rC = $rT">,
3769 NoEncode<"$rC">;
3770
3771def FMAv2f64:
3772 RRForm<0b00111010110, (outs VECREG:$rT),
3773 (ins VECREG:$rA, VECREG:$rB, VECREG:$rC),
3774 "dfma\t$rT, $rA, $rB", DPrecFP,
3775 [(set (v2f64 VECREG:$rT),
3776 (fadd (v2f64 VECREG:$rC),
3777 (fmul (v2f64 VECREG:$rA), (v2f64 VECREG:$rB))))]>,
3778 RegConstraint<"$rC = $rT">,
3779 NoEncode<"$rC">;
3780
3781def FMSf64 :
3782 RRForm<0b10111010110, (outs R64FP:$rT),
3783 (ins R64FP:$rA, R64FP:$rB, R64FP:$rC),
3784 "dfms\t$rT, $rA, $rB", DPrecFP,
3785 [(set R64FP:$rT, (fsub (fmul R64FP:$rA, R64FP:$rB), R64FP:$rC))]>,
3786 RegConstraint<"$rC = $rT">,
3787 NoEncode<"$rC">;
3788
3789def FMSv2f64 :
3790 RRForm<0b10111010110, (outs VECREG:$rT),
3791 (ins VECREG:$rA, VECREG:$rB, VECREG:$rC),
3792 "dfms\t$rT, $rA, $rB", DPrecFP,
3793 [(set (v2f64 VECREG:$rT),
3794 (fsub (fmul (v2f64 VECREG:$rA), (v2f64 VECREG:$rB)),
3795 (v2f64 VECREG:$rC)))]>;
3796
3797// FNMS: - (a * b - c)
3798// - (a * b) + c => c - (a * b)
3799def FNMSf64 :
3800 RRForm<0b01111010110, (outs R64FP:$rT),
3801 (ins R64FP:$rA, R64FP:$rB, R64FP:$rC),
3802 "dfnms\t$rT, $rA, $rB", DPrecFP,
3803 [(set R64FP:$rT, (fsub R64FP:$rC, (fmul R64FP:$rA, R64FP:$rB)))]>,
3804 RegConstraint<"$rC = $rT">,
3805 NoEncode<"$rC">;
3806
3807def : Pat<(fneg (fsub (fmul R64FP:$rA, R64FP:$rB), R64FP:$rC)),
3808 (FNMSf64 R64FP:$rA, R64FP:$rB, R64FP:$rC)>;
3809
3810def FNMSv2f64 :
3811 RRForm<0b01111010110, (outs VECREG:$rT),
3812 (ins VECREG:$rA, VECREG:$rB, VECREG:$rC),
3813 "dfnms\t$rT, $rA, $rB", DPrecFP,
3814 [(set (v2f64 VECREG:$rT),
3815 (fsub (v2f64 VECREG:$rC),
3816 (fmul (v2f64 VECREG:$rA),
3817 (v2f64 VECREG:$rB))))]>,
3818 RegConstraint<"$rC = $rT">,
3819 NoEncode<"$rC">;
3820
3821def : Pat<(fneg (fsub (fmul (v2f64 VECREG:$rA), (v2f64 VECREG:$rB)),
3822 (v2f64 VECREG:$rC))),
3823 (FNMSv2f64 VECREG:$rA, VECREG:$rB, VECREG:$rC)>;
3824
3825// - (a * b + c)
3826// - (a * b) - c
3827def FNMAf64 :
3828 RRForm<0b11111010110, (outs R64FP:$rT),
3829 (ins R64FP:$rA, R64FP:$rB, R64FP:$rC),
3830 "dfnma\t$rT, $rA, $rB", DPrecFP,
3831 [(set R64FP:$rT, (fneg (fadd R64FP:$rC, (fmul R64FP:$rA, R64FP:$rB))))]>,
3832 RegConstraint<"$rC = $rT">,
3833 NoEncode<"$rC">;
3834
3835def FNMAv2f64 :
3836 RRForm<0b11111010110, (outs VECREG:$rT),
3837 (ins VECREG:$rA, VECREG:$rB, VECREG:$rC),
3838 "dfnma\t$rT, $rA, $rB", DPrecFP,
3839 [(set (v2f64 VECREG:$rT),
3840 (fneg (fadd (v2f64 VECREG:$rC),
3841 (fmul (v2f64 VECREG:$rA),
3842 (v2f64 VECREG:$rB)))))]>,
3843 RegConstraint<"$rC = $rT">,
3844 NoEncode<"$rC">;
3845
3846//===----------------------------------------------------------------------==//
3847// Floating point negation and absolute value
3848//===----------------------------------------------------------------------==//
3849
3850def : Pat<(fneg (v4f32 VECREG:$rA)),
3851 (XORfnegvec (v4f32 VECREG:$rA),
3852 (v4f32 (ILHUv4i32 0x8000)))>;
3853
3854def : Pat<(fneg R32FP:$rA),
3855 (XORfneg32 R32FP:$rA, (ILHUr32 0x8000))>;
3856
3857def : Pat<(fneg (v2f64 VECREG:$rA)),
3858 (XORfnegvec (v2f64 VECREG:$rA),
3859 (v2f64 (ANDBIv16i8 (FSMBIv16i8 0x8080), 0x80)))>;
3860
3861def : Pat<(fneg R64FP:$rA),
3862 (XORfneg64 R64FP:$rA,
3863 (ANDBIv16i8 (FSMBIv16i8 0x8080), 0x80))>;
3864
3865// Floating point absolute value
3866
3867def : Pat<(fabs R32FP:$rA),
3868 (ANDfabs32 R32FP:$rA, (IOHLr32 (ILHUr32 0x7fff), 0xffff))>;
3869
3870def : Pat<(fabs (v4f32 VECREG:$rA)),
3871 (ANDfabsvec (v4f32 VECREG:$rA),
3872 (v4f32 (ANDBIv16i8 (FSMBIv16i8 0xffff), 0x7f)))>;
3873
3874def : Pat<(fabs R64FP:$rA),
3875 (ANDfabs64 R64FP:$rA, (ANDBIv16i8 (FSMBIv16i8 0xffff), 0x7f))>;
3876
3877def : Pat<(fabs (v2f64 VECREG:$rA)),
3878 (ANDfabsvec (v2f64 VECREG:$rA),
3879 (v2f64 (ANDBIv16i8 (FSMBIv16i8 0xffff), 0x7f)))>;
3880
3881//===----------------------------------------------------------------------===//
3882// Execution, Load NOP (execute NOPs belong in even pipeline, load NOPs belong
3883// in the odd pipeline)
3884//===----------------------------------------------------------------------===//
3885
Scott Michel97872d32008-02-23 18:41:37 +00003886def ENOP : SPUInstr<(outs), (ins), "enop", ExecNOP> {
Scott Michel8b6b4202007-12-04 22:35:58 +00003887 let Pattern = [];
3888
3889 let Inst{0-10} = 0b10000000010;
3890 let Inst{11-17} = 0;
3891 let Inst{18-24} = 0;
3892 let Inst{25-31} = 0;
3893}
3894
Scott Michel97872d32008-02-23 18:41:37 +00003895def LNOP : SPUInstr<(outs), (ins), "lnop", LoadNOP> {
Scott Michel8b6b4202007-12-04 22:35:58 +00003896 let Pattern = [];
3897
3898 let Inst{0-10} = 0b10000000000;
3899 let Inst{11-17} = 0;
3900 let Inst{18-24} = 0;
3901 let Inst{25-31} = 0;
3902}
3903
3904//===----------------------------------------------------------------------===//
3905// Bit conversions (type conversions between vector/packed types)
3906// NOTE: Promotions are handled using the XS* instructions. Truncation
3907// is not handled.
3908//===----------------------------------------------------------------------===//
3909def : Pat<(v16i8 (bitconvert (v8i16 VECREG:$src))), (v16i8 VECREG:$src)>;
3910def : Pat<(v16i8 (bitconvert (v4i32 VECREG:$src))), (v16i8 VECREG:$src)>;
3911def : Pat<(v16i8 (bitconvert (v2i64 VECREG:$src))), (v16i8 VECREG:$src)>;
3912def : Pat<(v16i8 (bitconvert (v4f32 VECREG:$src))), (v16i8 VECREG:$src)>;
3913def : Pat<(v16i8 (bitconvert (v2f64 VECREG:$src))), (v16i8 VECREG:$src)>;
3914
3915def : Pat<(v8i16 (bitconvert (v16i8 VECREG:$src))), (v8i16 VECREG:$src)>;
3916def : Pat<(v8i16 (bitconvert (v4i32 VECREG:$src))), (v8i16 VECREG:$src)>;
3917def : Pat<(v8i16 (bitconvert (v2i64 VECREG:$src))), (v8i16 VECREG:$src)>;
3918def : Pat<(v8i16 (bitconvert (v4f32 VECREG:$src))), (v8i16 VECREG:$src)>;
3919def : Pat<(v8i16 (bitconvert (v2f64 VECREG:$src))), (v8i16 VECREG:$src)>;
3920
3921def : Pat<(v4i32 (bitconvert (v16i8 VECREG:$src))), (v4i32 VECREG:$src)>;
3922def : Pat<(v4i32 (bitconvert (v8i16 VECREG:$src))), (v4i32 VECREG:$src)>;
3923def : Pat<(v4i32 (bitconvert (v2i64 VECREG:$src))), (v4i32 VECREG:$src)>;
3924def : Pat<(v4i32 (bitconvert (v4f32 VECREG:$src))), (v4i32 VECREG:$src)>;
3925def : Pat<(v4i32 (bitconvert (v2f64 VECREG:$src))), (v4i32 VECREG:$src)>;
3926
3927def : Pat<(v2i64 (bitconvert (v16i8 VECREG:$src))), (v2i64 VECREG:$src)>;
3928def : Pat<(v2i64 (bitconvert (v8i16 VECREG:$src))), (v2i64 VECREG:$src)>;
3929def : Pat<(v2i64 (bitconvert (v4i32 VECREG:$src))), (v2i64 VECREG:$src)>;
3930def : Pat<(v2i64 (bitconvert (v4f32 VECREG:$src))), (v2i64 VECREG:$src)>;
3931def : Pat<(v2i64 (bitconvert (v2f64 VECREG:$src))), (v2i64 VECREG:$src)>;
3932
3933def : Pat<(v4f32 (bitconvert (v16i8 VECREG:$src))), (v4f32 VECREG:$src)>;
3934def : Pat<(v4f32 (bitconvert (v8i16 VECREG:$src))), (v4f32 VECREG:$src)>;
3935def : Pat<(v4f32 (bitconvert (v2i64 VECREG:$src))), (v4f32 VECREG:$src)>;
3936def : Pat<(v4f32 (bitconvert (v4i32 VECREG:$src))), (v4f32 VECREG:$src)>;
3937def : Pat<(v4f32 (bitconvert (v2f64 VECREG:$src))), (v4f32 VECREG:$src)>;
3938
3939def : Pat<(v2f64 (bitconvert (v16i8 VECREG:$src))), (v2f64 VECREG:$src)>;
3940def : Pat<(v2f64 (bitconvert (v8i16 VECREG:$src))), (v2f64 VECREG:$src)>;
3941def : Pat<(v2f64 (bitconvert (v4i32 VECREG:$src))), (v2f64 VECREG:$src)>;
3942def : Pat<(v2f64 (bitconvert (v2i64 VECREG:$src))), (v2f64 VECREG:$src)>;
3943def : Pat<(v2f64 (bitconvert (v2f64 VECREG:$src))), (v2f64 VECREG:$src)>;
3944
3945def : Pat<(f32 (bitconvert (i32 R32C:$src))), (f32 R32FP:$src)>;
Scott Michel754d8662007-12-20 00:44:13 +00003946def : Pat<(f64 (bitconvert (i64 R64C:$src))), (f64 R64FP:$src)>;
Scott Michel8b6b4202007-12-04 22:35:58 +00003947
3948//===----------------------------------------------------------------------===//
3949// Instruction patterns:
3950//===----------------------------------------------------------------------===//
3951
3952// General 32-bit constants:
3953def : Pat<(i32 imm:$imm),
3954 (IOHLr32 (ILHUr32 (HI16 imm:$imm)), (LO16 imm:$imm))>;
3955
3956// Single precision float constants:
Nate Begeman78125042008-02-14 18:43:04 +00003957def : Pat<(f32 fpimm:$imm),
Scott Michel8b6b4202007-12-04 22:35:58 +00003958 (IOHLf32 (ILHUf32 (HI16_f32 fpimm:$imm)), (LO16_f32 fpimm:$imm))>;
3959
3960// General constant 32-bit vectors
3961def : Pat<(v4i32 v4i32Imm:$imm),
3962 (IOHLvec (v4i32 (ILHUv4i32 (HI16_vec v4i32Imm:$imm))),
3963 (LO16_vec v4i32Imm:$imm))>;
Scott Michel438be252007-12-17 22:32:34 +00003964
3965// 8-bit constants
3966def : Pat<(i8 imm:$imm),
3967 (ILHr8 imm:$imm)>;
Scott Michel8b6b4202007-12-04 22:35:58 +00003968
3969//===----------------------------------------------------------------------===//
3970// Call instruction patterns:
3971//===----------------------------------------------------------------------===//
3972// Return void
3973def : Pat<(ret),
3974 (RET)>;
3975
3976//===----------------------------------------------------------------------===//
3977// Zero/Any/Sign extensions
3978//===----------------------------------------------------------------------===//
3979
3980// zext 1->32: Zero extend i1 to i32
3981def : Pat<(SPUextract_i1_zext R32C:$rSrc),
3982 (ANDIr32 R32C:$rSrc, 0x1)>;
3983
3984// sext 8->32: Sign extend bytes to words
3985def : Pat<(sext_inreg R32C:$rSrc, i8),
3986 (XSHWr32 (XSBHr32 R32C:$rSrc))>;
3987
Scott Michel438be252007-12-17 22:32:34 +00003988def : Pat<(i32 (sext R8C:$rSrc)),
3989 (XSHWr16 (XSBHr8 R8C:$rSrc))>;
3990
Scott Michel8b6b4202007-12-04 22:35:58 +00003991def : Pat<(SPUextract_i8_sext VECREG:$rSrc),
3992 (XSHWr32 (XSBHr32 (ORi32_v4i32 (v4i32 VECREG:$rSrc),
3993 (v4i32 VECREG:$rSrc))))>;
3994
Scott Michel438be252007-12-17 22:32:34 +00003995// zext 8->16: Zero extend bytes to halfwords
3996def : Pat<(i16 (zext R8C:$rSrc)),
Scott Michel97872d32008-02-23 18:41:37 +00003997 (ANDHIi8i16 R8C:$rSrc, 0xff)>;
Scott Michel438be252007-12-17 22:32:34 +00003998
3999// zext 8->32 from preferred slot in load/store
Scott Michel8b6b4202007-12-04 22:35:58 +00004000def : Pat<(SPUextract_i8_zext VECREG:$rSrc),
4001 (ANDIr32 (ORi32_v4i32 (v4i32 VECREG:$rSrc), (v4i32 VECREG:$rSrc)),
4002 0xff)>;
4003
Scott Michel438be252007-12-17 22:32:34 +00004004// zext 8->32: Zero extend bytes to words
4005def : Pat<(i32 (zext R8C:$rSrc)),
Scott Michel97872d32008-02-23 18:41:37 +00004006 (ANDIi8i32 R8C:$rSrc, 0xff)>;
Scott Michel438be252007-12-17 22:32:34 +00004007
4008// anyext 8->16: Extend 8->16 bits, irrespective of sign
4009def : Pat<(i16 (anyext R8C:$rSrc)),
Scott Michel97872d32008-02-23 18:41:37 +00004010 (ORHIi8i16 R8C:$rSrc, 0)>;
Scott Michel438be252007-12-17 22:32:34 +00004011
4012// anyext 8->32: Extend 8->32 bits, irrespective of sign
4013def : Pat<(i32 (anyext R8C:$rSrc)),
Scott Michel97872d32008-02-23 18:41:37 +00004014 (ORIi8i32 R8C:$rSrc, 0)>;
Scott Michel438be252007-12-17 22:32:34 +00004015
Scott Michel97872d32008-02-23 18:41:37 +00004016// zext 16->32: Zero extend halfwords to words
Scott Michel8b6b4202007-12-04 22:35:58 +00004017def : Pat<(i32 (zext R16C:$rSrc)),
Scott Michel97872d32008-02-23 18:41:37 +00004018 (ANDi16i32 R16C:$rSrc, (ILAr32 0xffff))>;
Scott Michel8b6b4202007-12-04 22:35:58 +00004019
4020def : Pat<(i32 (zext (and R16C:$rSrc, 0xf))),
Scott Michel97872d32008-02-23 18:41:37 +00004021 (ANDIi16i32 R16C:$rSrc, 0xf)>;
Scott Michel8b6b4202007-12-04 22:35:58 +00004022
4023def : Pat<(i32 (zext (and R16C:$rSrc, 0xff))),
Scott Michel97872d32008-02-23 18:41:37 +00004024 (ANDIi16i32 R16C:$rSrc, 0xff)>;
Scott Michel8b6b4202007-12-04 22:35:58 +00004025
4026def : Pat<(i32 (zext (and R16C:$rSrc, 0xfff))),
Scott Michel97872d32008-02-23 18:41:37 +00004027 (ANDIi16i32 R16C:$rSrc, 0xfff)>;
Scott Michel8b6b4202007-12-04 22:35:58 +00004028
4029// anyext 16->32: Extend 16->32 bits, irrespective of sign
4030def : Pat<(i32 (anyext R16C:$rSrc)),
Scott Michel97872d32008-02-23 18:41:37 +00004031 (ORIi16i32 R16C:$rSrc, 0)>;
Scott Michel8b6b4202007-12-04 22:35:58 +00004032
4033//===----------------------------------------------------------------------===//
Scott Michelf9f42e62008-01-29 02:16:57 +00004034// Address generation: SPU, like PPC, has to split addresses into high and
Scott Michel8b6b4202007-12-04 22:35:58 +00004035// low parts in order to load them into a register.
4036//===----------------------------------------------------------------------===//
4037
Scott Michelf9f42e62008-01-29 02:16:57 +00004038def : Pat<(SPUaform tglobaladdr:$in, 0), (ILAlsa tglobaladdr:$in)>;
4039def : Pat<(SPUaform texternalsym:$in, 0), (ILAlsa texternalsym:$in)>;
4040def : Pat<(SPUaform tjumptable:$in, 0), (ILAlsa tjumptable:$in)>;
4041def : Pat<(SPUaform tconstpool:$in, 0), (ILAlsa tconstpool:$in)>;
4042
4043def : Pat<(SPUindirect (SPUhi tglobaladdr:$in, 0),
4044 (SPUlo tglobaladdr:$in, 0)),
Scott Micheldbac4cf2008-01-11 02:53:15 +00004045 (IOHLlo (ILHUhi tglobaladdr:$in), tglobaladdr:$in)>;
Scott Michel394e26d2008-01-17 20:38:41 +00004046
Scott Michelf9f42e62008-01-29 02:16:57 +00004047def : Pat<(SPUindirect (SPUhi texternalsym:$in, 0),
4048 (SPUlo texternalsym:$in, 0)),
4049 (IOHLlo (ILHUhi texternalsym:$in), texternalsym:$in)>;
4050
4051def : Pat<(SPUindirect (SPUhi tjumptable:$in, 0),
4052 (SPUlo tjumptable:$in, 0)),
Scott Micheldbac4cf2008-01-11 02:53:15 +00004053 (IOHLlo (ILHUhi tjumptable:$in), tjumptable:$in)>;
Scott Michel394e26d2008-01-17 20:38:41 +00004054
Scott Michelf9f42e62008-01-29 02:16:57 +00004055def : Pat<(SPUindirect (SPUhi tconstpool:$in, 0),
4056 (SPUlo tconstpool:$in, 0)),
4057 (IOHLlo (ILHUhi tconstpool:$in), tconstpool:$in)>;
4058
4059def : Pat<(add (SPUhi tglobaladdr:$in, 0), (SPUlo tglobaladdr:$in, 0)),
4060 (IOHLlo (ILHUhi tglobaladdr:$in), tglobaladdr:$in)>;
4061
4062def : Pat<(add (SPUhi texternalsym:$in, 0), (SPUlo texternalsym:$in, 0)),
4063 (IOHLlo (ILHUhi texternalsym:$in), texternalsym:$in)>;
4064
4065def : Pat<(add (SPUhi tjumptable:$in, 0), (SPUlo tjumptable:$in, 0)),
4066 (IOHLlo (ILHUhi tjumptable:$in), tjumptable:$in)>;
4067
4068def : Pat<(add (SPUhi tconstpool:$in, 0), (SPUlo tconstpool:$in, 0)),
4069 (IOHLlo (ILHUhi tconstpool:$in), tconstpool:$in)>;
Scott Michel8b6b4202007-12-04 22:35:58 +00004070
Scott Michel8b6b4202007-12-04 22:35:58 +00004071// Instrinsics:
4072include "CellSDKIntrinsics.td"