Bill Wendling | bc9bffa | 2007-03-07 05:43:18 +0000 | [diff] [blame] | 1 | //====- X86InstrMMX.td - Describe the X86 Instruction Set --*- tablegen -*-===// |
Evan Cheng | ffcb95b | 2006-02-21 19:13:53 +0000 | [diff] [blame] | 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file was developed by the Evan Cheng and is distributed under |
| 6 | // the University of Illinois Open Source License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // This file describes the X86 MMX instruction set, defining the instructions, |
| 11 | // and properties of the instructions which are needed for code generation, |
| 12 | // machine code emission, and analysis. |
| 13 | // |
| 14 | //===----------------------------------------------------------------------===// |
| 15 | |
Bill Wendling | a31bd27 | 2007-03-06 18:53:42 +0000 | [diff] [blame] | 16 | //===----------------------------------------------------------------------===// |
Evan Cheng | fcf5e21 | 2006-04-11 06:57:30 +0000 | [diff] [blame] | 17 | // Instruction templates |
Bill Wendling | a31bd27 | 2007-03-06 18:53:42 +0000 | [diff] [blame] | 18 | //===----------------------------------------------------------------------===// |
| 19 | |
Evan Cheng | d2a6d54 | 2006-04-12 23:42:44 +0000 | [diff] [blame] | 20 | // MMXI - MMX instructions with TB prefix. |
| 21 | // MMX2I - MMX / SSE2 instructions with TB and OpSize prefixes. |
| 22 | // MMXIi8 - MMX instructions with ImmT == Imm8 and TB prefix. |
| 23 | class MMXI<bits<8> o, Format F, dag ops, string asm, list<dag> pattern> |
| 24 | : I<o, F, ops, asm, pattern>, TB, Requires<[HasMMX]>; |
| 25 | class MMX2I<bits<8> o, Format F, dag ops, string asm, list<dag> pattern> |
| 26 | : I<o, F, ops, asm, pattern>, TB, OpSize, Requires<[HasSSE2]>; |
Evan Cheng | fcf5e21 | 2006-04-11 06:57:30 +0000 | [diff] [blame] | 27 | class MMXIi8<bits<8> o, Format F, dag ops, string asm, list<dag> pattern> |
Evan Cheng | 1693e48 | 2006-07-19 00:27:29 +0000 | [diff] [blame] | 28 | : Ii8<o, F, ops, asm, pattern>, TB, Requires<[HasMMX]>; |
Evan Cheng | fcf5e21 | 2006-04-11 06:57:30 +0000 | [diff] [blame] | 29 | |
Evan Cheng | ba753c6 | 2006-03-20 06:04:52 +0000 | [diff] [blame] | 30 | // Some 'special' instructions |
| 31 | def IMPLICIT_DEF_VR64 : I<0, Pseudo, (ops VR64:$dst), |
| 32 | "#IMPLICIT_DEF $dst", |
| 33 | [(set VR64:$dst, (v8i8 (undef)))]>, |
| 34 | Requires<[HasMMX]>; |
| 35 | |
Bill Wendling | bc9bffa | 2007-03-07 05:43:18 +0000 | [diff] [blame] | 36 | // 64-bit vector undef's. |
| 37 | def : Pat<(v8i8 (undef)), (IMPLICIT_DEF_VR64)>; |
| 38 | def : Pat<(v4i16 (undef)), (IMPLICIT_DEF_VR64)>; |
| 39 | def : Pat<(v2i32 (undef)), (IMPLICIT_DEF_VR64)>; |
Evan Cheng | ba753c6 | 2006-03-20 06:04:52 +0000 | [diff] [blame] | 40 | |
Bill Wendling | a31bd27 | 2007-03-06 18:53:42 +0000 | [diff] [blame] | 41 | //===----------------------------------------------------------------------===// |
| 42 | // MMX Pattern Fragments |
| 43 | //===----------------------------------------------------------------------===// |
| 44 | |
| 45 | def loadv2i32 : PatFrag<(ops node:$ptr), (v2i32 (load node:$ptr))>; |
| 46 | |
| 47 | //===----------------------------------------------------------------------===// |
Bill Wendling | 2f88dcd | 2007-03-08 22:09:11 +0000 | [diff] [blame] | 48 | // MMX Multiclasses |
| 49 | //===----------------------------------------------------------------------===// |
| 50 | |
| 51 | let isTwoAddress = 1 in { |
| 52 | // MMXI_binop_rm - Simple MMX binary operator. |
| 53 | multiclass MMXI_binop_rm<bits<8> opc, string OpcodeStr, SDNode OpNode, |
| 54 | ValueType OpVT, bit Commutable = 0> { |
| 55 | def rr : MMXI<opc, MRMSrcReg, (ops VR64:$dst, VR64:$src1, VR64:$src2), |
| 56 | !strconcat(OpcodeStr, " {$src2, $dst|$dst, $src2}"), |
| 57 | [(set VR64:$dst, (OpVT (OpNode VR64:$src1, VR64:$src2)))]> { |
| 58 | let isCommutable = Commutable; |
| 59 | } |
| 60 | def rm : MMXI<opc, MRMSrcMem, (ops VR64:$dst, VR64:$src1, i64mem:$src2), |
| 61 | !strconcat(OpcodeStr, " {$src2, $dst|$dst, $src2}"), |
| 62 | [(set VR64:$dst, (OpVT (OpNode VR64:$src1, |
| 63 | (bitconvert |
| 64 | (loadv2i32 addr:$src2)))))]>; |
| 65 | } |
| 66 | } |
| 67 | |
| 68 | let isTwoAddress = 1 in { |
| 69 | multiclass MMXI_binop_rm_int<bits<8> opc, string OpcodeStr, Intrinsic IntId, |
| 70 | bit Commutable = 0> { |
| 71 | def rr : MMXI<opc, MRMSrcReg, (ops VR64:$dst, VR64:$src1, VR64:$src2), |
| 72 | !strconcat(OpcodeStr, " {$src2, $dst|$dst, $src2}"), |
| 73 | [(set VR64:$dst, (IntId VR64:$src1, VR64:$src2))]> { |
| 74 | let isCommutable = Commutable; |
| 75 | } |
| 76 | def rm : MMXI<opc, MRMSrcMem, (ops VR64:$dst, VR64:$src1, i64mem:$src2), |
| 77 | !strconcat(OpcodeStr, " {$src2, $dst|$dst, $src2}"), |
| 78 | [(set VR64:$dst, (IntId VR64:$src1, |
| 79 | (bitconvert (loadv2i32 addr:$src2))))]>; |
| 80 | } |
| 81 | } |
| 82 | |
| 83 | //===----------------------------------------------------------------------===// |
Bill Wendling | a31bd27 | 2007-03-06 18:53:42 +0000 | [diff] [blame] | 84 | // MMX EMMS Instruction |
| 85 | //===----------------------------------------------------------------------===// |
| 86 | |
| 87 | def EMMS : MMXI<0x77, RawFrm, (ops), "emms", [(int_x86_mmx_emms)]>; |
| 88 | |
| 89 | //===----------------------------------------------------------------------===// |
| 90 | // MMX Scalar Instructions |
| 91 | //===----------------------------------------------------------------------===// |
Bill Wendling | 229baff | 2007-03-05 23:09:45 +0000 | [diff] [blame] | 92 | |
Bill Wendling | 2f88dcd | 2007-03-08 22:09:11 +0000 | [diff] [blame] | 93 | // Arithmetic Instructions |
| 94 | defm MMX_PADDB : MMXI_binop_rm<0xFC, "paddb", add, v8i8, 1>; |
| 95 | defm MMX_PADDW : MMXI_binop_rm<0xFD, "paddw", add, v4i16, 1>; |
| 96 | defm MMX_PADDD : MMXI_binop_rm<0xFE, "paddd", add, v2i32, 1>; |
| 97 | |
| 98 | defm MMX_PADDSB : MMXI_binop_rm_int<0xEC, "paddsb" , int_x86_mmx_padds_b, 1>; |
| 99 | defm MMX_PADDSW : MMXI_binop_rm_int<0xED, "paddsw" , int_x86_mmx_padds_w, 1>; |
| 100 | |
| 101 | defm MMX_PADDUSB : MMXI_binop_rm_int<0xDC, "paddusb", int_x86_mmx_paddus_b, 1>; |
| 102 | defm MMX_PADDUSW : MMXI_binop_rm_int<0xDD, "paddusw", int_x86_mmx_paddus_w, 1>; |
| 103 | |
Bill Wendling | c1fb047 | 2007-03-10 09:57:05 +0000 | [diff] [blame] | 104 | defm MMX_PSUBB : MMXI_binop_rm<0xF8, "psubb", sub, v8i8>; |
| 105 | defm MMX_PSUBW : MMXI_binop_rm<0xF9, "psubw", sub, v4i16>; |
| 106 | defm MMX_PSUBD : MMXI_binop_rm<0xFA, "psubd", sub, v2i32>; |
| 107 | |
| 108 | defm MMX_PSUBSB : MMXI_binop_rm_int<0xE8, "psubsb" , int_x86_mmx_psubs_b>; |
| 109 | defm MMX_PSUBSW : MMXI_binop_rm_int<0xE9, "psubsw" , int_x86_mmx_psubs_w>; |
| 110 | |
| 111 | defm MMX_PSUBUSB : MMXI_binop_rm_int<0xD8, "psubusb", int_x86_mmx_psubus_b>; |
| 112 | defm MMX_PSUBUSW : MMXI_binop_rm_int<0xD9, "psubusw", int_x86_mmx_psubus_w>; |
| 113 | |
Bill Wendling | 74027e9 | 2007-03-15 21:24:36 +0000 | [diff] [blame^] | 114 | defm MMX_PMULLW : MMXI_binop_rm<0xD5, "pmullw", mul, v4i16, 1>; |
| 115 | |
| 116 | defm MMX_PMULHW : MMXI_binop_rm_int<0xE5, "pmulhw" , int_x86_mmx_pmulh_w , 1>; |
| 117 | defm MMX_PMADDWD : MMXI_binop_rm_int<0xF5, "pmaddwd", int_x86_mmx_pmadd_wd, 1>; |
| 118 | |
Evan Cheng | ffcb95b | 2006-02-21 19:13:53 +0000 | [diff] [blame] | 119 | // Move Instructions |
Bill Wendling | a31bd27 | 2007-03-06 18:53:42 +0000 | [diff] [blame] | 120 | def MOVD64rr : MMXI<0x6E, MRMSrcReg, (ops VR64:$dst, GR32:$src), |
| 121 | "movd {$src, $dst|$dst, $src}", []>; |
| 122 | def MOVD64rm : MMXI<0x6E, MRMSrcMem, (ops VR64:$dst, i32mem:$src), |
| 123 | "movd {$src, $dst|$dst, $src}", []>; |
| 124 | def MOVD64mr : MMXI<0x7E, MRMDestMem, (ops i32mem:$dst, VR64:$src), |
| 125 | "movd {$src, $dst|$dst, $src}", []>; |
Evan Cheng | ffcb95b | 2006-02-21 19:13:53 +0000 | [diff] [blame] | 126 | |
Bill Wendling | a31bd27 | 2007-03-06 18:53:42 +0000 | [diff] [blame] | 127 | def MOVQ64rr : MMXI<0x6F, MRMSrcReg, (ops VR64:$dst, VR64:$src), |
| 128 | "movq {$src, $dst|$dst, $src}", []>; |
| 129 | def MOVQ64rm : MMXI<0x6F, MRMSrcMem, (ops VR64:$dst, i64mem:$src), |
| 130 | "movq {$src, $dst|$dst, $src}", |
| 131 | [(set VR64:$dst, (loadv2i32 addr:$src))]>; |
| 132 | def MOVQ64mr : MMXI<0x7F, MRMDestMem, (ops i64mem:$dst, VR64:$src), |
| 133 | "movq {$src, $dst|$dst, $src}", |
| 134 | [(store (v2i32 VR64:$src), addr:$dst)]>; |
Evan Cheng | 3246e06 | 2006-03-25 01:31:59 +0000 | [diff] [blame] | 135 | |
| 136 | // Conversion instructions |
Evan Cheng | d2a6d54 | 2006-04-12 23:42:44 +0000 | [diff] [blame] | 137 | def CVTPI2PSrr : MMXI<0x2A, MRMSrcReg, (ops VR128:$dst, VR64:$src), |
| 138 | "cvtpi2ps {$src, $dst|$dst, $src}", []>; |
| 139 | def CVTPI2PSrm : MMXI<0x2A, MRMSrcMem, (ops VR128:$dst, i64mem:$src), |
| 140 | "cvtpi2ps {$src, $dst|$dst, $src}", []>; |
| 141 | def CVTPI2PDrr : MMX2I<0x2A, MRMSrcReg, (ops VR128:$dst, VR64:$src), |
| 142 | "cvtpi2pd {$src, $dst|$dst, $src}", []>; |
| 143 | def CVTPI2PDrm : MMX2I<0x2A, MRMSrcMem, (ops VR128:$dst, i64mem:$src), |
| 144 | "cvtpi2pd {$src, $dst|$dst, $src}", []>; |
Evan Cheng | 3246e06 | 2006-03-25 01:31:59 +0000 | [diff] [blame] | 145 | def CVTTPS2PIrr: I<0x2C, MRMSrcReg, (ops VR64:$dst, VR128:$src), |
| 146 | "cvttps2pi {$src, $dst|$dst, $src}", []>, TB, |
Bill Wendling | 74027e9 | 2007-03-15 21:24:36 +0000 | [diff] [blame^] | 147 | Requires<[HasMMX]>; |
Evan Cheng | cc4f047 | 2006-03-25 06:00:03 +0000 | [diff] [blame] | 148 | def CVTTPS2PIrm: I<0x2C, MRMSrcMem, (ops VR64:$dst, f64mem:$src), |
Evan Cheng | 3246e06 | 2006-03-25 01:31:59 +0000 | [diff] [blame] | 149 | "cvttps2pi {$src, $dst|$dst, $src}", []>, TB, |
| 150 | Requires<[HasMMX]>; |
Evan Cheng | d2a6d54 | 2006-04-12 23:42:44 +0000 | [diff] [blame] | 151 | def CVTPS2PIrr : MMXI<0x2D, MRMSrcReg, (ops VR64:$dst, VR128:$src), |
| 152 | "cvtps2pi {$src, $dst|$dst, $src}", []>; |
| 153 | def CVTPS2PIrm : MMXI<0x2D, MRMSrcMem, (ops VR64:$dst, f64mem:$src), |
| 154 | "cvtps2pi {$src, $dst|$dst, $src}", []>; |
| 155 | def CVTPD2PIrr : MMX2I<0x2D, MRMSrcReg, (ops VR64:$dst, VR128:$src), |
| 156 | "cvtpd2pi {$src, $dst|$dst, $src}", []>; |
| 157 | def CVTPD2PIrm : MMX2I<0x2D, MRMSrcMem, (ops VR64:$dst, f128mem:$src), |
| 158 | "cvtpd2pi {$src, $dst|$dst, $src}", []>; |
Evan Cheng | fcf5e21 | 2006-04-11 06:57:30 +0000 | [diff] [blame] | 159 | |
| 160 | // Shuffle and unpack instructions |
| 161 | def PSHUFWri : MMXIi8<0x70, MRMSrcReg, |
| 162 | (ops VR64:$dst, VR64:$src1, i8imm:$src2), |
| 163 | "pshufw {$src2, $src1, $dst|$dst, $src1, $src2}", []>; |
| 164 | def PSHUFWmi : MMXIi8<0x70, MRMSrcMem, |
| 165 | (ops VR64:$dst, i64mem:$src1, i8imm:$src2), |
| 166 | "pshufw {$src2, $src1, $dst|$dst, $src1, $src2}", []>; |
| 167 | |
| 168 | // Misc. |
| 169 | def MOVNTQ : I<0xE7, MRMDestMem, (ops i64mem:$dst, VR64:$src), |
| 170 | "movntq {$src, $dst|$dst, $src}", []>, TB, |
| 171 | Requires<[HasMMX]>; |
| 172 | |
| 173 | def MASKMOVQ : I<0xF7, MRMDestMem, (ops VR64:$src, VR64:$mask), |
| 174 | "maskmovq {$mask, $src|$src, $mask}", []>, TB, |
| 175 | Requires<[HasMMX]>; |
Bill Wendling | a31bd27 | 2007-03-06 18:53:42 +0000 | [diff] [blame] | 176 | |
| 177 | //===----------------------------------------------------------------------===// |
| 178 | // Non-Instruction Patterns |
| 179 | //===----------------------------------------------------------------------===// |
| 180 | |
| 181 | // Store 64-bit integer vector values. |
| 182 | def : Pat<(store (v8i8 VR64:$src), addr:$dst), |
| 183 | (MOVQ64mr addr:$dst, VR64:$src)>; |
| 184 | def : Pat<(store (v4i16 VR64:$src), addr:$dst), |
| 185 | (MOVQ64mr addr:$dst, VR64:$src)>; |
Bill Wendling | bc9bffa | 2007-03-07 05:43:18 +0000 | [diff] [blame] | 186 | |
| 187 | // Bit convert. |
| 188 | def : Pat<(v8i8 (bitconvert (v2i32 VR64:$src))), (v8i8 VR64:$src)>; |
| 189 | def : Pat<(v8i8 (bitconvert (v4i16 VR64:$src))), (v8i8 VR64:$src)>; |
| 190 | def : Pat<(v4i16 (bitconvert (v2i32 VR64:$src))), (v4i16 VR64:$src)>; |
| 191 | def : Pat<(v4i16 (bitconvert (v8i8 VR64:$src))), (v4i16 VR64:$src)>; |
| 192 | def : Pat<(v2i32 (bitconvert (v4i16 VR64:$src))), (v2i32 VR64:$src)>; |
| 193 | def : Pat<(v2i32 (bitconvert (v8i8 VR64:$src))), (v2i32 VR64:$src)>; |