Chris Lattner | 40ead95 | 2002-12-02 21:24:12 +0000 | [diff] [blame] | 1 | //===-- X86/MachineCodeEmitter.cpp - Convert X86 code to machine code -----===// |
| 2 | // |
| 3 | // This file contains the pass that transforms the X86 machine instructions into |
| 4 | // actual executable machine code. |
| 5 | // |
| 6 | //===----------------------------------------------------------------------===// |
| 7 | |
| 8 | #include "X86TargetMachine.h" |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 9 | #include "X86.h" |
Chris Lattner | 40ead95 | 2002-12-02 21:24:12 +0000 | [diff] [blame] | 10 | #include "llvm/PassManager.h" |
| 11 | #include "llvm/CodeGen/MachineCodeEmitter.h" |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 12 | #include "llvm/CodeGen/MachineFunction.h" |
| 13 | #include "llvm/CodeGen/MachineInstr.h" |
Chris Lattner | dbf30f7 | 2002-12-04 06:45:19 +0000 | [diff] [blame] | 14 | #include "llvm/Value.h" |
Chris Lattner | 40ead95 | 2002-12-02 21:24:12 +0000 | [diff] [blame] | 15 | |
| 16 | namespace { |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 17 | class Emitter : public FunctionPass { |
Chris Lattner | 8f04b09 | 2002-12-02 21:56:18 +0000 | [diff] [blame] | 18 | X86TargetMachine &TM; |
| 19 | const X86InstrInfo ⅈ |
| 20 | MachineCodeEmitter &MCE; |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 21 | public: |
Chris Lattner | 40ead95 | 2002-12-02 21:24:12 +0000 | [diff] [blame] | 22 | |
Chris Lattner | 8f04b09 | 2002-12-02 21:56:18 +0000 | [diff] [blame] | 23 | Emitter(X86TargetMachine &tm, MachineCodeEmitter &mce) |
| 24 | : TM(tm), II(TM.getInstrInfo()), MCE(mce) {} |
Chris Lattner | 40ead95 | 2002-12-02 21:24:12 +0000 | [diff] [blame] | 25 | |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 26 | bool runOnFunction(Function &F); |
| 27 | |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 28 | private: |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 29 | void emitBasicBlock(MachineBasicBlock &MBB); |
| 30 | void emitInstruction(MachineInstr &MI); |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 31 | |
| 32 | void emitRegModRMByte(unsigned ModRMReg, unsigned RegOpcodeField); |
| 33 | void emitSIBByte(unsigned SS, unsigned Index, unsigned Base); |
| 34 | void emitConstant(unsigned Val, unsigned Size); |
| 35 | |
| 36 | void emitMemModRMByte(const MachineInstr &MI, |
| 37 | unsigned Op, unsigned RegOpcodeField); |
| 38 | |
Chris Lattner | 40ead95 | 2002-12-02 21:24:12 +0000 | [diff] [blame] | 39 | }; |
| 40 | } |
| 41 | |
| 42 | |
| 43 | /// addPassesToEmitMachineCode - Add passes to the specified pass manager to get |
| 44 | /// machine code emitted. This uses a MAchineCodeEmitter object to handle |
| 45 | /// actually outputting the machine code and resolving things like the address |
| 46 | /// of functions. This method should returns true if machine code emission is |
| 47 | /// not supported. |
| 48 | /// |
| 49 | bool X86TargetMachine::addPassesToEmitMachineCode(PassManager &PM, |
| 50 | MachineCodeEmitter &MCE) { |
| 51 | PM.add(new Emitter(*this, MCE)); |
| 52 | return false; |
| 53 | } |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 54 | |
| 55 | bool Emitter::runOnFunction(Function &F) { |
| 56 | MachineFunction &MF = MachineFunction::get(&F); |
| 57 | |
| 58 | MCE.startFunction(MF); |
| 59 | for (MachineFunction::iterator I = MF.begin(), E = MF.end(); I != E; ++I) |
| 60 | emitBasicBlock(*I); |
| 61 | MCE.finishFunction(MF); |
| 62 | return false; |
| 63 | } |
| 64 | |
| 65 | void Emitter::emitBasicBlock(MachineBasicBlock &MBB) { |
| 66 | MCE.startBasicBlock(MBB); |
| 67 | for (MachineBasicBlock::iterator I = MBB.begin(), E = MBB.end(); I != E; ++I) |
| 68 | emitInstruction(**I); |
| 69 | } |
| 70 | |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 71 | |
| 72 | namespace N86 { // Native X86 Register numbers... |
| 73 | enum { |
| 74 | EAX = 0, ECX = 1, EDX = 2, EBX = 3, ESP = 4, EBP = 5, ESI = 6, EDI = 7 |
| 75 | }; |
| 76 | } |
| 77 | |
| 78 | |
| 79 | // getX86RegNum - This function maps LLVM register identifiers to their X86 |
| 80 | // specific numbering, which is used in various places encoding instructions. |
| 81 | // |
| 82 | static unsigned getX86RegNum(unsigned RegNo) { |
| 83 | switch(RegNo) { |
| 84 | case X86::EAX: case X86::AX: case X86::AL: return N86::EAX; |
| 85 | case X86::ECX: case X86::CX: case X86::CL: return N86::ECX; |
| 86 | case X86::EDX: case X86::DX: case X86::DL: return N86::EDX; |
| 87 | case X86::EBX: case X86::BX: case X86::BL: return N86::EBX; |
| 88 | case X86::ESP: case X86::SP: case X86::AH: return N86::ESP; |
| 89 | case X86::EBP: case X86::BP: case X86::CH: return N86::EBP; |
| 90 | case X86::ESI: case X86::SI: case X86::DH: return N86::ESI; |
| 91 | case X86::EDI: case X86::DI: case X86::BH: return N86::EDI; |
| 92 | default: |
| 93 | assert(RegNo >= MRegisterInfo::FirstVirtualRegister && |
| 94 | "Unknown physical register!"); |
| 95 | assert(0 && "Register allocator hasn't allocated reg correctly yet!"); |
| 96 | return 0; |
| 97 | } |
| 98 | } |
| 99 | |
| 100 | inline static unsigned char ModRMByte(unsigned Mod, unsigned RegOpcode, |
| 101 | unsigned RM) { |
| 102 | assert(Mod < 4 && RegOpcode < 8 && RM < 8 && "ModRM Fields out of range!"); |
| 103 | return RM | (RegOpcode << 3) | (Mod << 6); |
| 104 | } |
| 105 | |
| 106 | void Emitter::emitRegModRMByte(unsigned ModRMReg, unsigned RegOpcodeFld){ |
| 107 | MCE.emitByte(ModRMByte(3, RegOpcodeFld, getX86RegNum(ModRMReg))); |
| 108 | } |
| 109 | |
| 110 | void Emitter::emitSIBByte(unsigned SS, unsigned Index, unsigned Base) { |
| 111 | // SIB byte is in the same format as the ModRMByte... |
| 112 | MCE.emitByte(ModRMByte(SS, Index, Base)); |
| 113 | } |
| 114 | |
| 115 | void Emitter::emitConstant(unsigned Val, unsigned Size) { |
| 116 | // Output the constant in little endian byte order... |
| 117 | for (unsigned i = 0; i != Size; ++i) { |
| 118 | MCE.emitByte(Val & 255); |
| 119 | Val >>= 8; |
| 120 | } |
| 121 | } |
| 122 | |
| 123 | static bool isDisp8(int Value) { |
| 124 | return Value == (signed char)Value; |
| 125 | } |
| 126 | |
| 127 | void Emitter::emitMemModRMByte(const MachineInstr &MI, |
| 128 | unsigned Op, unsigned RegOpcodeField) { |
| 129 | const MachineOperand &BaseReg = MI.getOperand(Op); |
| 130 | const MachineOperand &Scale = MI.getOperand(Op+1); |
| 131 | const MachineOperand &IndexReg = MI.getOperand(Op+2); |
| 132 | const MachineOperand &Disp = MI.getOperand(Op+3); |
| 133 | |
| 134 | // Is a SIB byte needed? |
| 135 | if (IndexReg.getReg() == 0 && BaseReg.getReg() != X86::ESP) { |
| 136 | if (BaseReg.getReg() == 0) { // Just a displacement? |
| 137 | // Emit special case [disp32] encoding |
| 138 | MCE.emitByte(ModRMByte(0, RegOpcodeField, 5)); |
| 139 | emitConstant(Disp.getImmedValue(), 4); |
| 140 | } else { |
| 141 | unsigned BaseRegNo = getX86RegNum(BaseReg.getReg()); |
| 142 | if (Disp.getImmedValue() == 0 && BaseRegNo != N86::EBP) { |
| 143 | // Emit simple indirect register encoding... [EAX] f.e. |
| 144 | MCE.emitByte(ModRMByte(0, RegOpcodeField, BaseRegNo)); |
| 145 | } else if (isDisp8(Disp.getImmedValue())) { |
| 146 | // Emit the disp8 encoding... [REG+disp8] |
| 147 | MCE.emitByte(ModRMByte(1, RegOpcodeField, BaseRegNo)); |
| 148 | emitConstant(Disp.getImmedValue(), 1); |
| 149 | } else { |
| 150 | // Emit the most general non-SIB encoding: [REG+disp32] |
| 151 | MCE.emitByte(ModRMByte(1, RegOpcodeField, BaseRegNo)); |
| 152 | emitConstant(Disp.getImmedValue(), 4); |
| 153 | } |
| 154 | } |
| 155 | |
| 156 | } else { // We need a SIB byte, so start by outputting the ModR/M byte first |
| 157 | assert(IndexReg.getReg() != X86::ESP && "Cannot use ESP as index reg!"); |
| 158 | |
| 159 | bool ForceDisp32 = false; |
| 160 | if (BaseReg.getReg() == 0) { |
| 161 | // If there is no base register, we emit the special case SIB byte with |
| 162 | // MOD=0, BASE=5, to JUST get the index, scale, and displacement. |
| 163 | MCE.emitByte(ModRMByte(0, RegOpcodeField, 4)); |
| 164 | ForceDisp32 = true; |
| 165 | } else if (Disp.getImmedValue() == 0) { |
| 166 | // Emit no displacement ModR/M byte |
| 167 | MCE.emitByte(ModRMByte(0, RegOpcodeField, 4)); |
| 168 | } else if (isDisp8(Disp.getImmedValue())) { |
| 169 | // Emit the disp8 encoding... |
| 170 | MCE.emitByte(ModRMByte(1, RegOpcodeField, 4)); |
| 171 | } else { |
| 172 | // Emit the normal disp32 encoding... |
| 173 | MCE.emitByte(ModRMByte(2, RegOpcodeField, 4)); |
| 174 | } |
| 175 | |
| 176 | // Calculate what the SS field value should be... |
| 177 | static const unsigned SSTable[] = { ~0, 0, 1, ~0, 2, ~0, ~0, ~0, 3 }; |
| 178 | unsigned SS = SSTable[Scale.getImmedValue()]; |
| 179 | |
| 180 | if (BaseReg.getReg() == 0) { |
| 181 | // Handle the SIB byte for the case where there is no base. The |
| 182 | // displacement has already been output. |
| 183 | assert(IndexReg.getReg() && "Index register must be specified!"); |
| 184 | emitSIBByte(SS, getX86RegNum(IndexReg.getReg()), 5); |
| 185 | } else { |
| 186 | unsigned BaseRegNo = getX86RegNum(BaseReg.getReg()); |
| 187 | unsigned IndexRegNo = getX86RegNum(IndexReg.getReg()); |
| 188 | emitSIBByte(SS, IndexRegNo, BaseRegNo); |
| 189 | } |
| 190 | |
| 191 | // Do we need to output a displacement? |
| 192 | if (Disp.getImmedValue() != 0 || ForceDisp32) { |
| 193 | if (!ForceDisp32 && isDisp8(Disp.getImmedValue())) |
| 194 | emitConstant(Disp.getImmedValue(), 1); |
| 195 | else |
| 196 | emitConstant(Disp.getImmedValue(), 4); |
| 197 | } |
| 198 | } |
| 199 | } |
| 200 | |
| 201 | static bool isImmediate(const MachineOperand &MO) { |
| 202 | return MO.getType() == MachineOperand::MO_SignExtendedImmed || |
| 203 | MO.getType() == MachineOperand::MO_UnextendedImmed; |
| 204 | } |
| 205 | |
Misha Brukman | 5000e43 | 2002-12-13 02:13:15 +0000 | [diff] [blame] | 206 | unsigned sizeOfPtr (const MachineInstrDescriptor &Desc) { |
| 207 | switch (Desc.TSFlags & X86II::MemArgMask) { |
| 208 | case X86II::MemArg8: return 1; |
| 209 | case X86II::MemArg16: return 2; |
| 210 | case X86II::MemArg32: return 4; |
| 211 | case X86II::MemArg64: return 8; |
| 212 | case X86II::MemArg80: return 10; |
| 213 | case X86II::MemArg128: return 16; |
Chris Lattner | a6a382c | 2002-12-13 03:50:13 +0000 | [diff] [blame^] | 214 | default: assert(0 && "Memory size not set!"); |
Misha Brukman | 5000e43 | 2002-12-13 02:13:15 +0000 | [diff] [blame] | 215 | } |
| 216 | } |
| 217 | |
| 218 | |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 219 | void Emitter::emitInstruction(MachineInstr &MI) { |
| 220 | unsigned Opcode = MI.getOpcode(); |
Chris Lattner | 8f04b09 | 2002-12-02 21:56:18 +0000 | [diff] [blame] | 221 | const MachineInstrDescriptor &Desc = II.get(Opcode); |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 222 | |
| 223 | // Emit instruction prefixes if neccesary |
| 224 | if (Desc.TSFlags & X86II::OpSize) MCE.emitByte(0x66);// Operand size... |
Chris Lattner | 8f04b09 | 2002-12-02 21:56:18 +0000 | [diff] [blame] | 225 | if (Desc.TSFlags & X86II::TB) MCE.emitByte(0x0F);// Two-byte opcode prefix |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 226 | |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 227 | unsigned char BaseOpcode = II.getBaseOpcodeFor(Opcode); |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 228 | switch (Desc.TSFlags & X86II::FormMask) { |
| 229 | case X86II::RawFrm: |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 230 | MCE.emitByte(BaseOpcode); |
Chris Lattner | 8f04b09 | 2002-12-02 21:56:18 +0000 | [diff] [blame] | 231 | |
| 232 | if (MI.getNumOperands() == 1) { |
| 233 | assert(MI.getOperand(0).getType() == MachineOperand::MO_PCRelativeDisp); |
| 234 | MCE.emitPCRelativeDisp(MI.getOperand(0).getVRegValue()); |
| 235 | } |
Chris Lattner | 8f04b09 | 2002-12-02 21:56:18 +0000 | [diff] [blame] | 236 | break; |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 237 | case X86II::AddRegFrm: |
| 238 | MCE.emitByte(BaseOpcode + getX86RegNum(MI.getOperand(0).getReg())); |
| 239 | if (MI.getNumOperands() == 2) { |
Misha Brukman | 5000e43 | 2002-12-13 02:13:15 +0000 | [diff] [blame] | 240 | unsigned Size = sizeOfPtr(Desc); |
Chris Lattner | ac573f6 | 2002-12-04 17:32:52 +0000 | [diff] [blame] | 241 | if (Value *V = MI.getOperand(1).getVRegValueOrNull()) { |
Chris Lattner | dbf30f7 | 2002-12-04 06:45:19 +0000 | [diff] [blame] | 242 | assert(Size == 4 && "Don't know how to emit non-pointer values!"); |
| 243 | MCE.emitGlobalAddress(cast<GlobalValue>(V)); |
| 244 | } else { |
| 245 | emitConstant(MI.getOperand(1).getImmedValue(), Size); |
| 246 | } |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 247 | } |
| 248 | break; |
| 249 | case X86II::MRMDestReg: |
| 250 | MCE.emitByte(BaseOpcode); |
| 251 | emitRegModRMByte(MI.getOperand(0).getReg(), |
| 252 | getX86RegNum(MI.getOperand(MI.getNumOperands()-1).getReg())); |
| 253 | break; |
| 254 | case X86II::MRMDestMem: |
| 255 | MCE.emitByte(BaseOpcode); |
| 256 | emitMemModRMByte(MI, 0, getX86RegNum(MI.getOperand(4).getReg())); |
| 257 | break; |
| 258 | case X86II::MRMSrcReg: |
| 259 | MCE.emitByte(BaseOpcode); |
| 260 | emitRegModRMByte(MI.getOperand(MI.getNumOperands()-1).getReg(), |
| 261 | getX86RegNum(MI.getOperand(0).getReg())); |
| 262 | break; |
| 263 | case X86II::MRMSrcMem: |
| 264 | MCE.emitByte(BaseOpcode); |
| 265 | emitMemModRMByte(MI, MI.getNumOperands()-4, |
| 266 | getX86RegNum(MI.getOperand(0).getReg())); |
| 267 | break; |
| 268 | |
| 269 | case X86II::MRMS0r: case X86II::MRMS1r: |
| 270 | case X86II::MRMS2r: case X86II::MRMS3r: |
| 271 | case X86II::MRMS4r: case X86II::MRMS5r: |
| 272 | case X86II::MRMS6r: case X86II::MRMS7r: |
| 273 | MCE.emitByte(BaseOpcode); |
| 274 | emitRegModRMByte(MI.getOperand(0).getReg(), |
| 275 | (Desc.TSFlags & X86II::FormMask)-X86II::MRMS0r); |
| 276 | |
| 277 | if (isImmediate(MI.getOperand(MI.getNumOperands()-1))) { |
Misha Brukman | 5000e43 | 2002-12-13 02:13:15 +0000 | [diff] [blame] | 278 | unsigned Size = sizeOfPtr(Desc); |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 279 | emitConstant(MI.getOperand(MI.getNumOperands()-1).getImmedValue(), Size); |
| 280 | } |
| 281 | break; |
| 282 | |
| 283 | |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 284 | } |
| 285 | } |