Chris Lattner | 40ead95 | 2002-12-02 21:24:12 +0000 | [diff] [blame] | 1 | //===-- X86/MachineCodeEmitter.cpp - Convert X86 code to machine code -----===// |
| 2 | // |
| 3 | // This file contains the pass that transforms the X86 machine instructions into |
| 4 | // actual executable machine code. |
| 5 | // |
| 6 | //===----------------------------------------------------------------------===// |
| 7 | |
| 8 | #include "X86TargetMachine.h" |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 9 | #include "X86.h" |
Chris Lattner | 40ead95 | 2002-12-02 21:24:12 +0000 | [diff] [blame] | 10 | #include "llvm/PassManager.h" |
| 11 | #include "llvm/CodeGen/MachineCodeEmitter.h" |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 12 | #include "llvm/CodeGen/MachineFunction.h" |
| 13 | #include "llvm/CodeGen/MachineInstr.h" |
Chris Lattner | dbf30f7 | 2002-12-04 06:45:19 +0000 | [diff] [blame] | 14 | #include "llvm/Value.h" |
Chris Lattner | 40ead95 | 2002-12-02 21:24:12 +0000 | [diff] [blame] | 15 | |
| 16 | namespace { |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 17 | class Emitter : public FunctionPass { |
Chris Lattner | 8f04b09 | 2002-12-02 21:56:18 +0000 | [diff] [blame] | 18 | X86TargetMachine &TM; |
| 19 | const X86InstrInfo ⅈ |
| 20 | MachineCodeEmitter &MCE; |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 21 | public: |
Chris Lattner | 40ead95 | 2002-12-02 21:24:12 +0000 | [diff] [blame] | 22 | |
Chris Lattner | 8f04b09 | 2002-12-02 21:56:18 +0000 | [diff] [blame] | 23 | Emitter(X86TargetMachine &tm, MachineCodeEmitter &mce) |
| 24 | : TM(tm), II(TM.getInstrInfo()), MCE(mce) {} |
Chris Lattner | 40ead95 | 2002-12-02 21:24:12 +0000 | [diff] [blame] | 25 | |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 26 | bool runOnFunction(Function &F); |
| 27 | |
Chris Lattner | f0eb7be | 2002-12-15 21:13:40 +0000 | [diff] [blame^] | 28 | virtual const char *getPassName() const { |
| 29 | return "X86 Machine Code Emitter"; |
| 30 | } |
| 31 | |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 32 | private: |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 33 | void emitBasicBlock(MachineBasicBlock &MBB); |
| 34 | void emitInstruction(MachineInstr &MI); |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 35 | |
| 36 | void emitRegModRMByte(unsigned ModRMReg, unsigned RegOpcodeField); |
| 37 | void emitSIBByte(unsigned SS, unsigned Index, unsigned Base); |
| 38 | void emitConstant(unsigned Val, unsigned Size); |
| 39 | |
| 40 | void emitMemModRMByte(const MachineInstr &MI, |
| 41 | unsigned Op, unsigned RegOpcodeField); |
| 42 | |
Chris Lattner | 40ead95 | 2002-12-02 21:24:12 +0000 | [diff] [blame] | 43 | }; |
| 44 | } |
| 45 | |
| 46 | |
| 47 | /// addPassesToEmitMachineCode - Add passes to the specified pass manager to get |
| 48 | /// machine code emitted. This uses a MAchineCodeEmitter object to handle |
| 49 | /// actually outputting the machine code and resolving things like the address |
| 50 | /// of functions. This method should returns true if machine code emission is |
| 51 | /// not supported. |
| 52 | /// |
| 53 | bool X86TargetMachine::addPassesToEmitMachineCode(PassManager &PM, |
| 54 | MachineCodeEmitter &MCE) { |
| 55 | PM.add(new Emitter(*this, MCE)); |
| 56 | return false; |
| 57 | } |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 58 | |
| 59 | bool Emitter::runOnFunction(Function &F) { |
| 60 | MachineFunction &MF = MachineFunction::get(&F); |
| 61 | |
| 62 | MCE.startFunction(MF); |
| 63 | for (MachineFunction::iterator I = MF.begin(), E = MF.end(); I != E; ++I) |
| 64 | emitBasicBlock(*I); |
| 65 | MCE.finishFunction(MF); |
| 66 | return false; |
| 67 | } |
| 68 | |
| 69 | void Emitter::emitBasicBlock(MachineBasicBlock &MBB) { |
| 70 | MCE.startBasicBlock(MBB); |
| 71 | for (MachineBasicBlock::iterator I = MBB.begin(), E = MBB.end(); I != E; ++I) |
| 72 | emitInstruction(**I); |
| 73 | } |
| 74 | |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 75 | |
namespace N86 {  // Native X86 register numbers, as used when encoding
  enum {
    EAX = 0,
    ECX = 1,
    EDX = 2,
    EBX = 3,
    ESP = 4,
    EBP = 5,
    ESI = 6,
    EDI = 7
  };
}
| 81 | |
| 82 | |
| 83 | // getX86RegNum - This function maps LLVM register identifiers to their X86 |
| 84 | // specific numbering, which is used in various places encoding instructions. |
| 85 | // |
| 86 | static unsigned getX86RegNum(unsigned RegNo) { |
| 87 | switch(RegNo) { |
| 88 | case X86::EAX: case X86::AX: case X86::AL: return N86::EAX; |
| 89 | case X86::ECX: case X86::CX: case X86::CL: return N86::ECX; |
| 90 | case X86::EDX: case X86::DX: case X86::DL: return N86::EDX; |
| 91 | case X86::EBX: case X86::BX: case X86::BL: return N86::EBX; |
| 92 | case X86::ESP: case X86::SP: case X86::AH: return N86::ESP; |
| 93 | case X86::EBP: case X86::BP: case X86::CH: return N86::EBP; |
| 94 | case X86::ESI: case X86::SI: case X86::DH: return N86::ESI; |
| 95 | case X86::EDI: case X86::DI: case X86::BH: return N86::EDI; |
| 96 | default: |
| 97 | assert(RegNo >= MRegisterInfo::FirstVirtualRegister && |
| 98 | "Unknown physical register!"); |
| 99 | assert(0 && "Register allocator hasn't allocated reg correctly yet!"); |
| 100 | return 0; |
| 101 | } |
| 102 | } |
| 103 | |
// ModRMByte - Pack the three fields of a ModR/M byte: Mod goes in bits 7-6,
// RegOpcode in bits 5-3 and RM in bits 2-0.  Each field must fit in its slot.
//
inline static unsigned char ModRMByte(unsigned Mod, unsigned RegOpcode,
                                      unsigned RM) {
  assert(Mod < 4 && RegOpcode < 8 && RM < 8 && "ModRM Fields out of range!");
  const unsigned Packed = (Mod << 6) | (RegOpcode << 3) | RM;
  return Packed;
}
| 109 | |
| 110 | void Emitter::emitRegModRMByte(unsigned ModRMReg, unsigned RegOpcodeFld){ |
| 111 | MCE.emitByte(ModRMByte(3, RegOpcodeFld, getX86RegNum(ModRMReg))); |
| 112 | } |
| 113 | |
| 114 | void Emitter::emitSIBByte(unsigned SS, unsigned Index, unsigned Base) { |
| 115 | // SIB byte is in the same format as the ModRMByte... |
| 116 | MCE.emitByte(ModRMByte(SS, Index, Base)); |
| 117 | } |
| 118 | |
| 119 | void Emitter::emitConstant(unsigned Val, unsigned Size) { |
| 120 | // Output the constant in little endian byte order... |
| 121 | for (unsigned i = 0; i != Size; ++i) { |
| 122 | MCE.emitByte(Val & 255); |
| 123 | Val >>= 8; |
| 124 | } |
| 125 | } |
| 126 | |
// isDisp8 - Return true if Value fits in a signed 8 bit displacement.
//
static bool isDisp8(int Value) {
  return Value >= -128 && Value <= 127;
}
| 130 | |
| 131 | void Emitter::emitMemModRMByte(const MachineInstr &MI, |
| 132 | unsigned Op, unsigned RegOpcodeField) { |
| 133 | const MachineOperand &BaseReg = MI.getOperand(Op); |
| 134 | const MachineOperand &Scale = MI.getOperand(Op+1); |
| 135 | const MachineOperand &IndexReg = MI.getOperand(Op+2); |
| 136 | const MachineOperand &Disp = MI.getOperand(Op+3); |
| 137 | |
| 138 | // Is a SIB byte needed? |
| 139 | if (IndexReg.getReg() == 0 && BaseReg.getReg() != X86::ESP) { |
| 140 | if (BaseReg.getReg() == 0) { // Just a displacement? |
| 141 | // Emit special case [disp32] encoding |
| 142 | MCE.emitByte(ModRMByte(0, RegOpcodeField, 5)); |
| 143 | emitConstant(Disp.getImmedValue(), 4); |
| 144 | } else { |
| 145 | unsigned BaseRegNo = getX86RegNum(BaseReg.getReg()); |
| 146 | if (Disp.getImmedValue() == 0 && BaseRegNo != N86::EBP) { |
| 147 | // Emit simple indirect register encoding... [EAX] f.e. |
| 148 | MCE.emitByte(ModRMByte(0, RegOpcodeField, BaseRegNo)); |
| 149 | } else if (isDisp8(Disp.getImmedValue())) { |
| 150 | // Emit the disp8 encoding... [REG+disp8] |
| 151 | MCE.emitByte(ModRMByte(1, RegOpcodeField, BaseRegNo)); |
| 152 | emitConstant(Disp.getImmedValue(), 1); |
| 153 | } else { |
| 154 | // Emit the most general non-SIB encoding: [REG+disp32] |
Chris Lattner | 2067184 | 2002-12-13 05:05:05 +0000 | [diff] [blame] | 155 | MCE.emitByte(ModRMByte(2, RegOpcodeField, BaseRegNo)); |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 156 | emitConstant(Disp.getImmedValue(), 4); |
| 157 | } |
| 158 | } |
| 159 | |
| 160 | } else { // We need a SIB byte, so start by outputting the ModR/M byte first |
| 161 | assert(IndexReg.getReg() != X86::ESP && "Cannot use ESP as index reg!"); |
| 162 | |
| 163 | bool ForceDisp32 = false; |
Brian Gaeke | 95780cc | 2002-12-13 07:56:18 +0000 | [diff] [blame] | 164 | bool ForceDisp8 = false; |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 165 | if (BaseReg.getReg() == 0) { |
| 166 | // If there is no base register, we emit the special case SIB byte with |
| 167 | // MOD=0, BASE=5, to JUST get the index, scale, and displacement. |
| 168 | MCE.emitByte(ModRMByte(0, RegOpcodeField, 4)); |
| 169 | ForceDisp32 = true; |
Brian Gaeke | 95780cc | 2002-12-13 07:56:18 +0000 | [diff] [blame] | 170 | } else if (Disp.getImmedValue() == 0 && BaseReg.getReg() != X86::EBP) { |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 171 | // Emit no displacement ModR/M byte |
| 172 | MCE.emitByte(ModRMByte(0, RegOpcodeField, 4)); |
| 173 | } else if (isDisp8(Disp.getImmedValue())) { |
| 174 | // Emit the disp8 encoding... |
| 175 | MCE.emitByte(ModRMByte(1, RegOpcodeField, 4)); |
Brian Gaeke | 95780cc | 2002-12-13 07:56:18 +0000 | [diff] [blame] | 176 | ForceDisp8 = true; // Make sure to force 8 bit disp if Base=EBP |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 177 | } else { |
| 178 | // Emit the normal disp32 encoding... |
| 179 | MCE.emitByte(ModRMByte(2, RegOpcodeField, 4)); |
| 180 | } |
| 181 | |
| 182 | // Calculate what the SS field value should be... |
| 183 | static const unsigned SSTable[] = { ~0, 0, 1, ~0, 2, ~0, ~0, ~0, 3 }; |
| 184 | unsigned SS = SSTable[Scale.getImmedValue()]; |
| 185 | |
| 186 | if (BaseReg.getReg() == 0) { |
| 187 | // Handle the SIB byte for the case where there is no base. The |
| 188 | // displacement has already been output. |
| 189 | assert(IndexReg.getReg() && "Index register must be specified!"); |
| 190 | emitSIBByte(SS, getX86RegNum(IndexReg.getReg()), 5); |
| 191 | } else { |
| 192 | unsigned BaseRegNo = getX86RegNum(BaseReg.getReg()); |
| 193 | unsigned IndexRegNo = getX86RegNum(IndexReg.getReg()); |
| 194 | emitSIBByte(SS, IndexRegNo, BaseRegNo); |
| 195 | } |
| 196 | |
| 197 | // Do we need to output a displacement? |
Brian Gaeke | 95780cc | 2002-12-13 07:56:18 +0000 | [diff] [blame] | 198 | if (Disp.getImmedValue() != 0 || ForceDisp32 || ForceDisp8) { |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 199 | if (!ForceDisp32 && isDisp8(Disp.getImmedValue())) |
| 200 | emitConstant(Disp.getImmedValue(), 1); |
| 201 | else |
| 202 | emitConstant(Disp.getImmedValue(), 4); |
| 203 | } |
| 204 | } |
| 205 | } |
| 206 | |
Misha Brukman | 5000e43 | 2002-12-13 02:13:15 +0000 | [diff] [blame] | 207 | unsigned sizeOfPtr (const MachineInstrDescriptor &Desc) { |
Chris Lattner | a0f38c8 | 2002-12-13 03:51:55 +0000 | [diff] [blame] | 208 | switch (Desc.TSFlags & X86II::ArgMask) { |
| 209 | case X86II::Arg8: return 1; |
| 210 | case X86II::Arg16: return 2; |
| 211 | case X86II::Arg32: return 4; |
| 212 | case X86II::Arg64: return 8; |
| 213 | case X86II::Arg80: return 10; |
| 214 | case X86II::Arg128: return 16; |
Chris Lattner | a6a382c | 2002-12-13 03:50:13 +0000 | [diff] [blame] | 215 | default: assert(0 && "Memory size not set!"); |
Misha Brukman | 5000e43 | 2002-12-13 02:13:15 +0000 | [diff] [blame] | 216 | } |
| 217 | } |
| 218 | |
| 219 | |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 220 | void Emitter::emitInstruction(MachineInstr &MI) { |
| 221 | unsigned Opcode = MI.getOpcode(); |
Chris Lattner | 8f04b09 | 2002-12-02 21:56:18 +0000 | [diff] [blame] | 222 | const MachineInstrDescriptor &Desc = II.get(Opcode); |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 223 | |
| 224 | // Emit instruction prefixes if neccesary |
| 225 | if (Desc.TSFlags & X86II::OpSize) MCE.emitByte(0x66);// Operand size... |
Chris Lattner | 8f04b09 | 2002-12-02 21:56:18 +0000 | [diff] [blame] | 226 | if (Desc.TSFlags & X86II::TB) MCE.emitByte(0x0F);// Two-byte opcode prefix |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 227 | |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 228 | unsigned char BaseOpcode = II.getBaseOpcodeFor(Opcode); |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 229 | switch (Desc.TSFlags & X86II::FormMask) { |
| 230 | case X86II::RawFrm: |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 231 | MCE.emitByte(BaseOpcode); |
Chris Lattner | 8f04b09 | 2002-12-02 21:56:18 +0000 | [diff] [blame] | 232 | |
| 233 | if (MI.getNumOperands() == 1) { |
| 234 | assert(MI.getOperand(0).getType() == MachineOperand::MO_PCRelativeDisp); |
| 235 | MCE.emitPCRelativeDisp(MI.getOperand(0).getVRegValue()); |
| 236 | } |
Chris Lattner | 8f04b09 | 2002-12-02 21:56:18 +0000 | [diff] [blame] | 237 | break; |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 238 | case X86II::AddRegFrm: |
| 239 | MCE.emitByte(BaseOpcode + getX86RegNum(MI.getOperand(0).getReg())); |
| 240 | if (MI.getNumOperands() == 2) { |
Misha Brukman | 5000e43 | 2002-12-13 02:13:15 +0000 | [diff] [blame] | 241 | unsigned Size = sizeOfPtr(Desc); |
Chris Lattner | ac573f6 | 2002-12-04 17:32:52 +0000 | [diff] [blame] | 242 | if (Value *V = MI.getOperand(1).getVRegValueOrNull()) { |
Chris Lattner | dbf30f7 | 2002-12-04 06:45:19 +0000 | [diff] [blame] | 243 | assert(Size == 4 && "Don't know how to emit non-pointer values!"); |
| 244 | MCE.emitGlobalAddress(cast<GlobalValue>(V)); |
| 245 | } else { |
| 246 | emitConstant(MI.getOperand(1).getImmedValue(), Size); |
| 247 | } |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 248 | } |
| 249 | break; |
| 250 | case X86II::MRMDestReg: |
| 251 | MCE.emitByte(BaseOpcode); |
| 252 | emitRegModRMByte(MI.getOperand(0).getReg(), |
| 253 | getX86RegNum(MI.getOperand(MI.getNumOperands()-1).getReg())); |
| 254 | break; |
| 255 | case X86II::MRMDestMem: |
| 256 | MCE.emitByte(BaseOpcode); |
| 257 | emitMemModRMByte(MI, 0, getX86RegNum(MI.getOperand(4).getReg())); |
| 258 | break; |
| 259 | case X86II::MRMSrcReg: |
| 260 | MCE.emitByte(BaseOpcode); |
| 261 | emitRegModRMByte(MI.getOperand(MI.getNumOperands()-1).getReg(), |
| 262 | getX86RegNum(MI.getOperand(0).getReg())); |
| 263 | break; |
| 264 | case X86II::MRMSrcMem: |
| 265 | MCE.emitByte(BaseOpcode); |
| 266 | emitMemModRMByte(MI, MI.getNumOperands()-4, |
| 267 | getX86RegNum(MI.getOperand(0).getReg())); |
| 268 | break; |
| 269 | |
| 270 | case X86II::MRMS0r: case X86II::MRMS1r: |
| 271 | case X86II::MRMS2r: case X86II::MRMS3r: |
| 272 | case X86II::MRMS4r: case X86II::MRMS5r: |
| 273 | case X86II::MRMS6r: case X86II::MRMS7r: |
| 274 | MCE.emitByte(BaseOpcode); |
| 275 | emitRegModRMByte(MI.getOperand(0).getReg(), |
| 276 | (Desc.TSFlags & X86II::FormMask)-X86II::MRMS0r); |
| 277 | |
Chris Lattner | d909683 | 2002-12-15 08:01:39 +0000 | [diff] [blame] | 278 | if (MI.getOperand(MI.getNumOperands()-1).isImmediate()) { |
Misha Brukman | 5000e43 | 2002-12-13 02:13:15 +0000 | [diff] [blame] | 279 | unsigned Size = sizeOfPtr(Desc); |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 280 | emitConstant(MI.getOperand(MI.getNumOperands()-1).getImmedValue(), Size); |
| 281 | } |
| 282 | break; |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 283 | } |
| 284 | } |