blob: d52f24145f4448bbc4253a7f06292e59e9b7dee4 [file] [log] [blame]
//===-- InstructionWriter.cpp - Functions for writing instructions --------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file was developed by the LLVM research group and is distributed under
// the University of Illinois Open Source License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file implements the routines for encoding instruction opcodes to a
// bytecode stream.
//
//===----------------------------------------------------------------------===//
14
15#include "WriterInternals.h"
16#include "llvm/Module.h"
Chris Lattner00950542001-06-06 20:29:01 +000017#include "llvm/DerivedTypes.h"
Chris Lattner0fe56f42003-09-08 17:58:37 +000018#include "llvm/Instructions.h"
Chris Lattnera92f6962002-10-01 22:38:41 +000019#include "Support/Statistic.h"
Chris Lattner00950542001-06-06 20:29:01 +000020#include <algorithm>
21
Brian Gaeked0fde302003-11-11 22:41:34 +000022namespace llvm {
23
Chris Lattnerce6ef112002-07-26 18:40:14 +000024static Statistic<>
Chris Lattnera407ba12003-01-21 20:13:49 +000025NumInstrs("bytecodewriter", "Number of instructions");
Chris Lattnerce6ef112002-07-26 18:40:14 +000026
Chris Lattner00950542001-06-06 20:29:01 +000027typedef unsigned char uchar;
28
29// outputInstructionFormat0 - Output those wierd instructions that have a large
30// number of operands or have large operands themselves...
31//
32// Format: [opcode] [type] [numargs] [arg0] [arg1] ... [arg<numargs-1>]
33//
Chris Lattner0fe56f42003-09-08 17:58:37 +000034static void outputInstructionFormat0(const Instruction *I, unsigned Opcode,
Chris Lattner00950542001-06-06 20:29:01 +000035 const SlotCalculator &Table,
Chris Lattner697954c2002-01-20 22:54:45 +000036 unsigned Type, std::deque<uchar> &Out) {
Chris Lattner00950542001-06-06 20:29:01 +000037 // Opcode must have top two bits clear...
Chris Lattner0fe56f42003-09-08 17:58:37 +000038 output_vbr(Opcode << 2, Out); // Instruction Opcode ID
Chris Lattner00950542001-06-06 20:29:01 +000039 output_vbr(Type, Out); // Result type
40
Chris Lattnerc8b25d42001-07-07 08:36:50 +000041 unsigned NumArgs = I->getNumOperands();
Chris Lattnereff112c2003-10-18 05:54:48 +000042 output_vbr(NumArgs + (isa<CastInst>(I) || isa<VANextInst>(I) ||
43 isa<VAArgInst>(I)), Out);
Chris Lattner00950542001-06-06 20:29:01 +000044
Chris Lattnerc8b25d42001-07-07 08:36:50 +000045 for (unsigned i = 0; i < NumArgs; ++i) {
Alkis Evlogimenos60596382003-10-17 02:02:40 +000046 int Slot = Table.getSlot(I->getOperand(i));
Chris Lattnere5a57ee2001-07-25 22:47:55 +000047 assert(Slot >= 0 && "No slot number for value!?!?");
48 output_vbr((unsigned)Slot, Out);
49 }
Chris Lattner5ab1f872001-10-21 00:14:44 +000050
Chris Lattnereff112c2003-10-18 05:54:48 +000051 if (isa<CastInst>(I) || isa<VAArgInst>(I)) {
Alkis Evlogimenos60596382003-10-17 02:02:40 +000052 int Slot = Table.getSlot(I->getType());
Chris Lattnereff112c2003-10-18 05:54:48 +000053 assert(Slot != -1 && "Cast return type unknown?");
54 output_vbr((unsigned)Slot, Out);
55 } else if (const VANextInst *VAI = dyn_cast<VANextInst>(I)) {
56 int Slot = Table.getSlot(VAI->getArgType());
57 assert(Slot != -1 && "VarArg argument type unknown?");
Chris Lattner5ab1f872001-10-21 00:14:44 +000058 output_vbr((unsigned)Slot, Out);
59 }
60
Chris Lattnere5a57ee2001-07-25 22:47:55 +000061 align32(Out); // We must maintain correct alignment!
62}
63
64
Misha Brukman37f92e22003-09-11 22:34:13 +000065// outputInstrVarArgsCall - Output the absurdly annoying varargs function calls.
Chris Lattnere5a57ee2001-07-25 22:47:55 +000066// This are more annoying than most because the signature of the call does not
67// tell us anything about the types of the arguments in the varargs portion.
68// Because of this, we encode (as type 0) all of the argument types explicitly
69// before the argument value. This really sucks, but you shouldn't be using
70// varargs functions in your code! *death to printf*!
71//
72// Format: [opcode] [type] [numargs] [arg0] [arg1] ... [arg<numargs-1>]
73//
Chris Lattner0fe56f42003-09-08 17:58:37 +000074static void outputInstrVarArgsCall(const Instruction *I, unsigned Opcode,
Chris Lattnere5a57ee2001-07-25 22:47:55 +000075 const SlotCalculator &Table, unsigned Type,
Chris Lattner697954c2002-01-20 22:54:45 +000076 std::deque<uchar> &Out) {
Chris Lattner1b98c5c2001-10-13 06:48:38 +000077 assert(isa<CallInst>(I) || isa<InvokeInst>(I));
Chris Lattnere5a57ee2001-07-25 22:47:55 +000078 // Opcode must have top two bits clear...
Chris Lattner0fe56f42003-09-08 17:58:37 +000079 output_vbr(Opcode << 2, Out); // Instruction Opcode ID
Chris Lattnere5a57ee2001-07-25 22:47:55 +000080 output_vbr(Type, Out); // Result type (varargs type)
81
Chris Lattnereff112c2003-10-18 05:54:48 +000082 const PointerType *PTy = cast<PointerType>(I->getOperand(0)->getType());
83 const FunctionType *FTy = cast<FunctionType>(PTy->getElementType());
84 unsigned NumParams = FTy->getNumParams();
85
86 unsigned NumFixedOperands;
87 if (isa<CallInst>(I)) {
88 // Output an operand for the callee and each fixed argument, then two for
89 // each variable argument.
90 NumFixedOperands = 1+NumParams;
91 } else {
92 assert(isa<InvokeInst>(I) && "Not call or invoke??");
93 // Output an operand for the callee and destinations, then two for each
94 // variable argument.
95 NumFixedOperands = 3+NumParams;
96 }
97 output_vbr(2 * I->getNumOperands()-NumFixedOperands, Out);
Chris Lattnere5a57ee2001-07-25 22:47:55 +000098
Chris Lattner2fbfdcf2002-04-07 20:49:59 +000099 // The type for the function has already been emitted in the type field of the
Chris Lattner1b98c5c2001-10-13 06:48:38 +0000100 // instruction. Just emit the slot # now.
Chris Lattnereff112c2003-10-18 05:54:48 +0000101 for (unsigned i = 0; i != NumFixedOperands; ++i) {
102 int Slot = Table.getSlot(I->getOperand(i));
Chris Lattnere5a57ee2001-07-25 22:47:55 +0000103 assert(Slot >= 0 && "No slot number for value!?!?");
104 output_vbr((unsigned)Slot, Out);
Chris Lattnereff112c2003-10-18 05:54:48 +0000105 }
Chris Lattnere5a57ee2001-07-25 22:47:55 +0000106
Chris Lattnereff112c2003-10-18 05:54:48 +0000107 for (unsigned i = NumFixedOperands, e = I->getNumOperands(); i != e; ++i) {
108 // Output Arg Type ID
109 int Slot = Table.getSlot(I->getOperand(i)->getType());
110 assert(Slot >= 0 && "No slot number for value!?!?");
111 output_vbr((unsigned)Slot, Out);
112
Chris Lattnere5a57ee2001-07-25 22:47:55 +0000113 // Output arg ID itself
Alkis Evlogimenos60596382003-10-17 02:02:40 +0000114 Slot = Table.getSlot(I->getOperand(i));
Chris Lattnerc8b25d42001-07-07 08:36:50 +0000115 assert(Slot >= 0 && "No slot number for value!?!?");
Chris Lattner00950542001-06-06 20:29:01 +0000116 output_vbr((unsigned)Slot, Out);
117 }
118 align32(Out); // We must maintain correct alignment!
119}
120
121
122// outputInstructionFormat1 - Output one operand instructions, knowing that no
123// operand index is >= 2^12.
124//
Chris Lattner0fe56f42003-09-08 17:58:37 +0000125static void outputInstructionFormat1(const Instruction *I, unsigned Opcode,
Chris Lattner00950542001-06-06 20:29:01 +0000126 const SlotCalculator &Table, int *Slots,
Chris Lattner697954c2002-01-20 22:54:45 +0000127 unsigned Type, std::deque<uchar> &Out) {
Chris Lattner00950542001-06-06 20:29:01 +0000128 // bits Instruction format:
129 // --------------------------
Chris Lattner2b9f6002001-10-23 03:21:10 +0000130 // 01-00: Opcode type, fixed to 1.
131 // 07-02: Opcode
132 // 19-08: Resulting type plane
133 // 31-20: Operand #1 (if set to (2^12-1), then zero operands)
Chris Lattner00950542001-06-06 20:29:01 +0000134 //
Chris Lattner2b9f6002001-10-23 03:21:10 +0000135 unsigned Bits = 1 | (Opcode << 2) | (Type << 8) | (Slots[0] << 20);
Chris Lattner00950542001-06-06 20:29:01 +0000136 // cerr << "1 " << IType << " " << Type << " " << Slots[0] << endl;
Chris Lattner2b9f6002001-10-23 03:21:10 +0000137 output(Bits, Out);
Chris Lattner00950542001-06-06 20:29:01 +0000138}
139
140
141// outputInstructionFormat2 - Output two operand instructions, knowing that no
142// operand index is >= 2^8.
143//
Chris Lattner0fe56f42003-09-08 17:58:37 +0000144static void outputInstructionFormat2(const Instruction *I, unsigned Opcode,
Chris Lattner00950542001-06-06 20:29:01 +0000145 const SlotCalculator &Table, int *Slots,
Chris Lattner697954c2002-01-20 22:54:45 +0000146 unsigned Type, std::deque<uchar> &Out) {
Chris Lattner00950542001-06-06 20:29:01 +0000147 // bits Instruction format:
148 // --------------------------
Chris Lattner2b9f6002001-10-23 03:21:10 +0000149 // 01-00: Opcode type, fixed to 2.
150 // 07-02: Opcode
151 // 15-08: Resulting type plane
152 // 23-16: Operand #1
153 // 31-24: Operand #2
Chris Lattner00950542001-06-06 20:29:01 +0000154 //
Chris Lattner2b9f6002001-10-23 03:21:10 +0000155 unsigned Bits = 2 | (Opcode << 2) | (Type << 8) |
156 (Slots[0] << 16) | (Slots[1] << 24);
Chris Lattner00950542001-06-06 20:29:01 +0000157 // cerr << "2 " << IType << " " << Type << " " << Slots[0] << " "
158 // << Slots[1] << endl;
Chris Lattner2b9f6002001-10-23 03:21:10 +0000159 output(Bits, Out);
Chris Lattner00950542001-06-06 20:29:01 +0000160}
161
162
163// outputInstructionFormat3 - Output three operand instructions, knowing that no
164// operand index is >= 2^6.
165//
Chris Lattner0fe56f42003-09-08 17:58:37 +0000166static void outputInstructionFormat3(const Instruction *I, unsigned Opcode,
Chris Lattner00950542001-06-06 20:29:01 +0000167 const SlotCalculator &Table, int *Slots,
Chris Lattner697954c2002-01-20 22:54:45 +0000168 unsigned Type, std::deque<uchar> &Out) {
Chris Lattner00950542001-06-06 20:29:01 +0000169 // bits Instruction format:
170 // --------------------------
Chris Lattner2b9f6002001-10-23 03:21:10 +0000171 // 01-00: Opcode type, fixed to 3.
172 // 07-02: Opcode
173 // 13-08: Resulting type plane
174 // 19-14: Operand #1
175 // 25-20: Operand #2
176 // 31-26: Operand #3
Chris Lattner00950542001-06-06 20:29:01 +0000177 //
Chris Lattner2b9f6002001-10-23 03:21:10 +0000178 unsigned Bits = 3 | (Opcode << 2) | (Type << 8) |
179 (Slots[0] << 14) | (Slots[1] << 20) | (Slots[2] << 26);
Chris Lattnerc8b25d42001-07-07 08:36:50 +0000180 //cerr << "3 " << IType << " " << Type << " " << Slots[0] << " "
181 // << Slots[1] << " " << Slots[2] << endl;
Chris Lattner2b9f6002001-10-23 03:21:10 +0000182 output(Bits, Out);
Chris Lattner00950542001-06-06 20:29:01 +0000183}
184
Chris Lattner0b12b5f2002-06-25 16:13:21 +0000185void BytecodeWriter::processInstruction(const Instruction &I) {
Chris Lattner0fe56f42003-09-08 17:58:37 +0000186 assert(I.getOpcode() < 62 && "Opcode too big???");
187 unsigned Opcode = I.getOpcode();
188
189 // Encode 'volatile load' as 62 and 'volatile store' as 63.
190 if (isa<LoadInst>(I) && cast<LoadInst>(I).isVolatile())
191 Opcode = 62;
192 if (isa<StoreInst>(I) && cast<StoreInst>(I).isVolatile())
193 Opcode = 63;
Chris Lattner00950542001-06-06 20:29:01 +0000194
Chris Lattner0b12b5f2002-06-25 16:13:21 +0000195 unsigned NumOperands = I.getNumOperands();
Chris Lattner00950542001-06-06 20:29:01 +0000196 int MaxOpSlot = 0;
Chris Lattnerc8b25d42001-07-07 08:36:50 +0000197 int Slots[3]; Slots[0] = (1 << 12)-1; // Marker to signify 0 operands
Chris Lattner00950542001-06-06 20:29:01 +0000198
Chris Lattnerc8b25d42001-07-07 08:36:50 +0000199 for (unsigned i = 0; i < NumOperands; ++i) {
Chris Lattner0b12b5f2002-06-25 16:13:21 +0000200 const Value *Def = I.getOperand(i);
Alkis Evlogimenos60596382003-10-17 02:02:40 +0000201 int slot = Table.getSlot(Def);
Chris Lattner00950542001-06-06 20:29:01 +0000202 assert(slot != -1 && "Broken bytecode!");
203 if (slot > MaxOpSlot) MaxOpSlot = slot;
Chris Lattnerc8b25d42001-07-07 08:36:50 +0000204 if (i < 3) Slots[i] = slot;
Chris Lattner00950542001-06-06 20:29:01 +0000205 }
206
207 // Figure out which type to encode with the instruction. Typically we want
208 // the type of the first parameter, as opposed to the type of the instruction
209 // (for example, with setcc, we always know it returns bool, but the type of
210 // the first param is actually interesting). But if we have no arguments
211 // we take the type of the instruction itself.
212 //
Chris Lattnerab5ac6b2001-07-08 23:22:50 +0000213 const Type *Ty;
Chris Lattner0b12b5f2002-06-25 16:13:21 +0000214 switch (I.getOpcode()) {
Chris Lattnerab5ac6b2001-07-08 23:22:50 +0000215 case Instruction::Malloc:
216 case Instruction::Alloca:
Chris Lattner0b12b5f2002-06-25 16:13:21 +0000217 Ty = I.getType(); // Malloc & Alloca ALWAYS want to encode the return type
Chris Lattnerab5ac6b2001-07-08 23:22:50 +0000218 break;
219 case Instruction::Store:
Chris Lattner0b12b5f2002-06-25 16:13:21 +0000220 Ty = I.getOperand(1)->getType(); // Encode the pointer type...
Chris Lattner9b625032002-05-06 16:15:30 +0000221 assert(isa<PointerType>(Ty) && "Store to nonpointer type!?!?");
Chris Lattnerab5ac6b2001-07-08 23:22:50 +0000222 break;
223 default: // Otherwise use the default behavior...
Chris Lattner0b12b5f2002-06-25 16:13:21 +0000224 Ty = NumOperands ? I.getOperand(0)->getType() : I.getType();
Chris Lattnerab5ac6b2001-07-08 23:22:50 +0000225 break;
226 }
Chris Lattner00950542001-06-06 20:29:01 +0000227
228 unsigned Type;
Alkis Evlogimenos60596382003-10-17 02:02:40 +0000229 int Slot = Table.getSlot(Ty);
Chris Lattner00950542001-06-06 20:29:01 +0000230 assert(Slot != -1 && "Type not available!!?!");
231 Type = (unsigned)Slot;
232
Chris Lattner7c501472001-07-28 17:51:21 +0000233 // Make sure that we take the type number into consideration. We don't want
234 // to overflow the field size for the instruction format we select.
235 //
236 if (Slot > MaxOpSlot) MaxOpSlot = Slot;
237
Chris Lattner09083092001-07-08 04:57:15 +0000238 // Handle the special case for cast...
Chris Lattnereff112c2003-10-18 05:54:48 +0000239 if (isa<CastInst>(I) || isa<VAArgInst>(I)) {
Chris Lattner09083092001-07-08 04:57:15 +0000240 // Cast has to encode the destination type as the second argument in the
241 // packet, or else we won't know what type to cast to!
Alkis Evlogimenos60596382003-10-17 02:02:40 +0000242 Slots[1] = Table.getSlot(I.getType());
Chris Lattner09083092001-07-08 04:57:15 +0000243 assert(Slots[1] != -1 && "Cast return type unknown?");
244 if (Slots[1] > MaxOpSlot) MaxOpSlot = Slots[1];
245 NumOperands++;
Chris Lattnereff112c2003-10-18 05:54:48 +0000246 } else if (const VANextInst *VANI = dyn_cast<VANextInst>(&I)) {
247 Slots[1] = Table.getSlot(VANI->getArgType());
248 assert(Slots[1] != -1 && "va_next return type unknown?");
249 if (Slots[1] > MaxOpSlot) MaxOpSlot = Slots[1];
250 NumOperands++;
Chris Lattner0b12b5f2002-06-25 16:13:21 +0000251 } else if (const CallInst *CI = dyn_cast<CallInst>(&I)){// Handle VarArg calls
Chris Lattner9fcccb02002-06-05 17:49:40 +0000252 const PointerType *Ty = cast<PointerType>(CI->getCalledValue()->getType());
Chris Lattner2aac6bf2002-04-04 22:19:18 +0000253 if (cast<FunctionType>(Ty->getElementType())->isVarArg()) {
Chris Lattner0fe56f42003-09-08 17:58:37 +0000254 outputInstrVarArgsCall(CI, Opcode, Table, Type, Out);
Chris Lattner1b98c5c2001-10-13 06:48:38 +0000255 return;
256 }
Chris Lattner0b12b5f2002-06-25 16:13:21 +0000257 } else if (const InvokeInst *II = dyn_cast<InvokeInst>(&I)) {// ... & Invokes
Chris Lattner9fcccb02002-06-05 17:49:40 +0000258 const PointerType *Ty = cast<PointerType>(II->getCalledValue()->getType());
Chris Lattner2aac6bf2002-04-04 22:19:18 +0000259 if (cast<FunctionType>(Ty->getElementType())->isVarArg()) {
Chris Lattner0fe56f42003-09-08 17:58:37 +0000260 outputInstrVarArgsCall(II, Opcode, Table, Type, Out);
Chris Lattneref9c23f2001-10-03 14:53:21 +0000261 return;
262 }
Chris Lattner09083092001-07-08 04:57:15 +0000263 }
Chris Lattner00950542001-06-06 20:29:01 +0000264
Chris Lattnera407ba12003-01-21 20:13:49 +0000265 ++NumInstrs;
266
Chris Lattner00950542001-06-06 20:29:01 +0000267 // Decide which instruction encoding to use. This is determined primarily by
268 // the number of operands, and secondarily by whether or not the max operand
269 // will fit into the instruction encoding. More operands == fewer bits per
270 // operand.
271 //
272 switch (NumOperands) {
273 case 0:
274 case 1:
275 if (MaxOpSlot < (1 << 12)-1) { // -1 because we use 4095 to indicate 0 ops
Chris Lattner0fe56f42003-09-08 17:58:37 +0000276 outputInstructionFormat1(&I, Opcode, Table, Slots, Type, Out);
Chris Lattnere8fdde12001-09-07 16:39:41 +0000277 return;
Chris Lattner00950542001-06-06 20:29:01 +0000278 }
279 break;
280
281 case 2:
282 if (MaxOpSlot < (1 << 8)) {
Chris Lattner0fe56f42003-09-08 17:58:37 +0000283 outputInstructionFormat2(&I, Opcode, Table, Slots, Type, Out);
Chris Lattnere8fdde12001-09-07 16:39:41 +0000284 return;
Chris Lattner00950542001-06-06 20:29:01 +0000285 }
286 break;
287
288 case 3:
289 if (MaxOpSlot < (1 << 6)) {
Chris Lattner0fe56f42003-09-08 17:58:37 +0000290 outputInstructionFormat3(&I, Opcode, Table, Slots, Type, Out);
Chris Lattnere8fdde12001-09-07 16:39:41 +0000291 return;
Chris Lattner00950542001-06-06 20:29:01 +0000292 }
293 break;
294 }
295
Chris Lattnerab5ac6b2001-07-08 23:22:50 +0000296 // If we weren't handled before here, we either have a large number of
Misha Brukman37f92e22003-09-11 22:34:13 +0000297 // operands or a large operand index that we are referring to.
Chris Lattner0fe56f42003-09-08 17:58:37 +0000298 outputInstructionFormat0(&I, Opcode, Table, Type, Out);
Chris Lattner00950542001-06-06 20:29:01 +0000299}
Brian Gaeked0fde302003-11-11 22:41:34 +0000300
301} // End llvm namespace