blob: c44da97a90e6837f482c1f69deaca734a70ff4b9 [file] [log] [blame]
/*
 * Copyright (C) 2014 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
16
17#ifndef ART_COMPILER_OPTIMIZING_CODE_GENERATOR_X86_H_
18#define ART_COMPILER_OPTIMIZING_CODE_GENERATOR_X86_H_
19
Mark P Mendell17077d82015-12-16 19:15:59 +000020#include "arch/x86/instruction_set_features_x86.h"
Andreas Gampe542451c2016-07-26 09:02:02 -070021#include "base/enums.h"
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +000022#include "code_generator.h"
Andreas Gampe8a0128a2016-11-28 07:38:35 -080023#include "dex_file_types.h"
Calin Juravlecd6dffe2015-01-08 17:35:35 +000024#include "driver/compiler_options.h"
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +000025#include "nodes.h"
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +010026#include "parallel_move_resolver.h"
Nicolas Geoffray787c3072014-03-17 10:20:19 +000027#include "utils/x86/assembler_x86.h"
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +000028
29namespace art {
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +000030namespace x86 {
31
Nicolas Geoffray86a8d7a2014-11-19 08:47:18 +000032// Use a local definition to prevent copying mistakes.
Andreas Gampe542451c2016-07-26 09:02:02 -070033static constexpr size_t kX86WordSize = static_cast<size_t>(kX86PointerSize);
Nicolas Geoffray707c8092014-04-04 10:50:14 +010034
Nicolas Geoffray01bc96d2014-04-11 17:43:50 +010035class CodeGeneratorX86;
36
Nicolas Geoffraya747a392014-04-17 14:56:23 +010037static constexpr Register kParameterCoreRegisters[] = { ECX, EDX, EBX };
38static constexpr RegisterPair kParameterCorePairRegisters[] = { ECX_EDX, EDX_EBX };
39static constexpr size_t kParameterCoreRegistersLength = arraysize(kParameterCoreRegisters);
Mark P Mendell966c3ae2015-01-27 15:45:27 +000040static constexpr XmmRegister kParameterFpuRegisters[] = { XMM0, XMM1, XMM2, XMM3 };
41static constexpr size_t kParameterFpuRegistersLength = arraysize(kParameterFpuRegisters);
Nicolas Geoffraya747a392014-04-17 14:56:23 +010042
Nicolas Geoffrayd75948a2015-03-27 09:53:16 +000043static constexpr Register kRuntimeParameterCoreRegisters[] = { EAX, ECX, EDX, EBX };
44static constexpr size_t kRuntimeParameterCoreRegistersLength =
45 arraysize(kRuntimeParameterCoreRegisters);
46static constexpr XmmRegister kRuntimeParameterFpuRegisters[] = { XMM0, XMM1, XMM2, XMM3 };
47static constexpr size_t kRuntimeParameterFpuRegistersLength =
48 arraysize(kRuntimeParameterFpuRegisters);
49
50class InvokeRuntimeCallingConvention : public CallingConvention<Register, XmmRegister> {
51 public:
52 InvokeRuntimeCallingConvention()
53 : CallingConvention(kRuntimeParameterCoreRegisters,
54 kRuntimeParameterCoreRegistersLength,
55 kRuntimeParameterFpuRegisters,
Mathieu Chartiere401d142015-04-22 13:56:20 -070056 kRuntimeParameterFpuRegistersLength,
57 kX86PointerSize) {}
Nicolas Geoffrayd75948a2015-03-27 09:53:16 +000058
59 private:
60 DISALLOW_COPY_AND_ASSIGN(InvokeRuntimeCallingConvention);
61};
62
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +010063class InvokeDexCallingConvention : public CallingConvention<Register, XmmRegister> {
Nicolas Geoffraya747a392014-04-17 14:56:23 +010064 public:
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +010065 InvokeDexCallingConvention() : CallingConvention(
66 kParameterCoreRegisters,
67 kParameterCoreRegistersLength,
68 kParameterFpuRegisters,
Mathieu Chartiere401d142015-04-22 13:56:20 -070069 kParameterFpuRegistersLength,
70 kX86PointerSize) {}
Nicolas Geoffraya747a392014-04-17 14:56:23 +010071
72 RegisterPair GetRegisterPairAt(size_t argument_index) {
73 DCHECK_LT(argument_index + 1, GetNumberOfRegisters());
74 return kParameterCorePairRegisters[argument_index];
75 }
76
77 private:
78 DISALLOW_COPY_AND_ASSIGN(InvokeDexCallingConvention);
79};
80
Roland Levillain2d27c8e2015-04-28 15:48:45 +010081class InvokeDexCallingConventionVisitorX86 : public InvokeDexCallingConventionVisitor {
Nicolas Geoffraya747a392014-04-17 14:56:23 +010082 public:
Roland Levillain2d27c8e2015-04-28 15:48:45 +010083 InvokeDexCallingConventionVisitorX86() {}
84 virtual ~InvokeDexCallingConventionVisitorX86() {}
Nicolas Geoffraya747a392014-04-17 14:56:23 +010085
Roland Levillain2d27c8e2015-04-28 15:48:45 +010086 Location GetNextLocation(Primitive::Type type) OVERRIDE;
Nicolas Geoffrayfd88f162015-06-03 11:23:52 +010087 Location GetReturnLocation(Primitive::Type type) const OVERRIDE;
88 Location GetMethodLocation() const OVERRIDE;
Nicolas Geoffraya747a392014-04-17 14:56:23 +010089
90 private:
91 InvokeDexCallingConvention calling_convention;
Nicolas Geoffraya747a392014-04-17 14:56:23 +010092
Roland Levillain2d27c8e2015-04-28 15:48:45 +010093 DISALLOW_COPY_AND_ASSIGN(InvokeDexCallingConventionVisitorX86);
Nicolas Geoffraya747a392014-04-17 14:56:23 +010094};
95
Calin Juravlee460d1d2015-09-29 04:52:17 +010096class FieldAccessCallingConventionX86 : public FieldAccessCallingConvention {
97 public:
98 FieldAccessCallingConventionX86() {}
99
100 Location GetObjectLocation() const OVERRIDE {
101 return Location::RegisterLocation(ECX);
102 }
103 Location GetFieldIndexLocation() const OVERRIDE {
104 return Location::RegisterLocation(EAX);
105 }
106 Location GetReturnLocation(Primitive::Type type) const OVERRIDE {
107 return Primitive::Is64BitType(type)
108 ? Location::RegisterPairLocation(EAX, EDX)
109 : Location::RegisterLocation(EAX);
110 }
111 Location GetSetValueLocation(Primitive::Type type, bool is_instance) const OVERRIDE {
112 return Primitive::Is64BitType(type)
113 ? Location::RegisterPairLocation(EDX, EBX)
114 : (is_instance
115 ? Location::RegisterLocation(EDX)
116 : Location::RegisterLocation(ECX));
117 }
118 Location GetFpuLocation(Primitive::Type type ATTRIBUTE_UNUSED) const OVERRIDE {
119 return Location::FpuRegisterLocation(XMM0);
120 }
121
122 private:
123 DISALLOW_COPY_AND_ASSIGN(FieldAccessCallingConventionX86);
124};
125
Zheng Xuad4450e2015-04-17 18:48:56 +0800126class ParallelMoveResolverX86 : public ParallelMoveResolverWithSwap {
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +0100127 public:
128 ParallelMoveResolverX86(ArenaAllocator* allocator, CodeGeneratorX86* codegen)
Zheng Xuad4450e2015-04-17 18:48:56 +0800129 : ParallelMoveResolverWithSwap(allocator), codegen_(codegen) {}
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +0100130
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000131 void EmitMove(size_t index) OVERRIDE;
132 void EmitSwap(size_t index) OVERRIDE;
133 void SpillScratch(int reg) OVERRIDE;
134 void RestoreScratch(int reg) OVERRIDE;
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +0100135
136 X86Assembler* GetAssembler() const;
137
138 private:
139 void Exchange(Register reg, int mem);
140 void Exchange(int mem1, int mem2);
Mark Mendell7c8d0092015-01-26 11:21:33 -0500141 void Exchange32(XmmRegister reg, int mem);
142 void MoveMemoryToMemory32(int dst, int src);
143 void MoveMemoryToMemory64(int dst, int src);
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +0100144
145 CodeGeneratorX86* const codegen_;
146
147 DISALLOW_COPY_AND_ASSIGN(ParallelMoveResolverX86);
148};
149
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000150class LocationsBuilderX86 : public HGraphVisitor {
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000151 public:
Nicolas Geoffray01bc96d2014-04-11 17:43:50 +0100152 LocationsBuilderX86(HGraph* graph, CodeGeneratorX86* codegen)
153 : HGraphVisitor(graph), codegen_(codegen) {}
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000154
Nicolas Geoffray360231a2014-10-08 21:07:48 +0100155#define DECLARE_VISIT_INSTRUCTION(name, super) \
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000156 void Visit##name(H##name* instr) OVERRIDE;
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000157
Alexandre Ramesef20f712015-06-09 10:29:30 +0100158 FOR_EACH_CONCRETE_INSTRUCTION_COMMON(DECLARE_VISIT_INSTRUCTION)
159 FOR_EACH_CONCRETE_INSTRUCTION_X86(DECLARE_VISIT_INSTRUCTION)
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000160
161#undef DECLARE_VISIT_INSTRUCTION
162
Alexandre Ramesef20f712015-06-09 10:29:30 +0100163 void VisitInstruction(HInstruction* instruction) OVERRIDE {
164 LOG(FATAL) << "Unreachable instruction " << instruction->DebugName()
165 << " (id " << instruction->GetId() << ")";
166 }
167
Nicolas Geoffray9574c4b2014-11-12 13:19:37 +0000168 private:
169 void HandleBitwiseOperation(HBinaryOperation* instruction);
Nicolas Geoffraye982f0b2014-08-13 02:11:24 +0100170 void HandleInvoke(HInvoke* invoke);
Vladimir Marko5f7b58e2015-11-23 19:49:34 +0000171 void HandleCondition(HCondition* condition);
Calin Juravle9aec02f2014-11-18 23:06:35 +0000172 void HandleShift(HBinaryOperation* instruction);
Calin Juravle52c48962014-12-16 17:02:57 +0000173 void HandleFieldSet(HInstruction* instruction, const FieldInfo& field_info);
174 void HandleFieldGet(HInstruction* instruction, const FieldInfo& field_info);
Nicolas Geoffraye982f0b2014-08-13 02:11:24 +0100175
Nicolas Geoffray01bc96d2014-04-11 17:43:50 +0100176 CodeGeneratorX86* const codegen_;
Roland Levillain2d27c8e2015-04-28 15:48:45 +0100177 InvokeDexCallingConventionVisitorX86 parameter_visitor_;
Nicolas Geoffray01bc96d2014-04-11 17:43:50 +0100178
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000179 DISALLOW_COPY_AND_ASSIGN(LocationsBuilderX86);
180};
181
Aart Bik42249c32016-01-07 15:33:50 -0800182class InstructionCodeGeneratorX86 : public InstructionCodeGenerator {
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000183 public:
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100184 InstructionCodeGeneratorX86(HGraph* graph, CodeGeneratorX86* codegen);
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000185
Nicolas Geoffray360231a2014-10-08 21:07:48 +0100186#define DECLARE_VISIT_INSTRUCTION(name, super) \
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000187 void Visit##name(H##name* instr) OVERRIDE;
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000188
Alexandre Ramesef20f712015-06-09 10:29:30 +0100189 FOR_EACH_CONCRETE_INSTRUCTION_COMMON(DECLARE_VISIT_INSTRUCTION)
190 FOR_EACH_CONCRETE_INSTRUCTION_X86(DECLARE_VISIT_INSTRUCTION)
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000191
192#undef DECLARE_VISIT_INSTRUCTION
193
Alexandre Ramesef20f712015-06-09 10:29:30 +0100194 void VisitInstruction(HInstruction* instruction) OVERRIDE {
195 LOG(FATAL) << "Unreachable instruction " << instruction->DebugName()
196 << " (id " << instruction->GetId() << ")";
197 }
198
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100199 X86Assembler* GetAssembler() const { return assembler_; }
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000200
Vladimir Markof3e0ee22015-12-17 15:23:13 +0000201 // The compare/jump sequence will generate about (1.5 * num_entries) instructions. A jump
202 // table version generates 7 instructions and num_entries literals. Compare/jump sequence will
203 // generates less code/data with a small num_entries.
204 static constexpr uint32_t kPackedSwitchJumpTableThreshold = 5;
205
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000206 private:
Nicolas Geoffray3c049742014-09-24 18:10:46 +0100207 // Generate code for the given suspend check. If not null, `successor`
208 // is the block to branch to if the suspend check is not needed, and after
209 // the suspend call.
210 void GenerateSuspendCheck(HSuspendCheck* check, HBasicBlock* successor);
Andreas Gampe85b62f22015-09-09 13:15:38 -0700211 void GenerateClassInitializationCheck(SlowPathCode* slow_path, Register class_reg);
Nicolas Geoffray9574c4b2014-11-12 13:19:37 +0000212 void HandleBitwiseOperation(HBinaryOperation* instruction);
Calin Juravlebacfec32014-11-14 15:54:36 +0000213 void GenerateDivRemIntegral(HBinaryOperation* instruction);
Guillaume Sanchez0f88e872015-03-30 17:55:45 +0100214 void DivRemOneOrMinusOne(HBinaryOperation* instruction);
Guillaume Sanchezb19930c2015-04-09 21:12:15 +0100215 void DivByPowerOfTwo(HDiv* instruction);
Guillaume Sanchez0f88e872015-03-30 17:55:45 +0100216 void GenerateDivRemWithAnyConstant(HBinaryOperation* instruction);
Mark Mendellc4701932015-04-10 13:18:51 -0400217 void GenerateRemFP(HRem* rem);
Vladimir Marko5f7b58e2015-11-23 19:49:34 +0000218 void HandleCondition(HCondition* condition);
Calin Juravle9aec02f2014-11-18 23:06:35 +0000219 void HandleShift(HBinaryOperation* instruction);
220 void GenerateShlLong(const Location& loc, Register shifter);
221 void GenerateShrLong(const Location& loc, Register shifter);
222 void GenerateUShrLong(const Location& loc, Register shifter);
Mark P Mendell73945692015-04-29 14:56:17 +0000223 void GenerateShlLong(const Location& loc, int shift);
224 void GenerateShrLong(const Location& loc, int shift);
225 void GenerateUShrLong(const Location& loc, int shift);
Roland Levillain7c1559a2015-12-15 10:55:36 +0000226
Nicolas Geoffray07276db2015-05-18 14:22:09 +0100227 void HandleFieldSet(HInstruction* instruction,
228 const FieldInfo& field_info,
229 bool value_can_be_null);
Calin Juravle52c48962014-12-16 17:02:57 +0000230 void HandleFieldGet(HInstruction* instruction, const FieldInfo& field_info);
Roland Levillain7c1559a2015-12-15 10:55:36 +0000231
232 // Generate a heap reference load using one register `out`:
233 //
234 // out <- *(out + offset)
235 //
236 // while honoring heap poisoning and/or read barriers (if any).
Roland Levillain95e7ffc2016-01-22 11:57:25 +0000237 //
238 // Location `maybe_temp` is used when generating a read barrier and
239 // shall be a register in that case; it may be an invalid location
240 // otherwise.
Roland Levillain7c1559a2015-12-15 10:55:36 +0000241 void GenerateReferenceLoadOneRegister(HInstruction* instruction,
242 Location out,
243 uint32_t offset,
Mathieu Chartieraa474eb2016-11-09 15:18:27 -0800244 Location maybe_temp,
Mathieu Chartier3af00dc2016-11-10 11:25:57 -0800245 ReadBarrierOption read_barrier_option);
Roland Levillain7c1559a2015-12-15 10:55:36 +0000246 // Generate a heap reference load using two different registers
247 // `out` and `obj`:
248 //
249 // out <- *(obj + offset)
250 //
251 // while honoring heap poisoning and/or read barriers (if any).
Roland Levillain95e7ffc2016-01-22 11:57:25 +0000252 //
253 // Location `maybe_temp` is used when generating a Baker's (fast
254 // path) read barrier and shall be a register in that case; it may
255 // be an invalid location otherwise.
Roland Levillain7c1559a2015-12-15 10:55:36 +0000256 void GenerateReferenceLoadTwoRegisters(HInstruction* instruction,
257 Location out,
258 Location obj,
Mathieu Chartier5c44c1b2016-11-04 18:13:04 -0700259 uint32_t offset,
Mathieu Chartier3af00dc2016-11-10 11:25:57 -0800260 ReadBarrierOption read_barrier_option);
Roland Levillain7c1559a2015-12-15 10:55:36 +0000261 // Generate a GC root reference load:
262 //
Vladimir Markocac5a7e2016-02-22 10:39:50 +0000263 // root <- *address
Roland Levillain7c1559a2015-12-15 10:55:36 +0000264 //
Mathieu Chartier3af00dc2016-11-10 11:25:57 -0800265 // while honoring read barriers based on read_barrier_option.
Roland Levillain7c1559a2015-12-15 10:55:36 +0000266 void GenerateGcRootFieldLoad(HInstruction* instruction,
267 Location root,
Vladimir Markocac5a7e2016-02-22 10:39:50 +0000268 const Address& address,
Roland Levillain00468f32016-10-27 18:02:48 +0100269 Label* fixup_label,
Mathieu Chartier3af00dc2016-11-10 11:25:57 -0800270 ReadBarrierOption read_barrier_option);
Roland Levillain7c1559a2015-12-15 10:55:36 +0000271
Roland Levillain232ade02015-04-20 15:14:36 +0100272 // Push value to FPU stack. `is_fp` specifies whether the value is floating point or not.
273 // `is_wide` specifies whether it is long/double or not.
Mark Mendell24f2dfa2015-01-14 19:51:45 -0500274 void PushOntoFPStack(Location source, uint32_t temp_offset,
Roland Levillain232ade02015-04-20 15:14:36 +0100275 uint32_t stack_adjustment, bool is_fp, bool is_wide);
Nicolas Geoffray3c049742014-09-24 18:10:46 +0100276
Mark Mendell152408f2015-12-31 12:28:50 -0500277 template<class LabelType>
Mingyao Yangd43b3ac2015-04-01 14:03:04 -0700278 void GenerateTestAndBranch(HInstruction* instruction,
David Brazdil0debae72015-11-12 18:37:00 +0000279 size_t condition_input_index,
Mark Mendell152408f2015-12-31 12:28:50 -0500280 LabelType* true_target,
281 LabelType* false_target);
282 template<class LabelType>
David Brazdil0debae72015-11-12 18:37:00 +0000283 void GenerateCompareTestAndBranch(HCondition* condition,
Mark Mendell152408f2015-12-31 12:28:50 -0500284 LabelType* true_target,
285 LabelType* false_target);
286 template<class LabelType>
287 void GenerateFPJumps(HCondition* cond, LabelType* true_label, LabelType* false_label);
288 template<class LabelType>
289 void GenerateLongComparesAndJumps(HCondition* cond,
290 LabelType* true_label,
291 LabelType* false_label);
292
David Brazdilfc6a86a2015-06-26 10:33:45 +0000293 void HandleGoto(HInstruction* got, HBasicBlock* successor);
Vladimir Markof3e0ee22015-12-17 15:23:13 +0000294 void GenPackedSwitchWithCompares(Register value_reg,
295 int32_t lower_bound,
296 uint32_t num_entries,
297 HBasicBlock* switch_block,
298 HBasicBlock* default_block);
Calin Juravlecd6dffe2015-01-08 17:35:35 +0000299
Mark P Mendell2f10a5f2016-01-25 14:47:50 +0000300 void GenerateFPCompare(Location lhs, Location rhs, HInstruction* insn, bool is_double);
301
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100302 X86Assembler* const assembler_;
303 CodeGeneratorX86* const codegen_;
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000304
305 DISALLOW_COPY_AND_ASSIGN(InstructionCodeGeneratorX86);
306};
307
// Forward declaration; the class is defined outside this part of the file.
class JumpTableRIPFixup;
309
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000310class CodeGeneratorX86 : public CodeGenerator {
311 public:
Mark Mendellfb8d2792015-03-31 22:16:59 -0400312 CodeGeneratorX86(HGraph* graph,
313 const X86InstructionSetFeatures& isa_features,
Serban Constantinescuecc43662015-08-13 13:33:12 +0100314 const CompilerOptions& compiler_options,
315 OptimizingCompilerStats* stats = nullptr);
Nicolas Geoffrayf12feb82014-07-17 18:32:41 +0100316 virtual ~CodeGeneratorX86() {}
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000317
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000318 void GenerateFrameEntry() OVERRIDE;
319 void GenerateFrameExit() OVERRIDE;
320 void Bind(HBasicBlock* block) OVERRIDE;
Calin Juravle175dc732015-08-25 15:42:32 +0100321 void MoveConstant(Location destination, int32_t value) OVERRIDE;
Calin Juravlee460d1d2015-09-29 04:52:17 +0100322 void MoveLocation(Location dst, Location src, Primitive::Type dst_type) OVERRIDE;
323 void AddLocationAsTemp(Location location, LocationSummary* locations) OVERRIDE;
324
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000325 size_t SaveCoreRegister(size_t stack_index, uint32_t reg_id) OVERRIDE;
326 size_t RestoreCoreRegister(size_t stack_index, uint32_t reg_id) OVERRIDE;
Mark Mendell7c8d0092015-01-26 11:21:33 -0500327 size_t SaveFloatingPointRegister(size_t stack_index, uint32_t reg_id) OVERRIDE;
328 size_t RestoreFloatingPointRegister(size_t stack_index, uint32_t reg_id) OVERRIDE;
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000329
Alexandre Rames8158f282015-08-07 10:26:17 +0100330 // Generate code to invoke a runtime entry point.
Calin Juravle175dc732015-08-25 15:42:32 +0100331 void InvokeRuntime(QuickEntrypointEnum entrypoint,
332 HInstruction* instruction,
333 uint32_t dex_pc,
Serban Constantinescuba45db02016-07-12 22:53:02 +0100334 SlowPathCode* slow_path = nullptr) OVERRIDE;
Alexandre Rames8158f282015-08-07 10:26:17 +0100335
Roland Levillaindec8f632016-07-22 17:10:06 +0100336 // Generate code to invoke a runtime entry point, but do not record
337 // PC-related information in a stack map.
338 void InvokeRuntimeWithoutRecordingPcInfo(int32_t entry_point_offset,
339 HInstruction* instruction,
340 SlowPathCode* slow_path);
341
Serban Constantinescuba45db02016-07-12 22:53:02 +0100342 void GenerateInvokeRuntime(int32_t entry_point_offset);
343
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000344 size_t GetWordSize() const OVERRIDE {
Nicolas Geoffray707c8092014-04-04 10:50:14 +0100345 return kX86WordSize;
346 }
347
Mark Mendellf85a9ca2015-01-13 09:20:58 -0500348 size_t GetFloatingPointSpillSlotSize() const OVERRIDE {
349 // 8 bytes == 2 words for each spill.
350 return 2 * kX86WordSize;
351 }
352
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000353 HGraphVisitor* GetLocationBuilder() OVERRIDE {
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000354 return &location_builder_;
355 }
356
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000357 HGraphVisitor* GetInstructionVisitor() OVERRIDE {
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000358 return &instruction_visitor_;
359 }
360
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000361 X86Assembler* GetAssembler() OVERRIDE {
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000362 return &assembler_;
363 }
364
Alexandre Rameseb7b7392015-06-19 14:47:01 +0100365 const X86Assembler& GetAssembler() const OVERRIDE {
366 return assembler_;
367 }
368
Alexandre Ramesc01a6642016-04-15 11:54:06 +0100369 uintptr_t GetAddressOf(HBasicBlock* block) OVERRIDE {
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000370 return GetLabelOf(block)->Position();
371 }
Calin Juravle34bacdf2014-10-07 20:23:36 +0100372
David Brazdil58282f42016-01-14 12:45:10 +0000373 void SetupBlockedRegisters() const OVERRIDE;
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100374
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000375 void DumpCoreRegister(std::ostream& stream, int reg) const OVERRIDE;
376 void DumpFloatingPointRegister(std::ostream& stream, int reg) const OVERRIDE;
Nicolas Geoffraya7062e02014-05-22 12:50:17 +0100377
Nicolas Geoffrayf0e39372014-11-12 17:50:07 +0000378 ParallelMoveResolverX86* GetMoveResolver() OVERRIDE {
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +0100379 return &move_resolver_;
380 }
381
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000382 InstructionSet GetInstructionSet() const OVERRIDE {
Nicolas Geoffray412f10c2014-06-19 10:00:34 +0100383 return InstructionSet::kX86;
384 }
385
Nicolas Geoffray01bc96d2014-04-11 17:43:50 +0100386 // Helper method to move a 32bits value between two locations.
387 void Move32(Location destination, Location source);
388 // Helper method to move a 64bits value between two locations.
389 void Move64(Location destination, Location source);
390
Vladimir Markocac5a7e2016-02-22 10:39:50 +0000391 // Check if the desired_string_load_kind is supported. If it is, return it,
392 // otherwise return a fall-back kind that should be used instead.
393 HLoadString::LoadKind GetSupportedLoadStringKind(
394 HLoadString::LoadKind desired_string_load_kind) OVERRIDE;
395
Vladimir Markodbb7f5b2016-03-30 13:23:58 +0100396 // Check if the desired_class_load_kind is supported. If it is, return it,
397 // otherwise return a fall-back kind that should be used instead.
398 HLoadClass::LoadKind GetSupportedLoadClassKind(
399 HLoadClass::LoadKind desired_class_load_kind) OVERRIDE;
400
Vladimir Markodc151b22015-10-15 18:02:30 +0100401 // Check if the desired_dispatch_info is supported. If it is, return it,
402 // otherwise return a fall-back info that should be used instead.
403 HInvokeStaticOrDirect::DispatchInfo GetSupportedInvokeStaticOrDirectDispatch(
404 const HInvokeStaticOrDirect::DispatchInfo& desired_dispatch_info,
Nicolas Geoffray5e4e11e2016-09-22 13:17:41 +0100405 HInvokeStaticOrDirect* invoke) OVERRIDE;
Vladimir Markodc151b22015-10-15 18:02:30 +0100406
Mark Mendell09ed1a32015-03-25 08:30:06 -0400407 // Generate a call to a static or direct method.
Serguei Katkov288c7a82016-05-16 11:53:15 +0600408 Location GenerateCalleeMethodStaticOrDirectCall(HInvokeStaticOrDirect* invoke, Location temp);
Andreas Gampe85b62f22015-09-09 13:15:38 -0700409 void GenerateStaticOrDirectCall(HInvokeStaticOrDirect* invoke, Location temp) OVERRIDE;
Andreas Gampebfb5ba92015-09-01 15:45:02 +0000410 // Generate a call to a virtual method.
Andreas Gampe85b62f22015-09-09 13:15:38 -0700411 void GenerateVirtualCall(HInvokeVirtual* invoke, Location temp) OVERRIDE;
412
Vladimir Markocac5a7e2016-02-22 10:39:50 +0000413 void RecordSimplePatch();
Vladimir Markoaad75c62016-10-03 08:46:48 +0000414 void RecordBootStringPatch(HLoadString* load_string);
Vladimir Markodbb7f5b2016-03-30 13:23:58 +0100415 void RecordTypePatch(HLoadClass* load_class);
Vladimir Markoaad75c62016-10-03 08:46:48 +0000416 Label* NewStringBssEntryPatch(HLoadString* load_string);
Vladimir Markocac5a7e2016-02-22 10:39:50 +0000417 Label* NewPcRelativeDexCacheArrayPatch(const DexFile& dex_file, uint32_t element_offset);
Andreas Gampe8a0128a2016-11-28 07:38:35 -0800418 Label* NewJitRootStringPatch(const DexFile& dex_file, dex::StringIndex dex_index);
Nicolas Geoffray22384ae2016-12-12 22:33:36 +0000419 Label* NewJitRootClassPatch(const DexFile& dex_file, dex::TypeIndex dex_index, uint64_t address);
Vladimir Markocac5a7e2016-02-22 10:39:50 +0000420
Andreas Gampe85b62f22015-09-09 13:15:38 -0700421 void MoveFromReturnRegister(Location trg, Primitive::Type type) OVERRIDE;
Mark Mendell09ed1a32015-03-25 08:30:06 -0400422
Vladimir Marko58155012015-08-19 12:49:41 +0000423 // Emit linker patches.
424 void EmitLinkerPatches(ArenaVector<LinkerPatch>* linker_patches) OVERRIDE;
425
Nicolas Geoffray22384ae2016-12-12 22:33:36 +0000426 void PatchJitRootUse(uint8_t* code,
427 const uint8_t* roots_data,
428 const PatchInfo<Label>& info,
429 uint64_t index_in_table) const;
Nicolas Geoffray132d8362016-11-16 09:19:42 +0000430 void EmitJitRootPatches(uint8_t* code, const uint8_t* roots_data) OVERRIDE;
431
Nicolas Geoffray3c7bb982014-07-23 16:04:16 +0100432 // Emit a write barrier.
Nicolas Geoffray07276db2015-05-18 14:22:09 +0100433 void MarkGCCard(Register temp,
434 Register card,
435 Register object,
436 Register value,
437 bool value_can_be_null);
Nicolas Geoffray3c7bb982014-07-23 16:04:16 +0100438
Roland Levillain7c1559a2015-12-15 10:55:36 +0000439 void GenerateMemoryBarrier(MemBarrierKind kind);
440
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +0100441 Label* GetLabelOf(HBasicBlock* block) const {
Vladimir Marko225b6462015-09-28 12:17:40 +0100442 return CommonGetLabelOf<Label>(block_labels_, block);
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +0100443 }
444
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000445 void Initialize() OVERRIDE {
Vladimir Marko225b6462015-09-28 12:17:40 +0100446 block_labels_ = CommonInitializeLabels<Label>();
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +0100447 }
448
Nicolas Geoffray840e5462015-01-07 16:01:24 +0000449 bool NeedsTwoRegisters(Primitive::Type type) const OVERRIDE {
450 return type == Primitive::kPrimLong;
451 }
452
Nicolas Geoffray234d69d2015-03-09 10:28:50 +0000453 bool ShouldSplitLongMoves() const OVERRIDE { return true; }
454
Nicolas Geoffray1cf95282014-12-12 19:22:03 +0000455 Label* GetFrameEntryLabel() { return &frame_entry_label_; }
456
Mark Mendellfb8d2792015-03-31 22:16:59 -0400457 const X86InstructionSetFeatures& GetInstructionSetFeatures() const {
458 return isa_features_;
459 }
460
Mark Mendell0616ae02015-04-17 12:49:27 -0400461 void SetMethodAddressOffset(int32_t offset) {
462 method_address_offset_ = offset;
463 }
464
465 int32_t GetMethodAddressOffset() const {
466 return method_address_offset_;
467 }
468
469 int32_t ConstantAreaStart() const {
470 return constant_area_start_;
471 }
472
473 Address LiteralDoubleAddress(double v, Register reg);
474 Address LiteralFloatAddress(float v, Register reg);
475 Address LiteralInt32Address(int32_t v, Register reg);
476 Address LiteralInt64Address(int64_t v, Register reg);
477
Aart Bika19616e2016-02-01 18:57:58 -0800478 // Load a 32-bit value into a register in the most efficient manner.
479 void Load32BitValue(Register dest, int32_t value);
480
481 // Compare a register with a 32-bit value in the most efficient manner.
482 void Compare32BitValue(Register dest, int32_t value);
483
Vladimir Marko56f4bdd2016-09-16 11:32:36 +0100484 // Compare int values. Supports only register locations for `lhs`.
485 void GenerateIntCompare(Location lhs, Location rhs);
jessicahandojo4877b792016-09-08 19:49:13 -0700486 void GenerateIntCompare(Register lhs, Location rhs);
Vladimir Marko56f4bdd2016-09-16 11:32:36 +0100487
488 // Construct address for array access.
489 static Address ArrayAddress(Register obj,
490 Location index,
491 ScaleFactor scale,
492 uint32_t data_offset);
493
Mark Mendell805b3b52015-09-18 14:10:29 -0400494 Address LiteralCaseTable(HX86PackedSwitch* switch_instr, Register reg, Register value);
495
Mark Mendell0616ae02015-04-17 12:49:27 -0400496 void Finalize(CodeAllocator* allocator) OVERRIDE;
497
Roland Levillain7c1559a2015-12-15 10:55:36 +0000498 // Fast path implementation of ReadBarrier::Barrier for a heap
499 // reference field load when Baker's read barriers are used.
500 void GenerateFieldLoadWithBakerReadBarrier(HInstruction* instruction,
Roland Levillaine3f43ac2016-01-19 15:07:47 +0000501 Location ref,
Roland Levillain7c1559a2015-12-15 10:55:36 +0000502 Register obj,
503 uint32_t offset,
Roland Levillain7c1559a2015-12-15 10:55:36 +0000504 bool needs_null_check);
505 // Fast path implementation of ReadBarrier::Barrier for a heap
506 // reference array load when Baker's read barriers are used.
507 void GenerateArrayLoadWithBakerReadBarrier(HInstruction* instruction,
Roland Levillaine3f43ac2016-01-19 15:07:47 +0000508 Location ref,
Roland Levillain7c1559a2015-12-15 10:55:36 +0000509 Register obj,
510 uint32_t data_offset,
511 Location index,
Roland Levillain7c1559a2015-12-15 10:55:36 +0000512 bool needs_null_check);
Roland Levillaina1aa3b12016-10-26 13:03:38 +0100513 // Factored implementation, used by GenerateFieldLoadWithBakerReadBarrier,
514 // GenerateArrayLoadWithBakerReadBarrier and some intrinsics.
515 //
516 // Load the object reference located at address `src`, held by
517 // object `obj`, into `ref`, and mark it if needed. The base of
518 // address `src` must be `obj`.
519 //
520 // If `always_update_field` is true, the value of the reference is
521 // atomically updated in the holder (`obj`). This operation
522 // requires a temporary register, which must be provided as a
523 // non-null pointer (`temp`).
Sang, Chunlei0fcd2b82016-04-05 17:12:59 +0800524 void GenerateReferenceLoadWithBakerReadBarrier(HInstruction* instruction,
525 Location ref,
526 Register obj,
527 const Address& src,
Roland Levillaina1aa3b12016-10-26 13:03:38 +0100528 bool needs_null_check,
529 bool always_update_field = false,
530 Register* temp = nullptr);
Roland Levillain7c1559a2015-12-15 10:55:36 +0000531
532 // Generate a read barrier for a heap reference within `instruction`
533 // using a slow path.
Roland Levillain0d5a2812015-11-13 10:07:31 +0000534 //
535 // A read barrier for an object reference read from the heap is
536 // implemented as a call to the artReadBarrierSlow runtime entry
537 // point, which is passed the values in locations `ref`, `obj`, and
538 // `offset`:
539 //
540 // mirror::Object* artReadBarrierSlow(mirror::Object* ref,
541 // mirror::Object* obj,
542 // uint32_t offset);
543 //
544 // The `out` location contains the value returned by
545 // artReadBarrierSlow.
546 //
547 // When `index` is provided (i.e. for array accesses), the offset
548 // value passed to artReadBarrierSlow is adjusted to take `index`
549 // into account.
Roland Levillain7c1559a2015-12-15 10:55:36 +0000550 void GenerateReadBarrierSlow(HInstruction* instruction,
551 Location out,
552 Location ref,
553 Location obj,
554 uint32_t offset,
555 Location index = Location::NoLocation());
Roland Levillain0d5a2812015-11-13 10:07:31 +0000556
Roland Levillain7c1559a2015-12-15 10:55:36 +0000557 // If read barriers are enabled, generate a read barrier for a heap
558 // reference using a slow path. If heap poisoning is enabled, also
559 // unpoison the reference in `out`.
//
// The parameter list is identical to that of GenerateReadBarrierSlow,
// including the Location::NoLocation() default for `index`.
560 void MaybeGenerateReadBarrierSlow(HInstruction* instruction,
561 Location out,
562 Location ref,
563 Location obj,
564 uint32_t offset,
565 Location index = Location::NoLocation());
Roland Levillain0d5a2812015-11-13 10:07:31 +0000566
Roland Levillain7c1559a2015-12-15 10:55:36 +0000567 // Generate a read barrier for a GC root within `instruction` using
568 // a slow path.
Roland Levillain0d5a2812015-11-13 10:07:31 +0000569 //
570 // A read barrier for an object reference GC root is implemented as
571 // a call to the artReadBarrierForRootSlow runtime entry point,
572 // which is passed the value in location `root`:
573 //
574 // mirror::Object* artReadBarrierForRootSlow(GcRoot<mirror::Object>* root);
575 //
576 // The `out` location contains the value returned by
577 // artReadBarrierForRootSlow.
//
// Parameters:
//   instruction - the instruction within which the barrier is generated.
//   out         - location receiving the entry point's return value.
//   root        - location whose value is passed to the entry point.
Roland Levillain7c1559a2015-12-15 10:55:36 +0000578 void GenerateReadBarrierForRootSlow(HInstruction* instruction, Location out, Location root);
Roland Levillain0d5a2812015-11-13 10:07:31 +0000579
Mark P Mendell17077d82015-12-16 19:15:59 +0000580 // Ensure that prior stores complete to memory before subsequent loads.
581 // The locked add implementation will avoid serializing device memory, but will
582 // touch (but not change) the top of the stack.
583 // The 'non_temporal' parameter should be used to ensure ordering of non-temporal stores.
584 void MemoryFence(bool non_temporal = false) {
Mark Mendell7aa04a12016-01-27 22:39:07 -0500585 if (!non_temporal) {
Mark P Mendell17077d82015-12-16 19:15:59 +0000586 assembler_.lock()->addl(Address(ESP, 0), Immediate(0));
587 } else {
588 assembler_.mfence();
589 }
590 }
591
// Code-generation hooks that override functions of the base class (note the
// OVERRIDE marker); they are only declared here.
// NOTE(review): judging by the names, these emit a no-op instruction and the
// implicit / explicit forms of the null check described by `instruction` --
// confirm against the definitions.
Roland Levillainf41f9562016-09-14 19:26:48 +0100592 void GenerateNop() OVERRIDE;
593 void GenerateImplicitNullCheck(HNullCheck* instruction) OVERRIDE;
594 void GenerateExplicitNullCheck(HNullCheck* instruction) OVERRIDE;
Mark P Mendell17077d82015-12-16 19:15:59 +0000595
Vladimir Markocac5a7e2016-02-22 10:39:50 +0000596 // When we don't know the proper offset for the value, we use kDummy32BitOffset.
597 // The correct value will be inserted when processing Assembler fixups.
// NOTE(review): 256 does not fit in a signed 8-bit displacement, so the
// value presumably exists to force a 32-bit offset encoding that the fixup
// can later overwrite -- confirm against the assembler.
598 static constexpr int32_t kDummy32BitOffset = 256;
599
Nicolas Geoffray3c7bb982014-07-23 16:04:16 +0100600 private:
// NOTE(review): presumably returns the register that holds the extra input
// parameter of `invoke`, with `temp` available as a scratch register if the
// value has to be loaded first -- confirm against the definition.
Vladimir Marko0f7dca42015-11-02 14:36:43 +0000601 Register GetInvokeStaticOrDirectExtraParameter(HInvokeStaticOrDirect* invoke, Register temp);
602
// Template parameter `Factory` is a pointer to a function that produces a
// LinkerPatch from the argument list (size_t, const DexFile*, uint32_t,
// uint32_t). `infos` is read-only input; `linker_patches` is the output
// container, passed by pointer.
// NOTE(review): presumably calls `Factory` once per entry of `infos` and
// appends each result to `*linker_patches` -- confirm against the definition.
Vladimir Markoaad75c62016-10-03 08:46:48 +0000603 template <LinkerPatch (*Factory)(size_t, const DexFile*, uint32_t, uint32_t)>
604 void EmitPcRelativeLinkerPatches(const ArenaDeque<PatchInfo<Label>>& infos,
605 ArenaVector<LinkerPatch>* linker_patches);
Vladimir Marko0f7dca42015-11-02 14:36:43 +0000606
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +0100607 // Labels for each block that will be compiled.
Vladimir Marko225b6462015-09-28 12:17:40 +0100608 Label* block_labels_; // Indexed by block id.
// NOTE(review): presumably the label bound at the method's frame entry --
// confirm against its uses.
Nicolas Geoffray1cf95282014-12-12 19:22:03 +0000609 Label frame_entry_label_;
// x86-specific helper objects owned by value by this code generator.
// NOTE(review): by their type names these are the locations builder, the
// instruction code generator and the parallel move resolver -- confirm how
// each is wired up in the constructor.
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000610 LocationsBuilderX86 location_builder_;
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000611 InstructionCodeGeneratorX86 instruction_visitor_;
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +0100612 ParallelMoveResolverX86 move_resolver_;
// Assembler through which instructions are emitted (MemoryFence uses it for
// its locked add / mfence).
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000613 X86Assembler assembler_;
// Held by const reference, so the features object must outlive this code
// generator.
Mark Mendellfb8d2792015-03-31 22:16:59 -0400614 const X86InstructionSetFeatures& isa_features_;
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000615
Vladimir Marko58155012015-08-19 12:49:41 +0000616 // Method patch info. Using ArenaDeque<> which retains element addresses on push/emplace_back().
Vladimir Markoaad75c62016-10-03 08:46:48 +0000617 ArenaDeque<PatchInfo<Label>> method_patches_;
// NOTE(review): presumably patch info for relative calls; it has no comment
// of its own and uses the same container type as method_patches_ -- confirm.
618 ArenaDeque<PatchInfo<Label>> relative_call_patches_;
Vladimir Marko0f7dca42015-11-02 14:36:43 +0000619 // PC-relative DexCache access info.
Vladimir Markoaad75c62016-10-03 08:46:48 +0000620 ArenaDeque<PatchInfo<Label>> pc_relative_dex_cache_patches_;
Vladimir Markocac5a7e2016-02-22 10:39:50 +0000621 // Patch locations for patchoat where the linker doesn't do any other work.
// Unlike the other patch containers, this one stores bare Labels rather than
// PatchInfo<Label> entries.
622 ArenaDeque<Label> simple_patches_;
Vladimir Markoaad75c62016-10-03 08:46:48 +0000623 // String patch locations; type depends on configuration (app .bss or boot image PIC/non-PIC).
624 ArenaDeque<PatchInfo<Label>> string_patches_;
Vladimir Markodbb7f5b2016-03-30 13:23:58 +0100625 // Type patch locations.
Vladimir Markoaad75c62016-10-03 08:46:48 +0000626 ArenaDeque<PatchInfo<Label>> type_patches_;
Vladimir Marko58155012015-08-19 12:49:41 +0000627
Nicolas Geoffray132d8362016-11-16 09:19:42 +0000628 // Patches for string root accesses in JIT compiled code.
629 ArenaDeque<PatchInfo<Label>> jit_string_patches_;
630
Nicolas Geoffray22384ae2016-12-12 22:33:36 +0000631 // Patches for class root accesses in JIT compiled code.
632 ArenaDeque<PatchInfo<Label>> jit_class_patches_;
633
Mark Mendell0616ae02015-04-17 12:49:27 -0400634 // Offset to the start of the constant area in the assembled code.
635 // Used for fixups to the constant area.
636 int32_t constant_area_start_;
637
Mark Mendell805b3b52015-09-18 14:10:29 -0400638 // Fixups for jump tables that need to be patched after the constant table is generated.
639 ArenaVector<JumpTableRIPFixup*> fixups_to_jump_tables_;
640
Mark Mendell0616ae02015-04-17 12:49:27 -0400641 // If there is a HX86ComputeBaseMethodAddress instruction in the graph
642 // (which shall be the sole instruction of this kind), subtracting this offset
643 // from the value contained in the out register of this HX86ComputeBaseMethodAddress
644 // instruction gives the address of the start of this method.
645 int32_t method_address_offset_;
646
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000647 DISALLOW_COPY_AND_ASSIGN(CodeGeneratorX86);
648};
649
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000650} // namespace x86
651} // namespace art
652
653#endif // ART_COMPILER_OPTIMIZING_CODE_GENERATOR_X86_H_