/*
 * Copyright (C) 2014 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
16
17#ifndef ART_COMPILER_OPTIMIZING_CODE_GENERATOR_X86_64_H_
18#define ART_COMPILER_OPTIMIZING_CODE_GENERATOR_X86_64_H_
19
Mark P Mendell17077d82015-12-16 19:15:59 +000020#include "arch/x86_64/instruction_set_features_x86_64.h"
Nicolas Geoffray9cf35522014-06-09 18:40:10 +010021#include "code_generator.h"
Calin Juravle52c48962014-12-16 17:02:57 +000022#include "dex/compiler_enums.h"
Calin Juravlecd6dffe2015-01-08 17:35:35 +000023#include "driver/compiler_options.h"
Nicolas Geoffray9cf35522014-06-09 18:40:10 +010024#include "nodes.h"
Nicolas Geoffrayecb2f9b2014-06-13 08:59:59 +000025#include "parallel_move_resolver.h"
Nicolas Geoffray9cf35522014-06-09 18:40:10 +010026#include "utils/x86_64/assembler_x86_64.h"
27
28namespace art {
29namespace x86_64 {
30
Nicolas Geoffray86a8d7a2014-11-19 08:47:18 +000031// Use a local definition to prevent copying mistakes.
32static constexpr size_t kX86_64WordSize = kX86_64PointerSize;
Nicolas Geoffray9cf35522014-06-09 18:40:10 +010033
Nicolas Geoffrayee3cf072015-10-06 11:45:02 +010034// Some x86_64 instructions require a register to be available as temp.
35static constexpr Register TMP = R11;
36
Nicolas Geoffray9cf35522014-06-09 18:40:10 +010037static constexpr Register kParameterCoreRegisters[] = { RSI, RDX, RCX, R8, R9 };
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +010038static constexpr FloatRegister kParameterFloatRegisters[] =
39 { XMM0, XMM1, XMM2, XMM3, XMM4, XMM5, XMM6, XMM7 };
Nicolas Geoffray9cf35522014-06-09 18:40:10 +010040
41static constexpr size_t kParameterCoreRegistersLength = arraysize(kParameterCoreRegisters);
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +010042static constexpr size_t kParameterFloatRegistersLength = arraysize(kParameterFloatRegisters);
Nicolas Geoffray9cf35522014-06-09 18:40:10 +010043
Jeff Hao848f70a2014-01-15 13:49:50 -080044static constexpr Register kRuntimeParameterCoreRegisters[] = { RDI, RSI, RDX, RCX };
Nicolas Geoffrayd75948a2015-03-27 09:53:16 +000045static constexpr size_t kRuntimeParameterCoreRegistersLength =
46 arraysize(kRuntimeParameterCoreRegisters);
47static constexpr FloatRegister kRuntimeParameterFpuRegisters[] = { XMM0, XMM1 };
48static constexpr size_t kRuntimeParameterFpuRegistersLength =
49 arraysize(kRuntimeParameterFpuRegisters);
50
Mark Mendella4f12202015-08-06 15:23:34 -040051// These XMM registers are non-volatile in ART ABI, but volatile in native ABI.
52// If the ART ABI changes, this list must be updated. It is used to ensure that
53// these are not clobbered by any direct call to native code (such as math intrinsics).
54static constexpr FloatRegister non_volatile_xmm_regs[] = { XMM12, XMM13, XMM14, XMM15 };
55
56
Nicolas Geoffrayd75948a2015-03-27 09:53:16 +000057class InvokeRuntimeCallingConvention : public CallingConvention<Register, FloatRegister> {
58 public:
59 InvokeRuntimeCallingConvention()
60 : CallingConvention(kRuntimeParameterCoreRegisters,
61 kRuntimeParameterCoreRegistersLength,
62 kRuntimeParameterFpuRegisters,
Mathieu Chartiere401d142015-04-22 13:56:20 -070063 kRuntimeParameterFpuRegistersLength,
64 kX86_64PointerSize) {}
Nicolas Geoffrayd75948a2015-03-27 09:53:16 +000065
66 private:
67 DISALLOW_COPY_AND_ASSIGN(InvokeRuntimeCallingConvention);
68};
69
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +010070class InvokeDexCallingConvention : public CallingConvention<Register, FloatRegister> {
Nicolas Geoffray9cf35522014-06-09 18:40:10 +010071 public:
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +010072 InvokeDexCallingConvention() : CallingConvention(
73 kParameterCoreRegisters,
74 kParameterCoreRegistersLength,
75 kParameterFloatRegisters,
Mathieu Chartiere401d142015-04-22 13:56:20 -070076 kParameterFloatRegistersLength,
77 kX86_64PointerSize) {}
Nicolas Geoffray9cf35522014-06-09 18:40:10 +010078
79 private:
80 DISALLOW_COPY_AND_ASSIGN(InvokeDexCallingConvention);
81};
82
Calin Juravlee460d1d2015-09-29 04:52:17 +010083class FieldAccessCallingConventionX86_64 : public FieldAccessCallingConvention {
84 public:
85 FieldAccessCallingConventionX86_64() {}
86
87 Location GetObjectLocation() const OVERRIDE {
88 return Location::RegisterLocation(RSI);
89 }
90 Location GetFieldIndexLocation() const OVERRIDE {
91 return Location::RegisterLocation(RDI);
92 }
93 Location GetReturnLocation(Primitive::Type type ATTRIBUTE_UNUSED) const OVERRIDE {
94 return Location::RegisterLocation(RAX);
95 }
96 Location GetSetValueLocation(Primitive::Type type, bool is_instance) const OVERRIDE {
97 return Primitive::Is64BitType(type)
98 ? Location::RegisterLocation(RDX)
99 : (is_instance
100 ? Location::RegisterLocation(RDX)
101 : Location::RegisterLocation(RSI));
102 }
103 Location GetFpuLocation(Primitive::Type type ATTRIBUTE_UNUSED) const OVERRIDE {
104 return Location::FpuRegisterLocation(XMM0);
105 }
106
107 private:
108 DISALLOW_COPY_AND_ASSIGN(FieldAccessCallingConventionX86_64);
109};
110
111
Roland Levillain2d27c8e2015-04-28 15:48:45 +0100112class InvokeDexCallingConventionVisitorX86_64 : public InvokeDexCallingConventionVisitor {
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100113 public:
Roland Levillain2d27c8e2015-04-28 15:48:45 +0100114 InvokeDexCallingConventionVisitorX86_64() {}
115 virtual ~InvokeDexCallingConventionVisitorX86_64() {}
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100116
Roland Levillain2d27c8e2015-04-28 15:48:45 +0100117 Location GetNextLocation(Primitive::Type type) OVERRIDE;
Nicolas Geoffrayfd88f162015-06-03 11:23:52 +0100118 Location GetReturnLocation(Primitive::Type type) const OVERRIDE;
119 Location GetMethodLocation() const OVERRIDE;
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100120
121 private:
122 InvokeDexCallingConvention calling_convention;
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100123
Roland Levillain2d27c8e2015-04-28 15:48:45 +0100124 DISALLOW_COPY_AND_ASSIGN(InvokeDexCallingConventionVisitorX86_64);
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100125};
126
127class CodeGeneratorX86_64;
Andreas Gampe71fb52f2014-12-29 17:43:08 -0800128
Zheng Xuad4450e2015-04-17 18:48:56 +0800129class ParallelMoveResolverX86_64 : public ParallelMoveResolverWithSwap {
Nicolas Geoffrayecb2f9b2014-06-13 08:59:59 +0000130 public:
131 ParallelMoveResolverX86_64(ArenaAllocator* allocator, CodeGeneratorX86_64* codegen)
Zheng Xuad4450e2015-04-17 18:48:56 +0800132 : ParallelMoveResolverWithSwap(allocator), codegen_(codegen) {}
Nicolas Geoffrayecb2f9b2014-06-13 08:59:59 +0000133
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000134 void EmitMove(size_t index) OVERRIDE;
135 void EmitSwap(size_t index) OVERRIDE;
136 void SpillScratch(int reg) OVERRIDE;
137 void RestoreScratch(int reg) OVERRIDE;
Nicolas Geoffrayecb2f9b2014-06-13 08:59:59 +0000138
139 X86_64Assembler* GetAssembler() const;
140
141 private:
Nicolas Geoffray412f10c2014-06-19 10:00:34 +0100142 void Exchange32(CpuRegister reg, int mem);
Nicolas Geoffray102cbed2014-10-15 18:31:05 +0100143 void Exchange32(XmmRegister reg, int mem);
Nicolas Geoffray412f10c2014-06-19 10:00:34 +0100144 void Exchange32(int mem1, int mem2);
145 void Exchange64(CpuRegister reg, int mem);
Nicolas Geoffray102cbed2014-10-15 18:31:05 +0100146 void Exchange64(XmmRegister reg, int mem);
Nicolas Geoffray412f10c2014-06-19 10:00:34 +0100147 void Exchange64(int mem1, int mem2);
Nicolas Geoffrayecb2f9b2014-06-13 08:59:59 +0000148
149 CodeGeneratorX86_64* const codegen_;
150
151 DISALLOW_COPY_AND_ASSIGN(ParallelMoveResolverX86_64);
152};
153
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100154class LocationsBuilderX86_64 : public HGraphVisitor {
155 public:
156 LocationsBuilderX86_64(HGraph* graph, CodeGeneratorX86_64* codegen)
157 : HGraphVisitor(graph), codegen_(codegen) {}
158
Nicolas Geoffray360231a2014-10-08 21:07:48 +0100159#define DECLARE_VISIT_INSTRUCTION(name, super) \
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000160 void Visit##name(H##name* instr) OVERRIDE;
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100161
Alexandre Ramesef20f712015-06-09 10:29:30 +0100162 FOR_EACH_CONCRETE_INSTRUCTION_COMMON(DECLARE_VISIT_INSTRUCTION)
163 FOR_EACH_CONCRETE_INSTRUCTION_X86_64(DECLARE_VISIT_INSTRUCTION)
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100164
165#undef DECLARE_VISIT_INSTRUCTION
166
Alexandre Ramesef20f712015-06-09 10:29:30 +0100167 void VisitInstruction(HInstruction* instruction) OVERRIDE {
168 LOG(FATAL) << "Unreachable instruction " << instruction->DebugName()
169 << " (id " << instruction->GetId() << ")";
170 }
171
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100172 private:
Nicolas Geoffray9574c4b2014-11-12 13:19:37 +0000173 void HandleInvoke(HInvoke* invoke);
174 void HandleBitwiseOperation(HBinaryOperation* operation);
Vladimir Marko5f7b58e2015-11-23 19:49:34 +0000175 void HandleCondition(HCondition* condition);
Calin Juravle9aec02f2014-11-18 23:06:35 +0000176 void HandleShift(HBinaryOperation* operation);
Calin Juravle52c48962014-12-16 17:02:57 +0000177 void HandleFieldSet(HInstruction* instruction, const FieldInfo& field_info);
178 void HandleFieldGet(HInstruction* instruction);
Nicolas Geoffray9574c4b2014-11-12 13:19:37 +0000179
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100180 CodeGeneratorX86_64* const codegen_;
Roland Levillain2d27c8e2015-04-28 15:48:45 +0100181 InvokeDexCallingConventionVisitorX86_64 parameter_visitor_;
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100182
183 DISALLOW_COPY_AND_ASSIGN(LocationsBuilderX86_64);
184};
185
186class InstructionCodeGeneratorX86_64 : public HGraphVisitor {
187 public:
188 InstructionCodeGeneratorX86_64(HGraph* graph, CodeGeneratorX86_64* codegen);
189
Nicolas Geoffray360231a2014-10-08 21:07:48 +0100190#define DECLARE_VISIT_INSTRUCTION(name, super) \
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000191 void Visit##name(H##name* instr) OVERRIDE;
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100192
Alexandre Ramesef20f712015-06-09 10:29:30 +0100193 FOR_EACH_CONCRETE_INSTRUCTION_COMMON(DECLARE_VISIT_INSTRUCTION)
194 FOR_EACH_CONCRETE_INSTRUCTION_X86_64(DECLARE_VISIT_INSTRUCTION)
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100195
196#undef DECLARE_VISIT_INSTRUCTION
197
Alexandre Ramesef20f712015-06-09 10:29:30 +0100198 void VisitInstruction(HInstruction* instruction) OVERRIDE {
199 LOG(FATAL) << "Unreachable instruction " << instruction->DebugName()
200 << " (id " << instruction->GetId() << ")";
201 }
202
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100203 X86_64Assembler* GetAssembler() const { return assembler_; }
204
205 private:
Nicolas Geoffray3c049742014-09-24 18:10:46 +0100206 // Generate code for the given suspend check. If not null, `successor`
207 // is the block to branch to if the suspend check is not needed, and after
208 // the suspend call.
209 void GenerateSuspendCheck(HSuspendCheck* instruction, HBasicBlock* successor);
Andreas Gampe85b62f22015-09-09 13:15:38 -0700210 void GenerateClassInitializationCheck(SlowPathCode* slow_path, CpuRegister class_reg);
Nicolas Geoffray9574c4b2014-11-12 13:19:37 +0000211 void HandleBitwiseOperation(HBinaryOperation* operation);
Mark Mendellc4701932015-04-10 13:18:51 -0400212 void GenerateRemFP(HRem* rem);
Guillaume Sanchez0f88e872015-03-30 17:55:45 +0100213 void DivRemOneOrMinusOne(HBinaryOperation* instruction);
Guillaume Sanchezb19930c2015-04-09 21:12:15 +0100214 void DivByPowerOfTwo(HDiv* instruction);
Guillaume Sanchez0f88e872015-03-30 17:55:45 +0100215 void GenerateDivRemWithAnyConstant(HBinaryOperation* instruction);
Calin Juravlebacfec32014-11-14 15:54:36 +0000216 void GenerateDivRemIntegral(HBinaryOperation* instruction);
Vladimir Marko5f7b58e2015-11-23 19:49:34 +0000217 void HandleCondition(HCondition* condition);
Calin Juravle9aec02f2014-11-18 23:06:35 +0000218 void HandleShift(HBinaryOperation* operation);
Roland Levillain1e7f8db2015-12-15 10:54:19 +0000219
Nicolas Geoffray07276db2015-05-18 14:22:09 +0100220 void HandleFieldSet(HInstruction* instruction,
221 const FieldInfo& field_info,
222 bool value_can_be_null);
Calin Juravle52c48962014-12-16 17:02:57 +0000223 void HandleFieldGet(HInstruction* instruction, const FieldInfo& field_info);
Roland Levillain1e7f8db2015-12-15 10:54:19 +0000224
225 // Generate a heap reference load using one register `out`:
226 //
227 // out <- *(out + offset)
228 //
229 // while honoring heap poisoning and/or read barriers (if any).
230 // Register `temp` is used when generating a read barrier.
231 void GenerateReferenceLoadOneRegister(HInstruction* instruction,
232 Location out,
233 uint32_t offset,
234 Location temp);
235 // Generate a heap reference load using two different registers
236 // `out` and `obj`:
237 //
238 // out <- *(obj + offset)
239 //
240 // while honoring heap poisoning and/or read barriers (if any).
241 // Register `temp` is used when generating a Baker's read barrier.
242 void GenerateReferenceLoadTwoRegisters(HInstruction* instruction,
243 Location out,
244 Location obj,
245 uint32_t offset,
246 Location temp);
247 // Generate a GC root reference load:
248 //
249 // root <- *(obj + offset)
250 //
251 // while honoring read barriers (if any).
252 void GenerateGcRootFieldLoad(HInstruction* instruction,
253 Location root,
254 CpuRegister obj,
255 uint32_t offset);
256
Calin Juravlecd6dffe2015-01-08 17:35:35 +0000257 void GenerateImplicitNullCheck(HNullCheck* instruction);
258 void GenerateExplicitNullCheck(HNullCheck* instruction);
Mark Mendell24f2dfa2015-01-14 19:51:45 -0500259 void PushOntoFPStack(Location source, uint32_t temp_offset,
260 uint32_t stack_adjustment, bool is_float);
Mark Mendell152408f2015-12-31 12:28:50 -0500261 template<class LabelType>
Mingyao Yangd43b3ac2015-04-01 14:03:04 -0700262 void GenerateTestAndBranch(HInstruction* instruction,
David Brazdil0debae72015-11-12 18:37:00 +0000263 size_t condition_input_index,
Mark Mendell152408f2015-12-31 12:28:50 -0500264 LabelType* true_target,
265 LabelType* false_target);
266 template<class LabelType>
David Brazdil0debae72015-11-12 18:37:00 +0000267 void GenerateCompareTestAndBranch(HCondition* condition,
Mark Mendell152408f2015-12-31 12:28:50 -0500268 LabelType* true_target,
269 LabelType* false_target);
270 template<class LabelType>
271 void GenerateFPJumps(HCondition* cond, LabelType* true_label, LabelType* false_label);
272
David Brazdilfc6a86a2015-06-26 10:33:45 +0000273 void HandleGoto(HInstruction* got, HBasicBlock* successor);
Nicolas Geoffray3c049742014-09-24 18:10:46 +0100274
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100275 X86_64Assembler* const assembler_;
276 CodeGeneratorX86_64* const codegen_;
277
278 DISALLOW_COPY_AND_ASSIGN(InstructionCodeGeneratorX86_64);
279};
280
Mark Mendell9c86b482015-09-18 13:36:07 -0400281// Class for fixups to jump tables.
282class JumpTableRIPFixup;
283
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100284class CodeGeneratorX86_64 : public CodeGenerator {
285 public:
Mark Mendellfb8d2792015-03-31 22:16:59 -0400286 CodeGeneratorX86_64(HGraph* graph,
287 const X86_64InstructionSetFeatures& isa_features,
Serban Constantinescuecc43662015-08-13 13:33:12 +0100288 const CompilerOptions& compiler_options,
289 OptimizingCompilerStats* stats = nullptr);
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100290 virtual ~CodeGeneratorX86_64() {}
291
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000292 void GenerateFrameEntry() OVERRIDE;
293 void GenerateFrameExit() OVERRIDE;
294 void Bind(HBasicBlock* block) OVERRIDE;
295 void Move(HInstruction* instruction, Location location, HInstruction* move_for) OVERRIDE;
Calin Juravle175dc732015-08-25 15:42:32 +0100296 void MoveConstant(Location destination, int32_t value) OVERRIDE;
Calin Juravlee460d1d2015-09-29 04:52:17 +0100297 void MoveLocation(Location dst, Location src, Primitive::Type dst_type) OVERRIDE;
298 void AddLocationAsTemp(Location location, LocationSummary* locations) OVERRIDE;
299
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000300 size_t SaveCoreRegister(size_t stack_index, uint32_t reg_id) OVERRIDE;
301 size_t RestoreCoreRegister(size_t stack_index, uint32_t reg_id) OVERRIDE;
302 size_t SaveFloatingPointRegister(size_t stack_index, uint32_t reg_id) OVERRIDE;
303 size_t RestoreFloatingPointRegister(size_t stack_index, uint32_t reg_id) OVERRIDE;
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100304
Alexandre Rames8158f282015-08-07 10:26:17 +0100305 // Generate code to invoke a runtime entry point.
Calin Juravle175dc732015-08-25 15:42:32 +0100306 void InvokeRuntime(QuickEntrypointEnum entrypoint,
307 HInstruction* instruction,
308 uint32_t dex_pc,
309 SlowPathCode* slow_path) OVERRIDE;
310
311 void InvokeRuntime(int32_t entry_point_offset,
Alexandre Rames8158f282015-08-07 10:26:17 +0100312 HInstruction* instruction,
313 uint32_t dex_pc,
314 SlowPathCode* slow_path);
315
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000316 size_t GetWordSize() const OVERRIDE {
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100317 return kX86_64WordSize;
318 }
319
Mark Mendellf85a9ca2015-01-13 09:20:58 -0500320 size_t GetFloatingPointSpillSlotSize() const OVERRIDE {
321 return kX86_64WordSize;
322 }
323
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000324 HGraphVisitor* GetLocationBuilder() OVERRIDE {
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100325 return &location_builder_;
326 }
327
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000328 HGraphVisitor* GetInstructionVisitor() OVERRIDE {
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100329 return &instruction_visitor_;
330 }
331
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000332 X86_64Assembler* GetAssembler() OVERRIDE {
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100333 return &assembler_;
334 }
335
Alexandre Rameseb7b7392015-06-19 14:47:01 +0100336 const X86_64Assembler& GetAssembler() const OVERRIDE {
337 return assembler_;
338 }
339
Nicolas Geoffrayf0e39372014-11-12 17:50:07 +0000340 ParallelMoveResolverX86_64* GetMoveResolver() OVERRIDE {
Nicolas Geoffrayecb2f9b2014-06-13 08:59:59 +0000341 return &move_resolver_;
342 }
343
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000344 uintptr_t GetAddressOf(HBasicBlock* block) const OVERRIDE {
345 return GetLabelOf(block)->Position();
346 }
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100347
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000348 Location GetStackLocation(HLoadLocal* load) const OVERRIDE;
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100349
Nicolas Geoffray98893962015-01-21 12:32:32 +0000350 void SetupBlockedRegisters(bool is_baseline) const OVERRIDE;
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000351 Location AllocateFreeRegister(Primitive::Type type) const OVERRIDE;
352 void DumpCoreRegister(std::ostream& stream, int reg) const OVERRIDE;
353 void DumpFloatingPointRegister(std::ostream& stream, int reg) const OVERRIDE;
Mark Mendellf55c3e02015-03-26 21:07:46 -0400354 void Finalize(CodeAllocator* allocator) OVERRIDE;
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000355
356 InstructionSet GetInstructionSet() const OVERRIDE {
Nicolas Geoffray412f10c2014-06-19 10:00:34 +0100357 return InstructionSet::kX86_64;
358 }
359
Nicolas Geoffray3c7bb982014-07-23 16:04:16 +0100360 // Emit a write barrier.
Nicolas Geoffray07276db2015-05-18 14:22:09 +0100361 void MarkGCCard(CpuRegister temp,
362 CpuRegister card,
363 CpuRegister object,
364 CpuRegister value,
365 bool value_can_be_null);
Nicolas Geoffray3c7bb982014-07-23 16:04:16 +0100366
Roland Levillain1e7f8db2015-12-15 10:54:19 +0000367 void GenerateMemoryBarrier(MemBarrierKind kind);
368
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100369 // Helper method to move a value between two locations.
370 void Move(Location destination, Location source);
371
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +0100372 Label* GetLabelOf(HBasicBlock* block) const {
Vladimir Marko225b6462015-09-28 12:17:40 +0100373 return CommonGetLabelOf<Label>(block_labels_, block);
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +0100374 }
375
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000376 void Initialize() OVERRIDE {
Vladimir Marko225b6462015-09-28 12:17:40 +0100377 block_labels_ = CommonInitializeLabels<Label>();
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +0100378 }
379
Nicolas Geoffray840e5462015-01-07 16:01:24 +0000380 bool NeedsTwoRegisters(Primitive::Type type ATTRIBUTE_UNUSED) const OVERRIDE {
381 return false;
382 }
383
Vladimir Markodc151b22015-10-15 18:02:30 +0100384 // Check if the desired_dispatch_info is supported. If it is, return it,
385 // otherwise return a fall-back info that should be used instead.
386 HInvokeStaticOrDirect::DispatchInfo GetSupportedInvokeStaticOrDirectDispatch(
387 const HInvokeStaticOrDirect::DispatchInfo& desired_dispatch_info,
388 MethodReference target_method) OVERRIDE;
389
Andreas Gampe85b62f22015-09-09 13:15:38 -0700390 void GenerateStaticOrDirectCall(HInvokeStaticOrDirect* invoke, Location temp) OVERRIDE;
391 void GenerateVirtualCall(HInvokeVirtual* invoke, Location temp) OVERRIDE;
392
393 void MoveFromReturnRegister(Location trg, Primitive::Type type) OVERRIDE;
Andreas Gampe71fb52f2014-12-29 17:43:08 -0800394
Vladimir Marko58155012015-08-19 12:49:41 +0000395 void EmitLinkerPatches(ArenaVector<LinkerPatch>* linker_patches) OVERRIDE;
396
Mark Mendellfb8d2792015-03-31 22:16:59 -0400397 const X86_64InstructionSetFeatures& GetInstructionSetFeatures() const {
398 return isa_features_;
399 }
400
Roland Levillain1e7f8db2015-12-15 10:54:19 +0000401 // Fast path implementation of ReadBarrier::Barrier for a heap
402 // reference field load when Baker's read barriers are used.
403 void GenerateFieldLoadWithBakerReadBarrier(HInstruction* instruction,
404 Location out,
405 CpuRegister obj,
406 uint32_t offset,
407 Location temp,
408 bool needs_null_check);
409 // Fast path implementation of ReadBarrier::Barrier for a heap
410 // reference array load when Baker's read barriers are used.
411 void GenerateArrayLoadWithBakerReadBarrier(HInstruction* instruction,
412 Location out,
413 CpuRegister obj,
414 uint32_t data_offset,
415 Location index,
416 Location temp,
417 bool needs_null_check);
418
419 // Generate a read barrier for a heap reference within `instruction`
420 // using a slow path.
Roland Levillain0d5a2812015-11-13 10:07:31 +0000421 //
422 // A read barrier for an object reference read from the heap is
423 // implemented as a call to the artReadBarrierSlow runtime entry
424 // point, which is passed the values in locations `ref`, `obj`, and
425 // `offset`:
426 //
427 // mirror::Object* artReadBarrierSlow(mirror::Object* ref,
428 // mirror::Object* obj,
429 // uint32_t offset);
430 //
431 // The `out` location contains the value returned by
432 // artReadBarrierSlow.
433 //
434 // When `index` provided (i.e., when it is different from
435 // Location::NoLocation()), the offset value passed to
436 // artReadBarrierSlow is adjusted to take `index` into account.
Roland Levillain1e7f8db2015-12-15 10:54:19 +0000437 void GenerateReadBarrierSlow(HInstruction* instruction,
438 Location out,
439 Location ref,
440 Location obj,
441 uint32_t offset,
442 Location index = Location::NoLocation());
Roland Levillain0d5a2812015-11-13 10:07:31 +0000443
Roland Levillain1e7f8db2015-12-15 10:54:19 +0000444 // If read barriers are enabled, generate a read barrier for a heap
445 // reference using a slow path. If heap poisoning is enabled, also
446 // unpoison the reference in `out`.
447 void MaybeGenerateReadBarrierSlow(HInstruction* instruction,
448 Location out,
449 Location ref,
450 Location obj,
451 uint32_t offset,
452 Location index = Location::NoLocation());
Roland Levillain0d5a2812015-11-13 10:07:31 +0000453
Roland Levillain1e7f8db2015-12-15 10:54:19 +0000454 // Generate a read barrier for a GC root within `instruction` using
455 // a slow path.
Roland Levillain0d5a2812015-11-13 10:07:31 +0000456 //
457 // A read barrier for an object reference GC root is implemented as
458 // a call to the artReadBarrierForRootSlow runtime entry point,
459 // which is passed the value in location `root`:
460 //
461 // mirror::Object* artReadBarrierForRootSlow(GcRoot<mirror::Object>* root);
462 //
463 // The `out` location contains the value returned by
464 // artReadBarrierForRootSlow.
Roland Levillain1e7f8db2015-12-15 10:54:19 +0000465 void GenerateReadBarrierForRootSlow(HInstruction* instruction, Location out, Location root);
Roland Levillain0d5a2812015-11-13 10:07:31 +0000466
Mark Mendellf55c3e02015-03-26 21:07:46 -0400467 int ConstantAreaStart() const {
468 return constant_area_start_;
469 }
470
471 Address LiteralDoubleAddress(double v);
472 Address LiteralFloatAddress(float v);
473 Address LiteralInt32Address(int32_t v);
474 Address LiteralInt64Address(int64_t v);
475
Mark Mendell92e83bf2015-05-07 11:25:03 -0400476 // Load a 64 bit value into a register in the most efficient manner.
477 void Load64BitValue(CpuRegister dest, int64_t value);
Mark Mendell9c86b482015-09-18 13:36:07 -0400478 Address LiteralCaseTable(HPackedSwitch* switch_instr);
Mark Mendell92e83bf2015-05-07 11:25:03 -0400479
Mark Mendellcfa410b2015-05-25 16:02:44 -0400480 // Store a 64 bit value into a DoubleStackSlot in the most efficient manner.
481 void Store64BitValueToStack(Location dest, int64_t value);
482
Mark Mendellea5af682015-10-22 17:35:49 -0400483 // Assign a 64 bit constant to an address.
484 void MoveInt64ToAddress(const Address& addr_low,
485 const Address& addr_high,
486 int64_t v,
487 HInstruction* instruction);
488
Mark P Mendell17077d82015-12-16 19:15:59 +0000489 // Ensure that prior stores complete to memory before subsequent loads.
490 // The locked add implementation will avoid serializing device memory, but will
491 // touch (but not change) the top of the stack. The locked add should not be used for
492 // ordering non-temporal stores.
493 void MemoryFence(bool force_mfence = false) {
494 if (!force_mfence && isa_features_.PrefersLockedAddSynchronization()) {
495 assembler_.lock()->addl(Address(CpuRegister(RSP), 0), Immediate(0));
496 } else {
497 assembler_.mfence();
498 }
499 }
500
Nicolas Geoffray3c7bb982014-07-23 16:04:16 +0100501 private:
Roland Levillain1e7f8db2015-12-15 10:54:19 +0000502 // Factored implementation of GenerateFieldLoadWithBakerReadBarrier
503 // and GenerateArrayLoadWithBakerReadBarrier.
504 void GenerateReferenceLoadWithBakerReadBarrier(HInstruction* instruction,
505 Location ref,
506 CpuRegister obj,
507 const Address& src,
508 Location temp,
509 bool needs_null_check);
510
Vladimir Marko58155012015-08-19 12:49:41 +0000511 struct PcRelativeDexCacheAccessInfo {
512 PcRelativeDexCacheAccessInfo(const DexFile& dex_file, uint32_t element_off)
513 : target_dex_file(dex_file), element_offset(element_off), label() { }
514
515 const DexFile& target_dex_file;
516 uint32_t element_offset;
517 Label label;
518 };
519
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +0100520 // Labels for each block that will be compiled.
Vladimir Marko225b6462015-09-28 12:17:40 +0100521 Label* block_labels_; // Indexed by block id.
Nicolas Geoffray1cf95282014-12-12 19:22:03 +0000522 Label frame_entry_label_;
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100523 LocationsBuilderX86_64 location_builder_;
524 InstructionCodeGeneratorX86_64 instruction_visitor_;
Nicolas Geoffrayecb2f9b2014-06-13 08:59:59 +0000525 ParallelMoveResolverX86_64 move_resolver_;
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100526 X86_64Assembler assembler_;
Mark Mendellfb8d2792015-03-31 22:16:59 -0400527 const X86_64InstructionSetFeatures& isa_features_;
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100528
Mark Mendell39dcf552015-04-09 20:42:42 -0400529 // Offset to the start of the constant area in the assembled code.
Mark Mendellf55c3e02015-03-26 21:07:46 -0400530 // Used for fixups to the constant area.
531 int constant_area_start_;
532
Vladimir Marko58155012015-08-19 12:49:41 +0000533 // Method patch info. Using ArenaDeque<> which retains element addresses on push/emplace_back().
534 ArenaDeque<MethodPatchInfo<Label>> method_patches_;
535 ArenaDeque<MethodPatchInfo<Label>> relative_call_patches_;
536 // PC-relative DexCache access info.
Vladimir Marko0f7dca42015-11-02 14:36:43 +0000537 ArenaDeque<PcRelativeDexCacheAccessInfo> pc_relative_dex_cache_patches_;
Vladimir Marko58155012015-08-19 12:49:41 +0000538
539 // When we don't know the proper offset for the value, we use kDummy32BitOffset.
540 // We will fix this up in the linker later to have the right value.
541 static constexpr int32_t kDummy32BitOffset = 256;
542
Mark Mendell9c86b482015-09-18 13:36:07 -0400543 // Fixups for jump tables need to be handled specially.
544 ArenaVector<JumpTableRIPFixup*> fixups_to_jump_tables_;
545
Nicolas Geoffray9cf35522014-06-09 18:40:10 +0100546 DISALLOW_COPY_AND_ASSIGN(CodeGeneratorX86_64);
547};
548
549} // namespace x86_64
550} // namespace art
551
552#endif // ART_COMPILER_OPTIMIZING_CODE_GENERATOR_X86_64_H_