blob: 65108573019796953f8ba1c7d72bbd82c61ede11 [file] [log] [blame]
/*
 * Copyright (C) 2014 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
16
17#ifndef ART_COMPILER_OPTIMIZING_INLINER_H_
18#define ART_COMPILER_OPTIMIZING_INLINER_H_
19
David Sehr9e734c72018-01-04 17:56:19 -080020#include "dex/dex_file_types.h"
David Sehr8c0961f2018-01-23 16:11:38 -080021#include "dex/invoke_type.h"
Andreas Gampe8cf9cb32017-07-19 09:28:38 -070022#include "optimization.h"
David Sehr82d046e2018-04-23 08:14:19 -070023#include "profile/profile_compilation_info.h"
Nicolas Geoffraye53798a2014-12-01 10:31:54 +000024
Vladimir Marko0a516052019-10-14 13:00:44 +000025namespace art {
Nicolas Geoffraye53798a2014-12-01 10:31:54 +000026
Vladimir Markodc151b22015-10-15 18:02:30 +010027class CodeGenerator;
Nicolas Geoffraye53798a2014-12-01 10:31:54 +000028class DexCompilationUnit;
29class HGraph;
30class HInvoke;
31class OptimizingCompilerStats;
32
33class HInliner : public HOptimization {
34 public:
35 HInliner(HGraph* outer_graph,
Nicolas Geoffray73be1e82015-09-17 15:22:56 +010036 HGraph* outermost_graph,
Vladimir Markodc151b22015-10-15 18:02:30 +010037 CodeGenerator* codegen,
Nicolas Geoffraye53798a2014-12-01 10:31:54 +000038 const DexCompilationUnit& outer_compilation_unit,
Nicolas Geoffray9437b782015-03-25 10:08:51 +000039 const DexCompilationUnit& caller_compilation_unit,
Nicolas Geoffrayef87c5d2015-01-30 12:41:14 +000040 OptimizingCompilerStats* stats,
Nicolas Geoffray5949fa02015-12-18 10:57:10 +000041 size_t total_number_of_dex_registers,
Nicolas Geoffrayf6d46682017-02-28 17:41:45 +000042 size_t total_number_of_instructions,
43 HInliner* parent,
Aart Bik2ca10eb2017-11-15 15:17:53 -080044 size_t depth = 0,
45 const char* name = kInlinerPassName)
46 : HOptimization(outer_graph, name, stats),
Nicolas Geoffray73be1e82015-09-17 15:22:56 +010047 outermost_graph_(outermost_graph),
Nicolas Geoffraye53798a2014-12-01 10:31:54 +000048 outer_compilation_unit_(outer_compilation_unit),
Nicolas Geoffray9437b782015-03-25 10:08:51 +000049 caller_compilation_unit_(caller_compilation_unit),
Vladimir Markodc151b22015-10-15 18:02:30 +010050 codegen_(codegen),
Nicolas Geoffray5949fa02015-12-18 10:57:10 +000051 total_number_of_dex_registers_(total_number_of_dex_registers),
Nicolas Geoffrayf6d46682017-02-28 17:41:45 +000052 total_number_of_instructions_(total_number_of_instructions),
53 parent_(parent),
Nicolas Geoffray454a4812015-06-09 10:37:32 +010054 depth_(depth),
Nicolas Geoffrayf6d46682017-02-28 17:41:45 +000055 inlining_budget_(0),
Vladimir Marko438709f2017-02-23 18:56:13 +000056 inline_stats_(nullptr) {}
Nicolas Geoffraye53798a2014-12-01 10:31:54 +000057
Roland Levillainbbc6e7e2018-08-24 16:58:47 +010058 bool Run() override;
Nicolas Geoffraye53798a2014-12-01 10:31:54 +000059
Andreas Gampe7c3952f2015-02-19 18:21:24 -080060 static constexpr const char* kInlinerPassName = "inliner";
61
Nicolas Geoffraye53798a2014-12-01 10:31:54 +000062 private:
Calin Juravle13439f02017-02-21 01:17:21 -080063 enum InlineCacheType {
64 kInlineCacheNoData = 0,
65 kInlineCacheUninitialized = 1,
66 kInlineCacheMonomorphic = 2,
67 kInlineCachePolymorphic = 3,
68 kInlineCacheMegamorphic = 4,
69 kInlineCacheMissingTypes = 5
70 };
71
Nicolas Geoffraye418dda2015-08-11 20:03:09 -070072 bool TryInline(HInvoke* invoke_instruction);
Nicolas Geoffray73be1e82015-09-17 15:22:56 +010073
Eric Holk1868de92020-02-12 09:10:21 -080074 // Attempt to resolve the target of the invoke instruction to an acutal call
75 // target.
76 //
77 // Returns the target directly in the case of static or direct invokes.
78 // Otherwise, uses CHA devirtualization or other methods to try to find the
79 // call target.
80 ArtMethod* FindActualCallTarget(HInvoke* invoke_instruction, bool* cha_devirtualize)
81 REQUIRES_SHARED(Locks::mutator_lock_);
82
Nicolas Geoffray73be1e82015-09-17 15:22:56 +010083 // Try to inline `resolved_method` in place of `invoke_instruction`. `do_rtp` is whether
Nicolas Geoffray55bd7492016-02-16 15:37:12 +000084 // reference type propagation can run after the inlining. If the inlining is successful, this
Mingyao Yang063fc772016-08-02 11:02:54 -070085 // method will replace and remove the `invoke_instruction`. If `cha_devirtualize` is true,
86 // a CHA guard needs to be added for the inlining.
87 bool TryInlineAndReplace(HInvoke* invoke_instruction,
88 ArtMethod* resolved_method,
Nicolas Geoffray0f001b72017-01-04 16:46:23 +000089 ReferenceTypeInfo receiver_type,
Mingyao Yang063fc772016-08-02 11:02:54 -070090 bool do_rtp,
91 bool cha_devirtualize)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -070092 REQUIRES_SHARED(Locks::mutator_lock_);
Nicolas Geoffray73be1e82015-09-17 15:22:56 +010093
Nicolas Geoffray55bd7492016-02-16 15:37:12 +000094 bool TryBuildAndInline(HInvoke* invoke_instruction,
95 ArtMethod* resolved_method,
Nicolas Geoffray0f001b72017-01-04 16:46:23 +000096 ReferenceTypeInfo receiver_type,
Nicolas Geoffray55bd7492016-02-16 15:37:12 +000097 HInstruction** return_replacement)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -070098 REQUIRES_SHARED(Locks::mutator_lock_);
Nicolas Geoffray55bd7492016-02-16 15:37:12 +000099
100 bool TryBuildAndInlineHelper(HInvoke* invoke_instruction,
101 ArtMethod* resolved_method,
Nicolas Geoffray0f001b72017-01-04 16:46:23 +0000102 ReferenceTypeInfo receiver_type,
Eric Holk1868de92020-02-12 09:10:21 -0800103 HInstruction** return_replacement)
104 REQUIRES_SHARED(Locks::mutator_lock_);
105
106 // Substitutes parameters in the callee graph with their values from the caller.
107 void SubstituteArguments(HGraph* callee_graph,
108 HInvoke* invoke_instruction,
109 ReferenceTypeInfo receiver_type,
110 const DexCompilationUnit& dex_compilation_unit)
111 REQUIRES_SHARED(Locks::mutator_lock_);
Nicolas Geoffray55bd7492016-02-16 15:37:12 +0000112
Roland Levillaina3aef2e2016-04-06 17:45:58 +0100113 // Run simple optimizations on `callee_graph`.
Nicolas Geoffrayf6d46682017-02-28 17:41:45 +0000114 void RunOptimizations(HGraph* callee_graph,
Andreas Gampe3f1dcd32018-12-28 09:39:56 -0800115 const dex::CodeItem* code_item,
Nicolas Geoffrayf6d46682017-02-28 17:41:45 +0000116 const DexCompilationUnit& dex_compilation_unit)
117 REQUIRES_SHARED(Locks::mutator_lock_);
Roland Levillaina3aef2e2016-04-06 17:45:58 +0100118
Vladimir Markobe10e8e2016-01-22 12:09:44 +0000119 // Try to recognize known simple patterns and replace invoke call with appropriate instructions.
Nicolas Geoffray55bd7492016-02-16 15:37:12 +0000120 bool TryPatternSubstitution(HInvoke* invoke_instruction,
121 ArtMethod* resolved_method,
122 HInstruction** return_replacement)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700123 REQUIRES_SHARED(Locks::mutator_lock_);
Vladimir Markobe10e8e2016-01-22 12:09:44 +0000124
Eric Holk1868de92020-02-12 09:10:21 -0800125 // Returns whether inlining is allowed based on ART semantics.
126 bool IsInliningAllowed(art::ArtMethod* method, const CodeItemDataAccessor& accessor) const
127 REQUIRES_SHARED(Locks::mutator_lock_);
128
129
130 // Returns whether ART supports inlining this method.
131 //
132 // Some methods are not supported because they have features for which inlining
133 // is not implemented. For example, we do not currently support inlining throw
134 // instructions into a try block.
135 bool IsInliningSupported(const HInvoke* invoke_instruction,
136 art::ArtMethod* method,
137 const CodeItemDataAccessor& accessor) const
138 REQUIRES_SHARED(Locks::mutator_lock_);
139
140 // Returns whether the inlining budget allows inlining method.
141 //
142 // For example, this checks whether the function has grown too large and
143 // inlining should be prevented.
144 bool IsInliningBudgetAvailable(art::ArtMethod* method, const CodeItemDataAccessor& accessor) const
145 REQUIRES_SHARED(Locks::mutator_lock_);
146
147 // Inspects the body of a method (callee_graph) and returns whether it can be
148 // inlined.
149 //
150 // This checks for instructions and constructs that we do not support
151 // inlining, such as inlining a throw instruction into a try block.
152 bool CanInlineBody(const HGraph* callee_graph,
153 const HBasicBlock* target_block,
154 size_t* out_number_of_instructions) const
155 REQUIRES_SHARED(Locks::mutator_lock_);
156
Vladimir Markobe10e8e2016-01-22 12:09:44 +0000157 // Create a new HInstanceFieldGet.
Vladimir Markof44d36c2017-03-14 14:18:46 +0000158 HInstanceFieldGet* CreateInstanceFieldGet(uint32_t field_index,
159 ArtMethod* referrer,
Vladimir Markobe10e8e2016-01-22 12:09:44 +0000160 HInstruction* obj);
161 // Create a new HInstanceFieldSet.
Vladimir Markof44d36c2017-03-14 14:18:46 +0000162 HInstanceFieldSet* CreateInstanceFieldSet(uint32_t field_index,
163 ArtMethod* referrer,
Vladimir Markobe10e8e2016-01-22 12:09:44 +0000164 HInstruction* obj,
Vladimir Markof44d36c2017-03-14 14:18:46 +0000165 HInstruction* value,
166 bool* is_final = nullptr);
Vladimir Markobe10e8e2016-01-22 12:09:44 +0000167
Calin Juravle13439f02017-02-21 01:17:21 -0800168 // Try inlining the invoke instruction using inline caches.
169 bool TryInlineFromInlineCache(
170 const DexFile& caller_dex_file,
171 HInvoke* invoke_instruction,
172 ArtMethod* resolved_method)
173 REQUIRES_SHARED(Locks::mutator_lock_);
174
175 // Try getting the inline cache from JIT code cache.
176 // Return true if the inline cache was successfully allocated and the
177 // invoke info was found in the profile info.
178 InlineCacheType GetInlineCacheJIT(
179 HInvoke* invoke_instruction,
180 StackHandleScope<1>* hs,
181 /*out*/Handle<mirror::ObjectArray<mirror::Class>>* inline_cache)
182 REQUIRES_SHARED(Locks::mutator_lock_);
183
184 // Try getting the inline cache from AOT offline profile.
185 // Return true if the inline cache was successfully allocated and the
186 // invoke info was found in the profile info.
187 InlineCacheType GetInlineCacheAOT(const DexFile& caller_dex_file,
188 HInvoke* invoke_instruction,
189 StackHandleScope<1>* hs,
190 /*out*/Handle<mirror::ObjectArray<mirror::Class>>* inline_cache)
191 REQUIRES_SHARED(Locks::mutator_lock_);
192
193 // Extract the mirror classes from the offline profile and add them to the `inline_cache`.
194 // Note that even if we have profile data for the invoke the inline_cache might contain
195 // only null entries if the types cannot be resolved.
196 InlineCacheType ExtractClassesFromOfflineProfile(
197 const HInvoke* invoke_instruction,
198 const ProfileCompilationInfo::OfflineProfileMethodInfo& offline_profile,
199 /*out*/Handle<mirror::ObjectArray<mirror::Class>> inline_cache)
200 REQUIRES_SHARED(Locks::mutator_lock_);
201
202 // Compute the inline cache type.
203 InlineCacheType GetInlineCacheType(
204 const Handle<mirror::ObjectArray<mirror::Class>>& classes)
205 REQUIRES_SHARED(Locks::mutator_lock_);
206
Nicolas Geoffray73be1e82015-09-17 15:22:56 +0100207 // Try to inline the target of a monomorphic call. If successful, the code
208 // in the graph will look like:
209 // if (receiver.getClass() != ic.GetMonomorphicType()) deopt
210 // ... // inlined code
211 bool TryInlineMonomorphicCall(HInvoke* invoke_instruction,
212 ArtMethod* resolved_method,
Nicolas Geoffraye51ca8b2016-11-22 14:49:31 +0000213 Handle<mirror::ObjectArray<mirror::Class>> classes)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700214 REQUIRES_SHARED(Locks::mutator_lock_);
Nicolas Geoffray73be1e82015-09-17 15:22:56 +0100215
Nicolas Geoffray916cc1d2016-02-18 11:12:31 +0000216 // Try to inline targets of a polymorphic call.
Nicolas Geoffray73be1e82015-09-17 15:22:56 +0100217 bool TryInlinePolymorphicCall(HInvoke* invoke_instruction,
218 ArtMethod* resolved_method,
Nicolas Geoffraye51ca8b2016-11-22 14:49:31 +0000219 Handle<mirror::ObjectArray<mirror::Class>> classes)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700220 REQUIRES_SHARED(Locks::mutator_lock_);
Nicolas Geoffray73be1e82015-09-17 15:22:56 +0100221
Nicolas Geoffray916cc1d2016-02-18 11:12:31 +0000222 bool TryInlinePolymorphicCallToSameTarget(HInvoke* invoke_instruction,
223 ArtMethod* resolved_method,
Nicolas Geoffraye51ca8b2016-11-22 14:49:31 +0000224 Handle<mirror::ObjectArray<mirror::Class>> classes)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700225 REQUIRES_SHARED(Locks::mutator_lock_);
Nicolas Geoffray916cc1d2016-02-18 11:12:31 +0000226
Calin Juravleaf44e6c2017-05-23 14:24:55 -0700227 // Returns whether or not we should use only polymorphic inlining with no deoptimizations.
228 bool UseOnlyPolymorphicInliningWithNoDeopt();
229
Mingyao Yang063fc772016-08-02 11:02:54 -0700230 // Try CHA-based devirtualization to change virtual method calls into
231 // direct calls.
232 // Returns the actual method that resolved_method can be devirtualized to.
233 ArtMethod* TryCHADevirtualization(ArtMethod* resolved_method)
234 REQUIRES_SHARED(Locks::mutator_lock_);
235
236 // Add a CHA guard for a CHA-based devirtualized call. A CHA guard checks a
237 // should_deoptimize flag and if it's true, does deoptimization.
238 void AddCHAGuard(HInstruction* invoke_instruction,
239 uint32_t dex_pc,
240 HInstruction* cursor,
241 HBasicBlock* bb_cursor);
Nicolas Geoffray916cc1d2016-02-18 11:12:31 +0000242
Nicolas Geoffraya42363f2015-12-17 14:57:09 +0000243 HInstanceFieldGet* BuildGetReceiverClass(ClassLinker* class_linker,
244 HInstruction* receiver,
245 uint32_t dex_pc) const
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700246 REQUIRES_SHARED(Locks::mutator_lock_);
Nicolas Geoffraya42363f2015-12-17 14:57:09 +0000247
David Brazdil94ab38f2016-06-21 17:48:19 +0100248 void FixUpReturnReferenceType(ArtMethod* resolved_method, HInstruction* return_replacement)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700249 REQUIRES_SHARED(Locks::mutator_lock_);
David Brazdil94ab38f2016-06-21 17:48:19 +0100250
David Brazdil94ab38f2016-06-21 17:48:19 +0100251 bool ArgumentTypesMoreSpecific(HInvoke* invoke_instruction, ArtMethod* resolved_method)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700252 REQUIRES_SHARED(Locks::mutator_lock_);
David Brazdil94ab38f2016-06-21 17:48:19 +0100253
254 bool ReturnTypeMoreSpecific(HInvoke* invoke_instruction, HInstruction* return_replacement)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700255 REQUIRES_SHARED(Locks::mutator_lock_);
Vladimir Markobe10e8e2016-01-22 12:09:44 +0000256
Nicolas Geoffray916cc1d2016-02-18 11:12:31 +0000257 // Add a type guard on the given `receiver`. This will add to the graph:
258 // i0 = HFieldGet(receiver, klass)
259 // i1 = HLoadClass(class_index, is_referrer)
260 // i2 = HNotEqual(i0, i1)
261 //
262 // And if `with_deoptimization` is true:
263 // HDeoptimize(i2)
264 //
265 // The method returns the `HNotEqual`, that will be used for polymorphic inlining.
266 HInstruction* AddTypeGuard(HInstruction* receiver,
267 HInstruction* cursor,
268 HBasicBlock* bb_cursor,
Andreas Gampea5b09a62016-11-17 15:21:22 -0800269 dex::TypeIndex class_index,
Nicolas Geoffray5247c082017-01-13 14:17:29 +0000270 Handle<mirror::Class> klass,
Nicolas Geoffray916cc1d2016-02-18 11:12:31 +0000271 HInstruction* invoke_instruction,
272 bool with_deoptimization)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700273 REQUIRES_SHARED(Locks::mutator_lock_);
Nicolas Geoffray916cc1d2016-02-18 11:12:31 +0000274
275 /*
276 * Ad-hoc implementation for implementing a diamond pattern in the graph for
277 * polymorphic inlining:
278 * 1) `compare` becomes the input of the new `HIf`.
279 * 2) Everything up until `invoke_instruction` is in the then branch (could
280 * contain multiple blocks).
281 * 3) `invoke_instruction` is moved to the otherwise block.
282 * 4) If `return_replacement` is not null, the merge block will have
283 * a phi whose inputs are `return_replacement` and `invoke_instruction`.
284 *
285 * Before:
286 * Block1
287 * compare
288 * ...
289 * invoke_instruction
290 *
291 * After:
292 * Block1
293 * compare
294 * if
295 * / \
296 * / \
297 * Then block Otherwise block
298 * ... invoke_instruction
299 * \ /
300 * \ /
301 * Merge block
302 * phi(return_replacement, invoke_instruction)
303 */
304 void CreateDiamondPatternForPolymorphicInline(HInstruction* compare,
305 HInstruction* return_replacement,
306 HInstruction* invoke_instruction);
307
Nicolas Geoffrayf6d46682017-02-28 17:41:45 +0000308 // Update the inlining budget based on `total_number_of_instructions_`.
309 void UpdateInliningBudget();
310
311 // Count the number of calls of `method` being inlined recursively.
312 size_t CountRecursiveCallsOf(ArtMethod* method) const;
313
314 // Pretty-print for spaces during logging.
315 std::string DepthString(int line) const;
316
Nicolas Geoffray73be1e82015-09-17 15:22:56 +0100317 HGraph* const outermost_graph_;
Nicolas Geoffraye53798a2014-12-01 10:31:54 +0000318 const DexCompilationUnit& outer_compilation_unit_;
Nicolas Geoffray9437b782015-03-25 10:08:51 +0000319 const DexCompilationUnit& caller_compilation_unit_;
Vladimir Markodc151b22015-10-15 18:02:30 +0100320 CodeGenerator* const codegen_;
Nicolas Geoffray5949fa02015-12-18 10:57:10 +0000321 const size_t total_number_of_dex_registers_;
Nicolas Geoffrayf6d46682017-02-28 17:41:45 +0000322 size_t total_number_of_instructions_;
323
324 // The 'parent' inliner, that means the inlinigng optimization that requested
325 // `graph_` to be inlined.
326 const HInliner* const parent_;
Nicolas Geoffrayef87c5d2015-01-30 12:41:14 +0000327 const size_t depth_;
Nicolas Geoffrayf6d46682017-02-28 17:41:45 +0000328
329 // The budget left for inlining, in number of instructions.
330 size_t inlining_budget_;
Nicolas Geoffraye53798a2014-12-01 10:31:54 +0000331
Vladimir Marko438709f2017-02-23 18:56:13 +0000332 // Used to record stats about optimizations on the inlined graph.
333 // If the inlining is successful, these stats are merged to the caller graph's stats.
334 OptimizingCompilerStats* inline_stats_;
335
Nicolas Geoffraye53798a2014-12-01 10:31:54 +0000336 DISALLOW_COPY_AND_ASSIGN(HInliner);
337};
338
339} // namespace art
340
341#endif // ART_COMPILER_OPTIMIZING_INLINER_H_