blob: b174c63a577b199c5e93c71dfe0e235e1c25d4e1 [file] [log] [blame]
//===- FunctionAttrs.cpp - Pass which marks functions attributes ----------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
/// \file
/// This file implements interprocedural passes which walk the
/// call-graph deducing and/or propagating function attributes.
//
//===----------------------------------------------------------------------===//
14
Chandler Carruth9c4ed172016-02-18 11:03:11 +000015#include "llvm/Transforms/IPO/FunctionAttrs.h"
Nick Lewycky4c378a42011-12-28 23:24:21 +000016#include "llvm/ADT/SCCIterator.h"
Eugene Zelenkof27d1612017-10-19 21:21:30 +000017#include "llvm/ADT/STLExtras.h"
Benjamin Kramer15591272012-10-31 13:45:49 +000018#include "llvm/ADT/SetVector.h"
Eugene Zelenkof27d1612017-10-19 21:21:30 +000019#include "llvm/ADT/SmallPtrSet.h"
Eugene Zelenkof27d1612017-10-19 21:21:30 +000020#include "llvm/ADT/SmallVector.h"
Duncan Sands44c8cd92008-12-31 16:14:43 +000021#include "llvm/ADT/Statistic.h"
Chandler Carruthed0881b2012-12-03 16:50:05 +000022#include "llvm/Analysis/AliasAnalysis.h"
Daniel Jasperaec2fa32016-12-19 08:22:17 +000023#include "llvm/Analysis/AssumptionCache.h"
Chandler Carruth7b560d42015-09-09 17:55:00 +000024#include "llvm/Analysis/BasicAliasAnalysis.h"
Eugene Zelenkof27d1612017-10-19 21:21:30 +000025#include "llvm/Analysis/CGSCCPassManager.h"
Chandler Carruthed0881b2012-12-03 16:50:05 +000026#include "llvm/Analysis/CallGraph.h"
Chandler Carruth839a98e2013-01-07 15:26:48 +000027#include "llvm/Analysis/CallGraphSCCPass.h"
Chandler Carruthed0881b2012-12-03 16:50:05 +000028#include "llvm/Analysis/CaptureTracking.h"
Eugene Zelenkof27d1612017-10-19 21:21:30 +000029#include "llvm/Analysis/LazyCallGraph.h"
Brian Homerdingb4b21d82019-07-08 15:57:56 +000030#include "llvm/Analysis/MemoryBuiltins.h"
Eugene Zelenkof27d1612017-10-19 21:21:30 +000031#include "llvm/Analysis/MemoryLocation.h"
Philip Reamesa88caea2015-08-31 19:44:38 +000032#include "llvm/Analysis/ValueTracking.h"
Eugene Zelenkof27d1612017-10-19 21:21:30 +000033#include "llvm/IR/Argument.h"
34#include "llvm/IR/Attributes.h"
35#include "llvm/IR/BasicBlock.h"
36#include "llvm/IR/CallSite.h"
37#include "llvm/IR/Constant.h"
38#include "llvm/IR/Constants.h"
39#include "llvm/IR/Function.h"
Chandler Carruth83948572014-03-04 10:30:26 +000040#include "llvm/IR/InstIterator.h"
Eugene Zelenkof27d1612017-10-19 21:21:30 +000041#include "llvm/IR/InstrTypes.h"
42#include "llvm/IR/Instruction.h"
43#include "llvm/IR/Instructions.h"
Christian Bruel4ead99b2018-12-05 16:48:00 +000044#include "llvm/IR/IntrinsicInst.h"
Eugene Zelenkof27d1612017-10-19 21:21:30 +000045#include "llvm/IR/Metadata.h"
46#include "llvm/IR/PassManager.h"
47#include "llvm/IR/Type.h"
48#include "llvm/IR/Use.h"
49#include "llvm/IR/User.h"
50#include "llvm/IR/Value.h"
51#include "llvm/Pass.h"
52#include "llvm/Support/Casting.h"
53#include "llvm/Support/CommandLine.h"
54#include "llvm/Support/Compiler.h"
Philip Reamesa88caea2015-08-31 19:44:38 +000055#include "llvm/Support/Debug.h"
Eugene Zelenkof27d1612017-10-19 21:21:30 +000056#include "llvm/Support/ErrorHandling.h"
Hans Wennborg043bf5b2015-08-31 21:19:18 +000057#include "llvm/Support/raw_ostream.h"
Chandler Carruth6bda14b2017-06-06 11:49:48 +000058#include "llvm/Transforms/IPO.h"
Eugene Zelenkof27d1612017-10-19 21:21:30 +000059#include <cassert>
60#include <iterator>
61#include <map>
62#include <vector>
63
Duncan Sands44c8cd92008-12-31 16:14:43 +000064using namespace llvm;
65
Chandler Carruth964daaa2014-04-22 02:55:47 +000066#define DEBUG_TYPE "functionattrs"
67
Duncan Sands44c8cd92008-12-31 16:14:43 +000068STATISTIC(NumReadNone, "Number of functions marked readnone");
69STATISTIC(NumReadOnly, "Number of functions marked readonly");
Brian Homerding3ecabd72018-08-23 15:05:22 +000070STATISTIC(NumWriteOnly, "Number of functions marked writeonly");
Duncan Sands44c8cd92008-12-31 16:14:43 +000071STATISTIC(NumNoCapture, "Number of arguments marked nocapture");
David Majnemer5246e0b2016-07-19 18:50:26 +000072STATISTIC(NumReturned, "Number of arguments marked returned");
Nick Lewyckyc2ec0722013-07-06 00:29:58 +000073STATISTIC(NumReadNoneArg, "Number of arguments marked readnone");
74STATISTIC(NumReadOnlyArg, "Number of arguments marked readonly");
Nick Lewyckyfbed86a2009-03-08 06:20:47 +000075STATISTIC(NumNoAlias, "Number of function returns marked noalias");
Philip Reamesa88caea2015-08-31 19:44:38 +000076STATISTIC(NumNonNullReturn, "Number of function returns marked nonnull");
James Molloy7e9bdd52015-11-12 10:55:20 +000077STATISTIC(NumNoRecurse, "Number of functions marked as norecurse");
Fedor Sergeev6660fd02018-03-23 21:46:16 +000078STATISTIC(NumNoUnwind, "Number of functions marked as nounwind");
Brian Homerdingb4b21d82019-07-08 15:57:56 +000079STATISTIC(NumNoFree, "Number of functions marked as nofree");
Duncan Sands44c8cd92008-12-31 16:14:43 +000080
Sanjay Patel4f742162017-02-13 23:10:51 +000081static cl::opt<bool> EnableNonnullArgPropagation(
David Bolvanskyd90fd412019-09-23 09:58:02 +000082 "enable-nonnull-arg-prop", cl::init(true), cl::Hidden,
Sanjay Patel4f742162017-02-13 23:10:51 +000083 cl::desc("Try to propagate nonnull argument attributes from callsites to "
84 "caller functions."));
85
Fedor Sergeev6660fd02018-03-23 21:46:16 +000086static cl::opt<bool> DisableNoUnwindInference(
87 "disable-nounwind-inference", cl::Hidden,
88 cl::desc("Stop inferring nounwind attribute during function-attrs pass"));
89
Brian Homerdingb4b21d82019-07-08 15:57:56 +000090static cl::opt<bool> DisableNoFreeInference(
91 "disable-nofree-inference", cl::Hidden,
92 cl::desc("Stop inferring nofree attribute during function-attrs pass"));
93
Duncan Sands44c8cd92008-12-31 16:14:43 +000094namespace {
Eugene Zelenkof27d1612017-10-19 21:21:30 +000095
96using SCCNodeSet = SmallSetVector<Function *, 8>;
97
98} // end anonymous namespace
Chandler Carruthc518ebd2015-10-29 18:29:15 +000099
Peter Collingbournec45f7f32017-02-14 00:28:13 +0000100/// Returns the memory access attribute for function F using AAR for AA results,
101/// where SCCNodes is the current SCC.
102///
103/// If ThisBody is true, this function may examine the function body and will
104/// return a result pertaining to this copy of the function. If it is false, the
105/// result will be based only on AA results for the function declaration; it
106/// will be assumed that some other (perhaps less optimized) version of the
107/// function may be selected at link time.
108static MemoryAccessKind checkFunctionMemoryAccess(Function &F, bool ThisBody,
109 AAResults &AAR,
Chandler Carruthc518ebd2015-10-29 18:29:15 +0000110 const SCCNodeSet &SCCNodes) {
Chandler Carruth7542d372015-09-21 17:39:41 +0000111 FunctionModRefBehavior MRB = AAR.getModRefBehavior(&F);
112 if (MRB == FMRB_DoesNotAccessMemory)
113 // Already perfect!
114 return MAK_ReadNone;
115
Peter Collingbournec45f7f32017-02-14 00:28:13 +0000116 if (!ThisBody) {
Chandler Carruth7542d372015-09-21 17:39:41 +0000117 if (AliasAnalysis::onlyReadsMemory(MRB))
118 return MAK_ReadOnly;
119
Brian Homerding3ecabd72018-08-23 15:05:22 +0000120 if (AliasAnalysis::doesNotReadMemory(MRB))
121 return MAK_WriteOnly;
122
123 // Conservatively assume it reads and writes to memory.
Chandler Carruth7542d372015-09-21 17:39:41 +0000124 return MAK_MayWrite;
125 }
126
127 // Scan the function body for instructions that may read or write memory.
128 bool ReadsMemory = false;
Brian Homerding3ecabd72018-08-23 15:05:22 +0000129 bool WritesMemory = false;
Chandler Carruth7542d372015-09-21 17:39:41 +0000130 for (inst_iterator II = inst_begin(F), E = inst_end(F); II != E; ++II) {
131 Instruction *I = &*II;
132
133 // Some instructions can be ignored even if they read or write memory.
134 // Detect these now, skipping to the next instruction if one is found.
Chandler Carruth363ac682019-01-07 05:42:51 +0000135 if (auto *Call = dyn_cast<CallBase>(I)) {
Sanjoy Das10c8a042016-02-09 18:40:40 +0000136 // Ignore calls to functions in the same SCC, as long as the call sites
137 // don't have operand bundles. Calls with operand bundles are allowed to
138 // have memory effects not described by the memory effects of the call
139 // target.
Chandler Carruth363ac682019-01-07 05:42:51 +0000140 if (!Call->hasOperandBundles() && Call->getCalledFunction() &&
141 SCCNodes.count(Call->getCalledFunction()))
Chandler Carruth7542d372015-09-21 17:39:41 +0000142 continue;
Chandler Carruth363ac682019-01-07 05:42:51 +0000143 FunctionModRefBehavior MRB = AAR.getModRefBehavior(Call);
Alina Sbirlea63d22502017-12-05 20:12:23 +0000144 ModRefInfo MRI = createModRefInfo(MRB);
Chandler Carruth7542d372015-09-21 17:39:41 +0000145
Chandler Carruth69798fb2015-10-27 01:41:43 +0000146 // If the call doesn't access memory, we're done.
Alina Sbirlea63d22502017-12-05 20:12:23 +0000147 if (isNoModRef(MRI))
Chandler Carruth69798fb2015-10-27 01:41:43 +0000148 continue;
149
150 if (!AliasAnalysis::onlyAccessesArgPointees(MRB)) {
Brian Homerding3ecabd72018-08-23 15:05:22 +0000151 // The call could access any memory. If that includes writes, note it.
Alina Sbirlea63d22502017-12-05 20:12:23 +0000152 if (isModSet(MRI))
Brian Homerding3ecabd72018-08-23 15:05:22 +0000153 WritesMemory = true;
Chandler Carruth69798fb2015-10-27 01:41:43 +0000154 // If it reads, note it.
Alina Sbirlea63d22502017-12-05 20:12:23 +0000155 if (isRefSet(MRI))
Chandler Carruth69798fb2015-10-27 01:41:43 +0000156 ReadsMemory = true;
Chandler Carruth7542d372015-09-21 17:39:41 +0000157 continue;
158 }
Chandler Carruth69798fb2015-10-27 01:41:43 +0000159
160 // Check whether all pointer arguments point to local memory, and
161 // ignore calls that only access local memory.
Chandler Carruth363ac682019-01-07 05:42:51 +0000162 for (CallSite::arg_iterator CI = Call->arg_begin(), CE = Call->arg_end();
Chandler Carruth69798fb2015-10-27 01:41:43 +0000163 CI != CE; ++CI) {
164 Value *Arg = *CI;
Elena Demikhovsky3ec9e152015-11-17 19:30:51 +0000165 if (!Arg->getType()->isPtrOrPtrVectorTy())
Chandler Carruth69798fb2015-10-27 01:41:43 +0000166 continue;
167
168 AAMDNodes AAInfo;
169 I->getAAMetadata(AAInfo);
George Burgess IV6ef80022018-10-10 21:28:44 +0000170 MemoryLocation Loc(Arg, LocationSize::unknown(), AAInfo);
Chandler Carruth69798fb2015-10-27 01:41:43 +0000171
172 // Skip accesses to local or constant memory as they don't impact the
173 // externally visible mod/ref behavior.
174 if (AAR.pointsToConstantMemory(Loc, /*OrLocal=*/true))
175 continue;
176
Alina Sbirlea63d22502017-12-05 20:12:23 +0000177 if (isModSet(MRI))
Brian Homerding3ecabd72018-08-23 15:05:22 +0000178 // Writes non-local memory.
179 WritesMemory = true;
Alina Sbirlea63d22502017-12-05 20:12:23 +0000180 if (isRefSet(MRI))
Chandler Carruth69798fb2015-10-27 01:41:43 +0000181 // Ok, it reads non-local memory.
182 ReadsMemory = true;
183 }
Chandler Carruth7542d372015-09-21 17:39:41 +0000184 continue;
185 } else if (LoadInst *LI = dyn_cast<LoadInst>(I)) {
186 // Ignore non-volatile loads from local memory. (Atomic is okay here.)
187 if (!LI->isVolatile()) {
188 MemoryLocation Loc = MemoryLocation::get(LI);
189 if (AAR.pointsToConstantMemory(Loc, /*OrLocal=*/true))
190 continue;
191 }
192 } else if (StoreInst *SI = dyn_cast<StoreInst>(I)) {
193 // Ignore non-volatile stores to local memory. (Atomic is okay here.)
194 if (!SI->isVolatile()) {
195 MemoryLocation Loc = MemoryLocation::get(SI);
196 if (AAR.pointsToConstantMemory(Loc, /*OrLocal=*/true))
197 continue;
198 }
199 } else if (VAArgInst *VI = dyn_cast<VAArgInst>(I)) {
200 // Ignore vaargs on local memory.
201 MemoryLocation Loc = MemoryLocation::get(VI);
202 if (AAR.pointsToConstantMemory(Loc, /*OrLocal=*/true))
203 continue;
204 }
205
206 // Any remaining instructions need to be taken seriously! Check if they
207 // read or write memory.
Brian Homerding3ecabd72018-08-23 15:05:22 +0000208 //
209 // Writes memory, remember that.
210 WritesMemory |= I->mayWriteToMemory();
Chandler Carruth7542d372015-09-21 17:39:41 +0000211
212 // If this instruction may read memory, remember that.
213 ReadsMemory |= I->mayReadFromMemory();
214 }
215
Brian Homerding3ecabd72018-08-23 15:05:22 +0000216 if (WritesMemory) {
217 if (!ReadsMemory)
218 return MAK_WriteOnly;
219 else
220 return MAK_MayWrite;
221 }
222
Chandler Carruth7542d372015-09-21 17:39:41 +0000223 return ReadsMemory ? MAK_ReadOnly : MAK_ReadNone;
224}
225
Peter Collingbournec45f7f32017-02-14 00:28:13 +0000226MemoryAccessKind llvm::computeFunctionBodyMemoryAccess(Function &F,
227 AAResults &AAR) {
228 return checkFunctionMemoryAccess(F, /*ThisBody=*/true, AAR, {});
229}
230
Chandler Carrutha632fb92015-09-13 06:57:25 +0000231/// Deduce readonly/readnone attributes for the SCC.
Chandler Carrutha8125352015-10-30 16:48:08 +0000232template <typename AARGetterT>
Peter Collingbournecea1e4e2017-02-09 23:11:52 +0000233static bool addReadAttrs(const SCCNodeSet &SCCNodes, AARGetterT &&AARGetter) {
Duncan Sands44c8cd92008-12-31 16:14:43 +0000234 // Check if any of the functions in the SCC read or write memory. If they
235 // write memory then they can't be marked readnone or readonly.
236 bool ReadsMemory = false;
Brian Homerding3ecabd72018-08-23 15:05:22 +0000237 bool WritesMemory = false;
Chandler Carruthc518ebd2015-10-29 18:29:15 +0000238 for (Function *F : SCCNodes) {
Chandler Carrutha8125352015-10-30 16:48:08 +0000239 // Call the callable parameter to look up AA results for this function.
240 AAResults &AAR = AARGetter(*F);
Chandler Carruth7b560d42015-09-09 17:55:00 +0000241
Peter Collingbournec45f7f32017-02-14 00:28:13 +0000242 // Non-exact function definitions may not be selected at link time, and an
243 // alternative version that writes to memory may be selected. See the
244 // comment on GlobalValue::isDefinitionExact for more details.
245 switch (checkFunctionMemoryAccess(*F, F->hasExactDefinition(),
246 AAR, SCCNodes)) {
Chandler Carruth7542d372015-09-21 17:39:41 +0000247 case MAK_MayWrite:
248 return false;
249 case MAK_ReadOnly:
Duncan Sands44c8cd92008-12-31 16:14:43 +0000250 ReadsMemory = true;
Chandler Carruth7542d372015-09-21 17:39:41 +0000251 break;
Brian Homerding3ecabd72018-08-23 15:05:22 +0000252 case MAK_WriteOnly:
253 WritesMemory = true;
254 break;
Chandler Carruth7542d372015-09-21 17:39:41 +0000255 case MAK_ReadNone:
256 // Nothing to do!
257 break;
Duncan Sands44c8cd92008-12-31 16:14:43 +0000258 }
259 }
260
Johannes Doerfert3dcd7992019-07-15 17:31:26 +0000261 // If the SCC contains both functions that read and functions that write, then
262 // we cannot add readonly attributes.
263 if (ReadsMemory && WritesMemory)
264 return false;
265
Duncan Sands44c8cd92008-12-31 16:14:43 +0000266 // Success! Functions in this SCC do not access memory, or only read memory.
267 // Give them the appropriate attribute.
268 bool MadeChange = false;
Brian Homerding3ecabd72018-08-23 15:05:22 +0000269
Chandler Carruthc518ebd2015-10-29 18:29:15 +0000270 for (Function *F : SCCNodes) {
Duncan Sands44c8cd92008-12-31 16:14:43 +0000271 if (F->doesNotAccessMemory())
272 // Already perfect!
273 continue;
274
275 if (F->onlyReadsMemory() && ReadsMemory)
276 // No change.
277 continue;
278
Brian Homerding3ecabd72018-08-23 15:05:22 +0000279 if (F->doesNotReadMemory() && WritesMemory)
280 continue;
281
Duncan Sands44c8cd92008-12-31 16:14:43 +0000282 MadeChange = true;
283
284 // Clear out any existing attributes.
Reid Kleckner9d16fa02017-04-19 17:28:52 +0000285 F->removeFnAttr(Attribute::ReadOnly);
286 F->removeFnAttr(Attribute::ReadNone);
Brian Homerding3ecabd72018-08-23 15:05:22 +0000287 F->removeFnAttr(Attribute::WriteOnly);
Duncan Sands44c8cd92008-12-31 16:14:43 +0000288
Johannes Doerfertae3cfeb2018-09-11 11:51:29 +0000289 if (!WritesMemory && !ReadsMemory) {
290 // Clear out any "access range attributes" if readnone was deduced.
291 F->removeFnAttr(Attribute::ArgMemOnly);
292 F->removeFnAttr(Attribute::InaccessibleMemOnly);
293 F->removeFnAttr(Attribute::InaccessibleMemOrArgMemOnly);
294 }
295
Duncan Sands44c8cd92008-12-31 16:14:43 +0000296 // Add in the new attribute.
Brian Homerding3ecabd72018-08-23 15:05:22 +0000297 if (WritesMemory && !ReadsMemory)
298 F->addFnAttr(Attribute::WriteOnly);
299 else
300 F->addFnAttr(ReadsMemory ? Attribute::ReadOnly : Attribute::ReadNone);
Duncan Sands44c8cd92008-12-31 16:14:43 +0000301
Brian Homerding3ecabd72018-08-23 15:05:22 +0000302 if (WritesMemory && !ReadsMemory)
303 ++NumWriteOnly;
304 else if (ReadsMemory)
Duncan Sandscefc8602009-01-02 11:46:24 +0000305 ++NumReadOnly;
Duncan Sands44c8cd92008-12-31 16:14:43 +0000306 else
Duncan Sandscefc8602009-01-02 11:46:24 +0000307 ++NumReadNone;
Duncan Sands44c8cd92008-12-31 16:14:43 +0000308 }
309
310 return MadeChange;
311}
312
Nick Lewycky4c378a42011-12-28 23:24:21 +0000313namespace {
Eugene Zelenkof27d1612017-10-19 21:21:30 +0000314
Chandler Carrutha632fb92015-09-13 06:57:25 +0000315/// For a given pointer Argument, this retains a list of Arguments of functions
316/// in the same SCC that the pointer data flows into. We use this to build an
317/// SCC of the arguments.
Chandler Carruth63559d72015-09-13 06:47:20 +0000318struct ArgumentGraphNode {
319 Argument *Definition;
320 SmallVector<ArgumentGraphNode *, 4> Uses;
321};
Nick Lewycky4c378a42011-12-28 23:24:21 +0000322
Chandler Carruth63559d72015-09-13 06:47:20 +0000323class ArgumentGraph {
324 // We store pointers to ArgumentGraphNode objects, so it's important that
325 // that they not move around upon insert.
Eugene Zelenkof27d1612017-10-19 21:21:30 +0000326 using ArgumentMapTy = std::map<Argument *, ArgumentGraphNode>;
Nick Lewycky4c378a42011-12-28 23:24:21 +0000327
Chandler Carruth63559d72015-09-13 06:47:20 +0000328 ArgumentMapTy ArgumentMap;
Nick Lewycky4c378a42011-12-28 23:24:21 +0000329
Chandler Carruth63559d72015-09-13 06:47:20 +0000330 // There is no root node for the argument graph, in fact:
331 // void f(int *x, int *y) { if (...) f(x, y); }
332 // is an example where the graph is disconnected. The SCCIterator requires a
333 // single entry point, so we maintain a fake ("synthetic") root node that
334 // uses every node. Because the graph is directed and nothing points into
335 // the root, it will not participate in any SCCs (except for its own).
336 ArgumentGraphNode SyntheticRoot;
Nick Lewycky4c378a42011-12-28 23:24:21 +0000337
Chandler Carruth63559d72015-09-13 06:47:20 +0000338public:
339 ArgumentGraph() { SyntheticRoot.Definition = nullptr; }
Nick Lewycky4c378a42011-12-28 23:24:21 +0000340
Eugene Zelenkof27d1612017-10-19 21:21:30 +0000341 using iterator = SmallVectorImpl<ArgumentGraphNode *>::iterator;
Nick Lewycky4c378a42011-12-28 23:24:21 +0000342
Chandler Carruth63559d72015-09-13 06:47:20 +0000343 iterator begin() { return SyntheticRoot.Uses.begin(); }
344 iterator end() { return SyntheticRoot.Uses.end(); }
345 ArgumentGraphNode *getEntryNode() { return &SyntheticRoot; }
Nick Lewycky4c378a42011-12-28 23:24:21 +0000346
Chandler Carruth63559d72015-09-13 06:47:20 +0000347 ArgumentGraphNode *operator[](Argument *A) {
348 ArgumentGraphNode &Node = ArgumentMap[A];
349 Node.Definition = A;
350 SyntheticRoot.Uses.push_back(&Node);
351 return &Node;
352 }
353};
Nick Lewycky4c378a42011-12-28 23:24:21 +0000354
Chandler Carrutha632fb92015-09-13 06:57:25 +0000355/// This tracker checks whether callees are in the SCC, and if so it does not
356/// consider that a capture, instead adding it to the "Uses" list and
357/// continuing with the analysis.
Chandler Carruth63559d72015-09-13 06:47:20 +0000358struct ArgumentUsesTracker : public CaptureTracker {
Eugene Zelenkof27d1612017-10-19 21:21:30 +0000359 ArgumentUsesTracker(const SCCNodeSet &SCCNodes) : SCCNodes(SCCNodes) {}
Nick Lewycky4c378a42011-12-28 23:24:21 +0000360
Chandler Carruth63559d72015-09-13 06:47:20 +0000361 void tooManyUses() override { Captured = true; }
Nick Lewycky4c378a42011-12-28 23:24:21 +0000362
Chandler Carruth63559d72015-09-13 06:47:20 +0000363 bool captured(const Use *U) override {
364 CallSite CS(U->getUser());
365 if (!CS.getInstruction()) {
366 Captured = true;
367 return true;
Nick Lewycky4c378a42011-12-28 23:24:21 +0000368 }
369
Chandler Carruth63559d72015-09-13 06:47:20 +0000370 Function *F = CS.getCalledFunction();
Sanjoy Das5ce32722016-04-08 00:48:30 +0000371 if (!F || !F->hasExactDefinition() || !SCCNodes.count(F)) {
Chandler Carruth63559d72015-09-13 06:47:20 +0000372 Captured = true;
373 return true;
374 }
Nick Lewycky4c378a42011-12-28 23:24:21 +0000375
Sanjoy Das98bfe262015-11-05 03:04:40 +0000376 // Note: the callee and the two successor blocks *follow* the argument
377 // operands. This means there is no need to adjust UseIndex to account for
378 // these.
379
380 unsigned UseIndex =
381 std::distance(const_cast<const Use *>(CS.arg_begin()), U);
382
Sanjoy Das71fe81f2015-11-07 01:56:00 +0000383 assert(UseIndex < CS.data_operands_size() &&
384 "Indirect function calls should have been filtered above!");
385
386 if (UseIndex >= CS.getNumArgOperands()) {
387 // Data operand, but not a argument operand -- must be a bundle operand
388 assert(CS.hasOperandBundles() && "Must be!");
389
390 // CaptureTracking told us that we're being captured by an operand bundle
391 // use. In this case it does not matter if the callee is within our SCC
392 // or not -- we've been captured in some unknown way, and we have to be
393 // conservative.
394 Captured = true;
395 return true;
396 }
397
Sanjoy Das98bfe262015-11-05 03:04:40 +0000398 if (UseIndex >= F->arg_size()) {
399 assert(F->isVarArg() && "More params than args in non-varargs call");
400 Captured = true;
401 return true;
Chandler Carruth63559d72015-09-13 06:47:20 +0000402 }
Sanjoy Das98bfe262015-11-05 03:04:40 +0000403
Duncan P. N. Exon Smith83c4b682015-11-07 00:01:16 +0000404 Uses.push_back(&*std::next(F->arg_begin(), UseIndex));
Chandler Carruth63559d72015-09-13 06:47:20 +0000405 return false;
406 }
407
Eugene Zelenkof27d1612017-10-19 21:21:30 +0000408 // True only if certainly captured (used outside our SCC).
409 bool Captured = false;
410
411 // Uses within our SCC.
412 SmallVector<Argument *, 4> Uses;
Chandler Carruth63559d72015-09-13 06:47:20 +0000413
Chandler Carruthc518ebd2015-10-29 18:29:15 +0000414 const SCCNodeSet &SCCNodes;
Chandler Carruth63559d72015-09-13 06:47:20 +0000415};
Eugene Zelenkof27d1612017-10-19 21:21:30 +0000416
417} // end anonymous namespace
Nick Lewycky4c378a42011-12-28 23:24:21 +0000418
419namespace llvm {
Eugene Zelenkof27d1612017-10-19 21:21:30 +0000420
Chandler Carruth63559d72015-09-13 06:47:20 +0000421template <> struct GraphTraits<ArgumentGraphNode *> {
Eugene Zelenkof27d1612017-10-19 21:21:30 +0000422 using NodeRef = ArgumentGraphNode *;
423 using ChildIteratorType = SmallVectorImpl<ArgumentGraphNode *>::iterator;
Nick Lewycky4c378a42011-12-28 23:24:21 +0000424
Tim Shen48f814e2016-08-31 16:48:13 +0000425 static NodeRef getEntryNode(NodeRef A) { return A; }
426 static ChildIteratorType child_begin(NodeRef N) { return N->Uses.begin(); }
427 static ChildIteratorType child_end(NodeRef N) { return N->Uses.end(); }
Chandler Carruth63559d72015-09-13 06:47:20 +0000428};
Eugene Zelenkof27d1612017-10-19 21:21:30 +0000429
Chandler Carruth63559d72015-09-13 06:47:20 +0000430template <>
431struct GraphTraits<ArgumentGraph *> : public GraphTraits<ArgumentGraphNode *> {
Tim Shenf2187ed2016-08-22 21:09:30 +0000432 static NodeRef getEntryNode(ArgumentGraph *AG) { return AG->getEntryNode(); }
Eugene Zelenkof27d1612017-10-19 21:21:30 +0000433
Chandler Carruth63559d72015-09-13 06:47:20 +0000434 static ChildIteratorType nodes_begin(ArgumentGraph *AG) {
435 return AG->begin();
436 }
Eugene Zelenkof27d1612017-10-19 21:21:30 +0000437
Chandler Carruth63559d72015-09-13 06:47:20 +0000438 static ChildIteratorType nodes_end(ArgumentGraph *AG) { return AG->end(); }
439};
Eugene Zelenkof27d1612017-10-19 21:21:30 +0000440
441} // end namespace llvm
Nick Lewycky4c378a42011-12-28 23:24:21 +0000442
Chandler Carrutha632fb92015-09-13 06:57:25 +0000443/// Returns Attribute::None, Attribute::ReadOnly or Attribute::ReadNone.
Nick Lewyckyc2ec0722013-07-06 00:29:58 +0000444static Attribute::AttrKind
445determinePointerReadAttrs(Argument *A,
Chandler Carruth63559d72015-09-13 06:47:20 +0000446 const SmallPtrSet<Argument *, 8> &SCCNodes) {
Chandler Carruth63559d72015-09-13 06:47:20 +0000447 SmallVector<Use *, 32> Worklist;
Florian Hahna1cc8482018-06-12 11:16:56 +0000448 SmallPtrSet<Use *, 32> Visited;
Nick Lewyckyc2ec0722013-07-06 00:29:58 +0000449
Reid Kleckner26af2ca2014-01-28 02:38:36 +0000450 // inalloca arguments are always clobbered by the call.
451 if (A->hasInAllocaAttr())
452 return Attribute::None;
453
Nick Lewyckyc2ec0722013-07-06 00:29:58 +0000454 bool IsRead = false;
455 // We don't need to track IsWritten. If A is written to, return immediately.
456
Chandler Carruthcdf47882014-03-09 03:16:01 +0000457 for (Use &U : A->uses()) {
Chandler Carruthcdf47882014-03-09 03:16:01 +0000458 Visited.insert(&U);
459 Worklist.push_back(&U);
Nick Lewyckyc2ec0722013-07-06 00:29:58 +0000460 }
461
462 while (!Worklist.empty()) {
463 Use *U = Worklist.pop_back_val();
464 Instruction *I = cast<Instruction>(U->getUser());
Nick Lewyckyc2ec0722013-07-06 00:29:58 +0000465
466 switch (I->getOpcode()) {
467 case Instruction::BitCast:
468 case Instruction::GetElementPtr:
469 case Instruction::PHI:
470 case Instruction::Select:
Matt Arsenaulte55a2c22014-01-14 19:11:52 +0000471 case Instruction::AddrSpaceCast:
Nick Lewyckyc2ec0722013-07-06 00:29:58 +0000472 // The original value is not read/written via this if the new value isn't.
Chandler Carruthcdf47882014-03-09 03:16:01 +0000473 for (Use &UU : I->uses())
David Blaikie70573dc2014-11-19 07:49:26 +0000474 if (Visited.insert(&UU).second)
Chandler Carruthcdf47882014-03-09 03:16:01 +0000475 Worklist.push_back(&UU);
Nick Lewyckyc2ec0722013-07-06 00:29:58 +0000476 break;
477
478 case Instruction::Call:
479 case Instruction::Invoke: {
Nick Lewycky59633cb2014-05-30 02:31:27 +0000480 bool Captures = true;
481
482 if (I->getType()->isVoidTy())
483 Captures = false;
484
485 auto AddUsersToWorklistIfCapturing = [&] {
486 if (Captures)
487 for (Use &UU : I->uses())
David Blaikie70573dc2014-11-19 07:49:26 +0000488 if (Visited.insert(&UU).second)
Nick Lewycky59633cb2014-05-30 02:31:27 +0000489 Worklist.push_back(&UU);
490 };
491
Nick Lewyckyc2ec0722013-07-06 00:29:58 +0000492 CallSite CS(I);
Nick Lewycky59633cb2014-05-30 02:31:27 +0000493 if (CS.doesNotAccessMemory()) {
494 AddUsersToWorklistIfCapturing();
Nick Lewyckyc2ec0722013-07-06 00:29:58 +0000495 continue;
Nick Lewycky59633cb2014-05-30 02:31:27 +0000496 }
Nick Lewyckyc2ec0722013-07-06 00:29:58 +0000497
498 Function *F = CS.getCalledFunction();
499 if (!F) {
500 if (CS.onlyReadsMemory()) {
501 IsRead = true;
Nick Lewycky59633cb2014-05-30 02:31:27 +0000502 AddUsersToWorklistIfCapturing();
Nick Lewyckyc2ec0722013-07-06 00:29:58 +0000503 continue;
504 }
505 return Attribute::None;
506 }
507
Sanjoy Das436e2392015-11-07 01:55:53 +0000508 // Note: the callee and the two successor blocks *follow* the argument
509 // operands. This means there is no need to adjust UseIndex to account
510 // for these.
511
512 unsigned UseIndex = std::distance(CS.arg_begin(), U);
513
Sanjoy Dasea1df7f2015-11-07 01:56:07 +0000514 // U cannot be the callee operand use: since we're exploring the
515 // transitive uses of an Argument, having such a use be a callee would
516 // imply the CallSite is an indirect call or invoke; and we'd take the
517 // early exit above.
518 assert(UseIndex < CS.data_operands_size() &&
519 "Data operand use expected!");
Sanjoy Das71fe81f2015-11-07 01:56:00 +0000520
521 bool IsOperandBundleUse = UseIndex >= CS.getNumArgOperands();
522
523 if (UseIndex >= F->arg_size() && !IsOperandBundleUse) {
Sanjoy Das436e2392015-11-07 01:55:53 +0000524 assert(F->isVarArg() && "More params than args in non-varargs call");
525 return Attribute::None;
Nick Lewyckyc2ec0722013-07-06 00:29:58 +0000526 }
Sanjoy Das436e2392015-11-07 01:55:53 +0000527
Tilmann Scheller925b1932015-11-20 19:17:10 +0000528 Captures &= !CS.doesNotCapture(UseIndex);
529
Sanjoy Das71fe81f2015-11-07 01:56:00 +0000530 // Since the optimizer (by design) cannot see the data flow corresponding
531 // to a operand bundle use, these cannot participate in the optimistic SCC
532 // analysis. Instead, we model the operand bundle uses as arguments in
533 // call to a function external to the SCC.
Duncan P. N. Exon Smith9e3edad2016-08-17 01:23:58 +0000534 if (IsOperandBundleUse ||
535 !SCCNodes.count(&*std::next(F->arg_begin(), UseIndex))) {
Sanjoy Das71fe81f2015-11-07 01:56:00 +0000536
537 // The accessors used on CallSite here do the right thing for calls and
538 // invokes with operand bundles.
539
Sanjoy Das436e2392015-11-07 01:55:53 +0000540 if (!CS.onlyReadsMemory() && !CS.onlyReadsMemory(UseIndex))
541 return Attribute::None;
542 if (!CS.doesNotAccessMemory(UseIndex))
543 IsRead = true;
544 }
545
Nick Lewycky59633cb2014-05-30 02:31:27 +0000546 AddUsersToWorklistIfCapturing();
Nick Lewyckyc2ec0722013-07-06 00:29:58 +0000547 break;
548 }
549
550 case Instruction::Load:
David Majnemer124bdb72016-05-25 05:53:04 +0000551 // A volatile load has side effects beyond what readonly can be relied
552 // upon.
553 if (cast<LoadInst>(I)->isVolatile())
554 return Attribute::None;
555
Nick Lewyckyc2ec0722013-07-06 00:29:58 +0000556 IsRead = true;
557 break;
558
559 case Instruction::ICmp:
560 case Instruction::Ret:
561 break;
562
563 default:
564 return Attribute::None;
565 }
566 }
567
568 return IsRead ? Attribute::ReadOnly : Attribute::ReadNone;
569}
570
David Majnemer5246e0b2016-07-19 18:50:26 +0000571/// Deduce returned attributes for the SCC.
572static bool addArgumentReturnedAttrs(const SCCNodeSet &SCCNodes) {
573 bool Changed = false;
574
David Majnemer5246e0b2016-07-19 18:50:26 +0000575 // Check each function in turn, determining if an argument is always returned.
576 for (Function *F : SCCNodes) {
577 // We can infer and propagate function attributes only when we know that the
578 // definition we'll get at link time is *exactly* the definition we see now.
579 // For more details, see GlobalValue::mayBeDerefined.
580 if (!F->hasExactDefinition())
581 continue;
582
583 if (F->getReturnType()->isVoidTy())
584 continue;
585
David Majnemerc83044d2016-09-12 16:04:59 +0000586 // There is nothing to do if an argument is already marked as 'returned'.
Eugene Zelenkof27d1612017-10-19 21:21:30 +0000587 if (llvm::any_of(F->args(),
588 [](const Argument &Arg) { return Arg.hasReturnedAttr(); }))
David Majnemerc83044d2016-09-12 16:04:59 +0000589 continue;
590
David Majnemer5246e0b2016-07-19 18:50:26 +0000591 auto FindRetArg = [&]() -> Value * {
592 Value *RetArg = nullptr;
593 for (BasicBlock &BB : *F)
594 if (auto *Ret = dyn_cast<ReturnInst>(BB.getTerminator())) {
595 // Note that stripPointerCasts should look through functions with
596 // returned arguments.
597 Value *RetVal = Ret->getReturnValue()->stripPointerCasts();
598 if (!isa<Argument>(RetVal) || RetVal->getType() != F->getReturnType())
599 return nullptr;
600
601 if (!RetArg)
602 RetArg = RetVal;
603 else if (RetArg != RetVal)
604 return nullptr;
605 }
606
607 return RetArg;
608 };
609
610 if (Value *RetArg = FindRetArg()) {
611 auto *A = cast<Argument>(RetArg);
Reid Kleckner9d16fa02017-04-19 17:28:52 +0000612 A->addAttr(Attribute::Returned);
David Majnemer5246e0b2016-07-19 18:50:26 +0000613 ++NumReturned;
614 Changed = true;
615 }
616 }
617
618 return Changed;
619}
620
Sanjay Patel4f742162017-02-13 23:10:51 +0000621/// If a callsite has arguments that are also arguments to the parent function,
622/// try to propagate attributes from the callsite's arguments to the parent's
623/// arguments. This may be important because inlining can cause information loss
624/// when attribute knowledge disappears with the inlined call.
625static bool addArgumentAttrsFromCallsites(Function &F) {
626 if (!EnableNonnullArgPropagation)
627 return false;
628
629 bool Changed = false;
630
631 // For an argument attribute to transfer from a callsite to the parent, the
632 // call must be guaranteed to execute every time the parent is called.
633 // Conservatively, just check for calls in the entry block that are guaranteed
634 // to execute.
635 // TODO: This could be enhanced by testing if the callsite post-dominates the
636 // entry block or by doing simple forward walks or backward walks to the
637 // callsite.
638 BasicBlock &Entry = F.getEntryBlock();
639 for (Instruction &I : Entry) {
640 if (auto CS = CallSite(&I)) {
641 if (auto *CalledFunc = CS.getCalledFunction()) {
642 for (auto &CSArg : CalledFunc->args()) {
643 if (!CSArg.hasNonNullAttr())
644 continue;
645
646 // If the non-null callsite argument operand is an argument to 'F'
647 // (the caller) and the call is guaranteed to execute, then the value
648 // must be non-null throughout 'F'.
649 auto *FArg = dyn_cast<Argument>(CS.getArgOperand(CSArg.getArgNo()));
650 if (FArg && !FArg->hasNonNullAttr()) {
651 FArg->addAttr(Attribute::NonNull);
652 Changed = true;
653 }
654 }
655 }
656 }
657 if (!isGuaranteedToTransferExecutionToSuccessor(&I))
658 break;
659 }
Fangrui Songf78650a2018-07-30 19:41:25 +0000660
Sanjay Patel4f742162017-02-13 23:10:51 +0000661 return Changed;
662}
663
Whitney Tsang1ccba7c2019-09-11 14:26:22 +0000664static bool addReadAttr(Argument *A, Attribute::AttrKind R) {
665 assert((R == Attribute::ReadOnly || R == Attribute::ReadNone)
666 && "Must be a Read attribute.");
667 assert(A && "Argument must not be null.");
668
669 // If the argument already has the attribute, nothing needs to be done.
670 if (A->hasAttribute(R))
671 return false;
672
673 // Otherwise, remove potentially conflicting attribute, add the new one,
674 // and update statistics.
675 A->removeAttr(Attribute::WriteOnly);
676 A->removeAttr(Attribute::ReadOnly);
677 A->removeAttr(Attribute::ReadNone);
678 A->addAttr(R);
679 R == Attribute::ReadOnly ? ++NumReadOnlyArg : ++NumReadNoneArg;
680 return true;
681}
682
Chandler Carrutha632fb92015-09-13 06:57:25 +0000683/// Deduce nocapture attributes for the SCC.
Chandler Carruthc518ebd2015-10-29 18:29:15 +0000684static bool addArgumentAttrs(const SCCNodeSet &SCCNodes) {
Duncan Sands44c8cd92008-12-31 16:14:43 +0000685 bool Changed = false;
686
Nick Lewycky4c378a42011-12-28 23:24:21 +0000687 ArgumentGraph AG;
688
Duncan Sands44c8cd92008-12-31 16:14:43 +0000689 // Check each function in turn, determining which pointer arguments are not
690 // captured.
Chandler Carruthc518ebd2015-10-29 18:29:15 +0000691 for (Function *F : SCCNodes) {
Sanjoy Das5ce32722016-04-08 00:48:30 +0000692 // We can infer and propagate function attributes only when we know that the
693 // definition we'll get at link time is *exactly* the definition we see now.
694 // For more details, see GlobalValue::mayBeDerefined.
695 if (!F->hasExactDefinition())
Duncan Sands44c8cd92008-12-31 16:14:43 +0000696 continue;
697
Sanjay Patel4f742162017-02-13 23:10:51 +0000698 Changed |= addArgumentAttrsFromCallsites(*F);
699
Nick Lewycky4c378a42011-12-28 23:24:21 +0000700 // Functions that are readonly (or readnone) and nounwind and don't return
701 // a value can't capture arguments. Don't analyze them.
702 if (F->onlyReadsMemory() && F->doesNotThrow() &&
703 F->getReturnType()->isVoidTy()) {
Chandler Carruth63559d72015-09-13 06:47:20 +0000704 for (Function::arg_iterator A = F->arg_begin(), E = F->arg_end(); A != E;
705 ++A) {
Benjamin Kramer40d7f352013-06-22 16:56:32 +0000706 if (A->getType()->isPointerTy() && !A->hasNoCaptureAttr()) {
Reid Kleckner9d16fa02017-04-19 17:28:52 +0000707 A->addAttr(Attribute::NoCapture);
Benjamin Kramer40d7f352013-06-22 16:56:32 +0000708 ++NumNoCapture;
709 Changed = true;
Nick Lewycky4c378a42011-12-28 23:24:21 +0000710 }
Nick Lewycky4c378a42011-12-28 23:24:21 +0000711 }
Benjamin Kramer40d7f352013-06-22 16:56:32 +0000712 continue;
Benjamin Kramer76b7bd02013-06-22 15:51:19 +0000713 }
714
Chandler Carruth63559d72015-09-13 06:47:20 +0000715 for (Function::arg_iterator A = F->arg_begin(), E = F->arg_end(); A != E;
716 ++A) {
717 if (!A->getType()->isPointerTy())
718 continue;
Nick Lewyckyc2ec0722013-07-06 00:29:58 +0000719 bool HasNonLocalUses = false;
720 if (!A->hasNoCaptureAttr()) {
Benjamin Kramer40d7f352013-06-22 16:56:32 +0000721 ArgumentUsesTracker Tracker(SCCNodes);
Duncan P. N. Exon Smith17323402015-10-13 17:51:03 +0000722 PointerMayBeCaptured(&*A, &Tracker);
Benjamin Kramer40d7f352013-06-22 16:56:32 +0000723 if (!Tracker.Captured) {
724 if (Tracker.Uses.empty()) {
725 // If it's trivially not captured, mark it nocapture now.
Reid Kleckner9d16fa02017-04-19 17:28:52 +0000726 A->addAttr(Attribute::NoCapture);
Benjamin Kramer40d7f352013-06-22 16:56:32 +0000727 ++NumNoCapture;
728 Changed = true;
729 } else {
730 // If it's not trivially captured and not trivially not captured,
731 // then it must be calling into another function in our SCC. Save
732 // its particulars for Argument-SCC analysis later.
Duncan P. N. Exon Smith17323402015-10-13 17:51:03 +0000733 ArgumentGraphNode *Node = AG[&*A];
Benjamin Kramer135f7352016-06-26 12:28:59 +0000734 for (Argument *Use : Tracker.Uses) {
735 Node->Uses.push_back(AG[Use]);
736 if (Use != &*A)
Nick Lewyckyc2ec0722013-07-06 00:29:58 +0000737 HasNonLocalUses = true;
738 }
Benjamin Kramer40d7f352013-06-22 16:56:32 +0000739 }
740 }
741 // Otherwise, it's captured. Don't bother doing SCC analysis on it.
742 }
Nick Lewyckyc2ec0722013-07-06 00:29:58 +0000743 if (!HasNonLocalUses && !A->onlyReadsMemory()) {
744 // Can we determine that it's readonly/readnone without doing an SCC?
745 // Note that we don't allow any calls at all here, or else our result
746 // will be dependent on the iteration order through the functions in the
747 // SCC.
Chandler Carruth63559d72015-09-13 06:47:20 +0000748 SmallPtrSet<Argument *, 8> Self;
Duncan P. N. Exon Smith17323402015-10-13 17:51:03 +0000749 Self.insert(&*A);
750 Attribute::AttrKind R = determinePointerReadAttrs(&*A, Self);
Whitney Tsang1ccba7c2019-09-11 14:26:22 +0000751 if (R != Attribute::None)
752 Changed = addReadAttr(A, R);
Nick Lewyckyc2ec0722013-07-06 00:29:58 +0000753 }
754 }
Nick Lewycky4c378a42011-12-28 23:24:21 +0000755 }
756
757 // The graph we've collected is partial because we stopped scanning for
758 // argument uses once we solved the argument trivially. These partial nodes
759 // show up as ArgumentGraphNode objects with an empty Uses list, and for
760 // these nodes the final decision about whether they capture has already been
761 // made. If the definition doesn't have a 'nocapture' attribute by now, it
762 // captures.
763
Chandler Carruth63559d72015-09-13 06:47:20 +0000764 for (scc_iterator<ArgumentGraph *> I = scc_begin(&AG); !I.isAtEnd(); ++I) {
Duncan P. N. Exon Smithd2b2fac2014-04-25 18:24:50 +0000765 const std::vector<ArgumentGraphNode *> &ArgumentSCC = *I;
Nick Lewycky4c378a42011-12-28 23:24:21 +0000766 if (ArgumentSCC.size() == 1) {
Chandler Carruth63559d72015-09-13 06:47:20 +0000767 if (!ArgumentSCC[0]->Definition)
768 continue; // synthetic root node
Nick Lewycky4c378a42011-12-28 23:24:21 +0000769
770 // eg. "void f(int* x) { if (...) f(x); }"
771 if (ArgumentSCC[0]->Uses.size() == 1 &&
772 ArgumentSCC[0]->Uses[0] == ArgumentSCC[0]) {
Nick Lewyckyc2ec0722013-07-06 00:29:58 +0000773 Argument *A = ArgumentSCC[0]->Definition;
Reid Kleckner9d16fa02017-04-19 17:28:52 +0000774 A->addAttr(Attribute::NoCapture);
Nick Lewycky7e820552009-01-02 03:46:56 +0000775 ++NumNoCapture;
Duncan Sands44c8cd92008-12-31 16:14:43 +0000776 Changed = true;
777 }
Nick Lewycky4c378a42011-12-28 23:24:21 +0000778 continue;
779 }
780
781 bool SCCCaptured = false;
Duncan P. N. Exon Smithd2b2fac2014-04-25 18:24:50 +0000782 for (auto I = ArgumentSCC.begin(), E = ArgumentSCC.end();
783 I != E && !SCCCaptured; ++I) {
Nick Lewycky4c378a42011-12-28 23:24:21 +0000784 ArgumentGraphNode *Node = *I;
785 if (Node->Uses.empty()) {
786 if (!Node->Definition->hasNoCaptureAttr())
787 SCCCaptured = true;
788 }
789 }
Chandler Carruth63559d72015-09-13 06:47:20 +0000790 if (SCCCaptured)
791 continue;
Nick Lewycky4c378a42011-12-28 23:24:21 +0000792
Chandler Carruth63559d72015-09-13 06:47:20 +0000793 SmallPtrSet<Argument *, 8> ArgumentSCCNodes;
Nick Lewycky4c378a42011-12-28 23:24:21 +0000794 // Fill ArgumentSCCNodes with the elements of the ArgumentSCC. Used for
795 // quickly looking up whether a given Argument is in this ArgumentSCC.
Benjamin Kramer135f7352016-06-26 12:28:59 +0000796 for (ArgumentGraphNode *I : ArgumentSCC) {
797 ArgumentSCCNodes.insert(I->Definition);
Nick Lewycky4c378a42011-12-28 23:24:21 +0000798 }
799
Duncan P. N. Exon Smithd2b2fac2014-04-25 18:24:50 +0000800 for (auto I = ArgumentSCC.begin(), E = ArgumentSCC.end();
801 I != E && !SCCCaptured; ++I) {
Nick Lewycky4c378a42011-12-28 23:24:21 +0000802 ArgumentGraphNode *N = *I;
Benjamin Kramer135f7352016-06-26 12:28:59 +0000803 for (ArgumentGraphNode *Use : N->Uses) {
804 Argument *A = Use->Definition;
Nick Lewycky4c378a42011-12-28 23:24:21 +0000805 if (A->hasNoCaptureAttr() || ArgumentSCCNodes.count(A))
806 continue;
807 SCCCaptured = true;
808 break;
809 }
810 }
Chandler Carruth63559d72015-09-13 06:47:20 +0000811 if (SCCCaptured)
812 continue;
Nick Lewycky4c378a42011-12-28 23:24:21 +0000813
Nick Lewyckyf740db32012-01-05 22:21:45 +0000814 for (unsigned i = 0, e = ArgumentSCC.size(); i != e; ++i) {
Nick Lewycky4c378a42011-12-28 23:24:21 +0000815 Argument *A = ArgumentSCC[i]->Definition;
Reid Kleckner9d16fa02017-04-19 17:28:52 +0000816 A->addAttr(Attribute::NoCapture);
Nick Lewycky4c378a42011-12-28 23:24:21 +0000817 ++NumNoCapture;
818 Changed = true;
819 }
Nick Lewyckyc2ec0722013-07-06 00:29:58 +0000820
821 // We also want to compute readonly/readnone. With a small number of false
822 // negatives, we can assume that any pointer which is captured isn't going
823 // to be provably readonly or readnone, since by definition we can't
824 // analyze all uses of a captured pointer.
825 //
826 // The false negatives happen when the pointer is captured by a function
827 // that promises readonly/readnone behaviour on the pointer, then the
828 // pointer's lifetime ends before anything that writes to arbitrary memory.
829 // Also, a readonly/readnone pointer may be returned, but returning a
830 // pointer is capturing it.
831
832 Attribute::AttrKind ReadAttr = Attribute::ReadNone;
833 for (unsigned i = 0, e = ArgumentSCC.size(); i != e; ++i) {
834 Argument *A = ArgumentSCC[i]->Definition;
835 Attribute::AttrKind K = determinePointerReadAttrs(A, ArgumentSCCNodes);
836 if (K == Attribute::ReadNone)
837 continue;
838 if (K == Attribute::ReadOnly) {
839 ReadAttr = Attribute::ReadOnly;
840 continue;
841 }
842 ReadAttr = K;
843 break;
844 }
845
846 if (ReadAttr != Attribute::None) {
Nick Lewyckyc2ec0722013-07-06 00:29:58 +0000847 for (unsigned i = 0, e = ArgumentSCC.size(); i != e; ++i) {
848 Argument *A = ArgumentSCC[i]->Definition;
Whitney Tsang1ccba7c2019-09-11 14:26:22 +0000849 Changed = addReadAttr(A, ReadAttr);
Nick Lewyckyc2ec0722013-07-06 00:29:58 +0000850 }
851 }
Duncan Sands44c8cd92008-12-31 16:14:43 +0000852 }
853
854 return Changed;
855}
856
Chandler Carrutha632fb92015-09-13 06:57:25 +0000857/// Tests whether a function is "malloc-like".
858///
859/// A function is "malloc-like" if it returns either null or a pointer that
860/// doesn't alias any other pointer visible to the caller.
Chandler Carruthc518ebd2015-10-29 18:29:15 +0000861static bool isFunctionMallocLike(Function *F, const SCCNodeSet &SCCNodes) {
Benjamin Kramer15591272012-10-31 13:45:49 +0000862 SmallSetVector<Value *, 8> FlowsToReturn;
Benjamin Kramer135f7352016-06-26 12:28:59 +0000863 for (BasicBlock &BB : *F)
864 if (ReturnInst *Ret = dyn_cast<ReturnInst>(BB.getTerminator()))
Nick Lewyckyfbed86a2009-03-08 06:20:47 +0000865 FlowsToReturn.insert(Ret->getReturnValue());
866
867 for (unsigned i = 0; i != FlowsToReturn.size(); ++i) {
Benjamin Kramer15591272012-10-31 13:45:49 +0000868 Value *RetVal = FlowsToReturn[i];
Nick Lewyckyfbed86a2009-03-08 06:20:47 +0000869
870 if (Constant *C = dyn_cast<Constant>(RetVal)) {
871 if (!C->isNullValue() && !isa<UndefValue>(C))
872 return false;
873
874 continue;
875 }
876
877 if (isa<Argument>(RetVal))
878 return false;
879
880 if (Instruction *RVI = dyn_cast<Instruction>(RetVal))
881 switch (RVI->getOpcode()) {
Chandler Carruth63559d72015-09-13 06:47:20 +0000882 // Extend the analysis by looking upwards.
883 case Instruction::BitCast:
884 case Instruction::GetElementPtr:
885 case Instruction::AddrSpaceCast:
886 FlowsToReturn.insert(RVI->getOperand(0));
887 continue;
888 case Instruction::Select: {
889 SelectInst *SI = cast<SelectInst>(RVI);
890 FlowsToReturn.insert(SI->getTrueValue());
891 FlowsToReturn.insert(SI->getFalseValue());
892 continue;
893 }
894 case Instruction::PHI: {
895 PHINode *PN = cast<PHINode>(RVI);
896 for (Value *IncValue : PN->incoming_values())
897 FlowsToReturn.insert(IncValue);
898 continue;
899 }
Nick Lewyckyfbed86a2009-03-08 06:20:47 +0000900
Chandler Carruth63559d72015-09-13 06:47:20 +0000901 // Check whether the pointer came from an allocation.
902 case Instruction::Alloca:
903 break;
904 case Instruction::Call:
905 case Instruction::Invoke: {
906 CallSite CS(RVI);
Reid Klecknerfb502d22017-04-14 20:19:02 +0000907 if (CS.hasRetAttr(Attribute::NoAlias))
Nick Lewyckyfbed86a2009-03-08 06:20:47 +0000908 break;
Chandler Carruth63559d72015-09-13 06:47:20 +0000909 if (CS.getCalledFunction() && SCCNodes.count(CS.getCalledFunction()))
910 break;
Justin Bognercd1d5aa2016-08-17 20:30:52 +0000911 LLVM_FALLTHROUGH;
912 }
Chandler Carruth63559d72015-09-13 06:47:20 +0000913 default:
914 return false; // Did not come from an allocation.
Nick Lewyckyfbed86a2009-03-08 06:20:47 +0000915 }
916
Dan Gohman94e61762009-11-19 21:57:48 +0000917 if (PointerMayBeCaptured(RetVal, false, /*StoreCaptures=*/false))
Nick Lewyckyfbed86a2009-03-08 06:20:47 +0000918 return false;
919 }
920
921 return true;
922}
923
Chandler Carrutha632fb92015-09-13 06:57:25 +0000924/// Deduce noalias attributes for the SCC.
Chandler Carruthc518ebd2015-10-29 18:29:15 +0000925static bool addNoAliasAttrs(const SCCNodeSet &SCCNodes) {
Nick Lewycky9ec96d12009-03-08 17:08:09 +0000926 // Check each function in turn, determining which functions return noalias
927 // pointers.
Chandler Carruthc518ebd2015-10-29 18:29:15 +0000928 for (Function *F : SCCNodes) {
Nick Lewyckyfbed86a2009-03-08 06:20:47 +0000929 // Already noalias.
Reid Klecknera0b45f42017-05-03 18:17:31 +0000930 if (F->returnDoesNotAlias())
Nick Lewyckyfbed86a2009-03-08 06:20:47 +0000931 continue;
932
Sanjoy Das5ce32722016-04-08 00:48:30 +0000933 // We can infer and propagate function attributes only when we know that the
934 // definition we'll get at link time is *exactly* the definition we see now.
935 // For more details, see GlobalValue::mayBeDerefined.
936 if (!F->hasExactDefinition())
Nick Lewyckyfbed86a2009-03-08 06:20:47 +0000937 return false;
938
Chandler Carruth63559d72015-09-13 06:47:20 +0000939 // We annotate noalias return values, which are only applicable to
Nick Lewyckyfbed86a2009-03-08 06:20:47 +0000940 // pointer types.
Duncan Sands19d0b472010-02-16 11:11:14 +0000941 if (!F->getReturnType()->isPointerTy())
Nick Lewyckyfbed86a2009-03-08 06:20:47 +0000942 continue;
943
Chandler Carruth3824f852015-09-13 08:23:27 +0000944 if (!isFunctionMallocLike(F, SCCNodes))
Nick Lewyckyfbed86a2009-03-08 06:20:47 +0000945 return false;
946 }
947
948 bool MadeChange = false;
Chandler Carruthc518ebd2015-10-29 18:29:15 +0000949 for (Function *F : SCCNodes) {
Reid Klecknera0b45f42017-05-03 18:17:31 +0000950 if (F->returnDoesNotAlias() ||
Reid Kleckner6652a522017-04-28 18:37:16 +0000951 !F->getReturnType()->isPointerTy())
Nick Lewyckyfbed86a2009-03-08 06:20:47 +0000952 continue;
953
Reid Klecknera0b45f42017-05-03 18:17:31 +0000954 F->setReturnDoesNotAlias();
Nick Lewyckyfbed86a2009-03-08 06:20:47 +0000955 ++NumNoAlias;
956 MadeChange = true;
957 }
958
959 return MadeChange;
960}
961
Chandler Carrutha632fb92015-09-13 06:57:25 +0000962/// Tests whether this function is known to not return null.
Chandler Carruth8874b782015-09-13 08:17:14 +0000963///
964/// Requires that the function returns a pointer.
965///
966/// Returns true if it believes the function will not return a null, and sets
967/// \p Speculative based on whether the returned conclusion is a speculative
968/// conclusion due to SCC calls.
Chandler Carruthc518ebd2015-10-29 18:29:15 +0000969static bool isReturnNonNull(Function *F, const SCCNodeSet &SCCNodes,
Sean Silva45835e72016-07-02 23:47:27 +0000970 bool &Speculative) {
Philip Reamesa88caea2015-08-31 19:44:38 +0000971 assert(F->getReturnType()->isPointerTy() &&
972 "nonnull only meaningful on pointer types");
973 Speculative = false;
Chandler Carruth63559d72015-09-13 06:47:20 +0000974
Philip Reamesa88caea2015-08-31 19:44:38 +0000975 SmallSetVector<Value *, 8> FlowsToReturn;
976 for (BasicBlock &BB : *F)
977 if (auto *Ret = dyn_cast<ReturnInst>(BB.getTerminator()))
978 FlowsToReturn.insert(Ret->getReturnValue());
979
Nuno Lopes404f1062017-09-09 18:23:11 +0000980 auto &DL = F->getParent()->getDataLayout();
981
Philip Reamesa88caea2015-08-31 19:44:38 +0000982 for (unsigned i = 0; i != FlowsToReturn.size(); ++i) {
983 Value *RetVal = FlowsToReturn[i];
984
985 // If this value is locally known to be non-null, we're good
Nuno Lopes404f1062017-09-09 18:23:11 +0000986 if (isKnownNonZero(RetVal, DL))
Philip Reamesa88caea2015-08-31 19:44:38 +0000987 continue;
988
989 // Otherwise, we need to look upwards since we can't make any local
Chandler Carruth63559d72015-09-13 06:47:20 +0000990 // conclusions.
Philip Reamesa88caea2015-08-31 19:44:38 +0000991 Instruction *RVI = dyn_cast<Instruction>(RetVal);
992 if (!RVI)
993 return false;
994 switch (RVI->getOpcode()) {
Chandler Carruth63559d72015-09-13 06:47:20 +0000995 // Extend the analysis by looking upwards.
Philip Reamesa88caea2015-08-31 19:44:38 +0000996 case Instruction::BitCast:
997 case Instruction::GetElementPtr:
998 case Instruction::AddrSpaceCast:
999 FlowsToReturn.insert(RVI->getOperand(0));
1000 continue;
1001 case Instruction::Select: {
1002 SelectInst *SI = cast<SelectInst>(RVI);
1003 FlowsToReturn.insert(SI->getTrueValue());
1004 FlowsToReturn.insert(SI->getFalseValue());
1005 continue;
1006 }
1007 case Instruction::PHI: {
1008 PHINode *PN = cast<PHINode>(RVI);
1009 for (int i = 0, e = PN->getNumIncomingValues(); i != e; ++i)
1010 FlowsToReturn.insert(PN->getIncomingValue(i));
1011 continue;
1012 }
1013 case Instruction::Call:
1014 case Instruction::Invoke: {
1015 CallSite CS(RVI);
1016 Function *Callee = CS.getCalledFunction();
1017 // A call to a node within the SCC is assumed to return null until
1018 // proven otherwise
1019 if (Callee && SCCNodes.count(Callee)) {
1020 Speculative = true;
1021 continue;
1022 }
1023 return false;
1024 }
1025 default:
Chandler Carruth63559d72015-09-13 06:47:20 +00001026 return false; // Unknown source, may be null
Philip Reamesa88caea2015-08-31 19:44:38 +00001027 };
1028 llvm_unreachable("should have either continued or returned");
1029 }
1030
1031 return true;
1032}
1033
Chandler Carrutha632fb92015-09-13 06:57:25 +00001034/// Deduce nonnull attributes for the SCC.
Sean Silva45835e72016-07-02 23:47:27 +00001035static bool addNonNullAttrs(const SCCNodeSet &SCCNodes) {
Philip Reamesa88caea2015-08-31 19:44:38 +00001036 // Speculative that all functions in the SCC return only nonnull
1037 // pointers. We may refute this as we analyze functions.
1038 bool SCCReturnsNonNull = true;
1039
1040 bool MadeChange = false;
1041
1042 // Check each function in turn, determining which functions return nonnull
1043 // pointers.
Chandler Carruthc518ebd2015-10-29 18:29:15 +00001044 for (Function *F : SCCNodes) {
Philip Reamesa88caea2015-08-31 19:44:38 +00001045 // Already nonnull.
Reid Klecknerb5180542017-03-21 16:57:19 +00001046 if (F->getAttributes().hasAttribute(AttributeList::ReturnIndex,
Philip Reamesa88caea2015-08-31 19:44:38 +00001047 Attribute::NonNull))
1048 continue;
1049
Sanjoy Das5ce32722016-04-08 00:48:30 +00001050 // We can infer and propagate function attributes only when we know that the
1051 // definition we'll get at link time is *exactly* the definition we see now.
1052 // For more details, see GlobalValue::mayBeDerefined.
1053 if (!F->hasExactDefinition())
Philip Reamesa88caea2015-08-31 19:44:38 +00001054 return false;
1055
Chandler Carruth63559d72015-09-13 06:47:20 +00001056 // We annotate nonnull return values, which are only applicable to
Philip Reamesa88caea2015-08-31 19:44:38 +00001057 // pointer types.
1058 if (!F->getReturnType()->isPointerTy())
1059 continue;
1060
1061 bool Speculative = false;
Sean Silva45835e72016-07-02 23:47:27 +00001062 if (isReturnNonNull(F, SCCNodes, Speculative)) {
Philip Reamesa88caea2015-08-31 19:44:38 +00001063 if (!Speculative) {
1064 // Mark the function eagerly since we may discover a function
1065 // which prevents us from speculating about the entire SCC
Nicola Zaghend34e60c2018-05-14 12:53:11 +00001066 LLVM_DEBUG(dbgs() << "Eagerly marking " << F->getName()
1067 << " as nonnull\n");
Reid Klecknerb5180542017-03-21 16:57:19 +00001068 F->addAttribute(AttributeList::ReturnIndex, Attribute::NonNull);
Philip Reamesa88caea2015-08-31 19:44:38 +00001069 ++NumNonNullReturn;
1070 MadeChange = true;
1071 }
1072 continue;
1073 }
1074 // At least one function returns something which could be null, can't
1075 // speculate any more.
1076 SCCReturnsNonNull = false;
1077 }
1078
1079 if (SCCReturnsNonNull) {
Chandler Carruthc518ebd2015-10-29 18:29:15 +00001080 for (Function *F : SCCNodes) {
Reid Klecknerb5180542017-03-21 16:57:19 +00001081 if (F->getAttributes().hasAttribute(AttributeList::ReturnIndex,
Philip Reamesa88caea2015-08-31 19:44:38 +00001082 Attribute::NonNull) ||
1083 !F->getReturnType()->isPointerTy())
1084 continue;
1085
Nicola Zaghend34e60c2018-05-14 12:53:11 +00001086 LLVM_DEBUG(dbgs() << "SCC marking " << F->getName() << " as nonnull\n");
Reid Klecknerb5180542017-03-21 16:57:19 +00001087 F->addAttribute(AttributeList::ReturnIndex, Attribute::NonNull);
Philip Reamesa88caea2015-08-31 19:44:38 +00001088 ++NumNonNullReturn;
1089 MadeChange = true;
1090 }
1091 }
1092
1093 return MadeChange;
1094}
1095
Fedor Sergeev6660fd02018-03-23 21:46:16 +00001096namespace {
1097
1098/// Collects a set of attribute inference requests and performs them all in one
1099/// go on a single SCC Node. Inference involves scanning function bodies
1100/// looking for instructions that violate attribute assumptions.
1101/// As soon as all the bodies are fine we are free to set the attribute.
1102/// Customization of inference for individual attributes is performed by
1103/// providing a handful of predicates for each attribute.
1104class AttributeInferer {
1105public:
1106 /// Describes a request for inference of a single attribute.
1107 struct InferenceDescriptor {
1108
1109 /// Returns true if this function does not have to be handled.
1110 /// General intent for this predicate is to provide an optimization
1111 /// for functions that do not need this attribute inference at all
1112 /// (say, for functions that already have the attribute).
1113 std::function<bool(const Function &)> SkipFunction;
1114
1115 /// Returns true if this instruction violates attribute assumptions.
1116 std::function<bool(Instruction &)> InstrBreaksAttribute;
1117
1118 /// Sets the inferred attribute for this function.
1119 std::function<void(Function &)> SetAttribute;
1120
1121 /// Attribute we derive.
1122 Attribute::AttrKind AKind;
1123
1124 /// If true, only "exact" definitions can be used to infer this attribute.
1125 /// See GlobalValue::isDefinitionExact.
1126 bool RequiresExactDefinition;
1127
1128 InferenceDescriptor(Attribute::AttrKind AK,
1129 std::function<bool(const Function &)> SkipFunc,
1130 std::function<bool(Instruction &)> InstrScan,
1131 std::function<void(Function &)> SetAttr,
1132 bool ReqExactDef)
1133 : SkipFunction(SkipFunc), InstrBreaksAttribute(InstrScan),
1134 SetAttribute(SetAttr), AKind(AK),
1135 RequiresExactDefinition(ReqExactDef) {}
1136 };
1137
1138private:
1139 SmallVector<InferenceDescriptor, 4> InferenceDescriptors;
1140
1141public:
1142 void registerAttrInference(InferenceDescriptor AttrInference) {
1143 InferenceDescriptors.push_back(AttrInference);
1144 }
1145
1146 bool run(const SCCNodeSet &SCCNodes);
1147};
1148
1149/// Perform all the requested attribute inference actions according to the
1150/// attribute predicates stored before.
1151bool AttributeInferer::run(const SCCNodeSet &SCCNodes) {
1152 SmallVector<InferenceDescriptor, 4> InferInSCC = InferenceDescriptors;
1153 // Go through all the functions in SCC and check corresponding attribute
1154 // assumptions for each of them. Attributes that are invalid for this SCC
1155 // will be removed from InferInSCC.
Chandler Carruth3937bc72016-02-12 09:47:49 +00001156 for (Function *F : SCCNodes) {
Justin Lebar9d943972016-03-14 20:18:54 +00001157
Fedor Sergeev6660fd02018-03-23 21:46:16 +00001158 // No attributes whose assumptions are still valid - done.
1159 if (InferInSCC.empty())
1160 return false;
Justin Lebar9d943972016-03-14 20:18:54 +00001161
Fedor Sergeev6660fd02018-03-23 21:46:16 +00001162 // Check if our attributes ever need scanning/can be scanned.
1163 llvm::erase_if(InferInSCC, [F](const InferenceDescriptor &ID) {
1164 if (ID.SkipFunction(*F))
Justin Lebar9d943972016-03-14 20:18:54 +00001165 return false;
Fedor Sergeev6660fd02018-03-23 21:46:16 +00001166
1167 // Remove from further inference (invalidate) when visiting a function
1168 // that has no instructions to scan/has an unsuitable definition.
1169 return F->isDeclaration() ||
1170 (ID.RequiresExactDefinition && !F->hasExactDefinition());
1171 });
1172
1173 // For each attribute still in InferInSCC that doesn't explicitly skip F,
1174 // set up the F instructions scan to verify assumptions of the attribute.
1175 SmallVector<InferenceDescriptor, 4> InferInThisFunc;
1176 llvm::copy_if(
1177 InferInSCC, std::back_inserter(InferInThisFunc),
1178 [F](const InferenceDescriptor &ID) { return !ID.SkipFunction(*F); });
1179
1180 if (InferInThisFunc.empty())
1181 continue;
1182
1183 // Start instruction scan.
1184 for (Instruction &I : instructions(*F)) {
1185 llvm::erase_if(InferInThisFunc, [&](const InferenceDescriptor &ID) {
1186 if (!ID.InstrBreaksAttribute(I))
1187 return false;
1188 // Remove attribute from further inference on any other functions
1189 // because attribute assumptions have just been violated.
1190 llvm::erase_if(InferInSCC, [&ID](const InferenceDescriptor &D) {
1191 return D.AKind == ID.AKind;
1192 });
1193 // Remove attribute from the rest of current instruction scan.
1194 return true;
1195 });
1196
1197 if (InferInThisFunc.empty())
1198 break;
Justin Lebar9d943972016-03-14 20:18:54 +00001199 }
1200 }
1201
Fedor Sergeev6660fd02018-03-23 21:46:16 +00001202 if (InferInSCC.empty())
1203 return false;
Justin Lebar9d943972016-03-14 20:18:54 +00001204
Fedor Sergeev6660fd02018-03-23 21:46:16 +00001205 bool Changed = false;
1206 for (Function *F : SCCNodes)
1207 // At this point InferInSCC contains only functions that were either:
1208 // - explicitly skipped from scan/inference, or
1209 // - verified to have no instructions that break attribute assumptions.
1210 // Hence we just go and force the attribute for all non-skipped functions.
1211 for (auto &ID : InferInSCC) {
1212 if (ID.SkipFunction(*F))
1213 continue;
1214 Changed = true;
1215 ID.SetAttribute(*F);
1216 }
1217 return Changed;
1218}
Justin Lebar9d943972016-03-14 20:18:54 +00001219
Fedor Sergeev6660fd02018-03-23 21:46:16 +00001220} // end anonymous namespace
1221
1222/// Helper for non-Convergent inference predicate InstrBreaksAttribute.
1223static bool InstrBreaksNonConvergent(Instruction &I,
1224 const SCCNodeSet &SCCNodes) {
1225 const CallSite CS(&I);
1226 // Breaks non-convergent assumption if CS is a convergent call to a function
1227 // not in the SCC.
1228 return CS && CS.isConvergent() && SCCNodes.count(CS.getCalledFunction()) == 0;
1229}
1230
1231/// Helper for NoUnwind inference predicate InstrBreaksAttribute.
1232static bool InstrBreaksNonThrowing(Instruction &I, const SCCNodeSet &SCCNodes) {
1233 if (!I.mayThrow())
1234 return false;
1235 if (const auto *CI = dyn_cast<CallInst>(&I)) {
1236 if (Function *Callee = CI->getCalledFunction()) {
1237 // I is a may-throw call to a function inside our SCC. This doesn't
1238 // invalidate our current working assumption that the SCC is no-throw; we
1239 // just have to scan that other function.
1240 if (SCCNodes.count(Callee) > 0)
1241 return false;
1242 }
Chandler Carruth3937bc72016-02-12 09:47:49 +00001243 }
Justin Lebar260854b2016-02-09 23:03:22 +00001244 return true;
1245}
1246
Brian Homerdingb4b21d82019-07-08 15:57:56 +00001247/// Helper for NoFree inference predicate InstrBreaksAttribute.
1248static bool InstrBreaksNoFree(Instruction &I, const SCCNodeSet &SCCNodes) {
1249 CallSite CS(&I);
1250 if (!CS)
1251 return false;
1252
1253 Function *Callee = CS.getCalledFunction();
1254 if (!Callee)
1255 return true;
1256
1257 if (Callee->doesNotFreeMemory())
1258 return false;
1259
1260 if (SCCNodes.count(Callee) > 0)
1261 return false;
1262
1263 return true;
1264}
1265
Fedor Sergeev6660fd02018-03-23 21:46:16 +00001266/// Infer attributes from all functions in the SCC by scanning every
1267/// instruction for compliance to the attribute assumptions. Currently it
1268/// does:
1269/// - removal of Convergent attribute
1270/// - addition of NoUnwind attribute
1271///
1272/// Returns true if any changes to function attributes were made.
1273static bool inferAttrsFromFunctionBodies(const SCCNodeSet &SCCNodes) {
1274
1275 AttributeInferer AI;
1276
1277 // Request to remove the convergent attribute from all functions in the SCC
1278 // if every callsite within the SCC is not convergent (except for calls
1279 // to functions within the SCC).
1280 // Note: Removal of the attr from the callsites will happen in
1281 // InstCombineCalls separately.
1282 AI.registerAttrInference(AttributeInferer::InferenceDescriptor{
1283 Attribute::Convergent,
1284 // Skip non-convergent functions.
1285 [](const Function &F) { return !F.isConvergent(); },
1286 // Instructions that break non-convergent assumption.
1287 [SCCNodes](Instruction &I) {
1288 return InstrBreaksNonConvergent(I, SCCNodes);
1289 },
1290 [](Function &F) {
Nicola Zaghend34e60c2018-05-14 12:53:11 +00001291 LLVM_DEBUG(dbgs() << "Removing convergent attr from fn " << F.getName()
1292 << "\n");
Fedor Sergeev6660fd02018-03-23 21:46:16 +00001293 F.setNotConvergent();
1294 },
1295 /* RequiresExactDefinition= */ false});
1296
1297 if (!DisableNoUnwindInference)
1298 // Request to infer nounwind attribute for all the functions in the SCC if
1299 // every callsite within the SCC is not throwing (except for calls to
1300 // functions within the SCC). Note that nounwind attribute suffers from
1301 // derefinement - results may change depending on how functions are
1302 // optimized. Thus it can be inferred only from exact definitions.
1303 AI.registerAttrInference(AttributeInferer::InferenceDescriptor{
1304 Attribute::NoUnwind,
1305 // Skip non-throwing functions.
1306 [](const Function &F) { return F.doesNotThrow(); },
1307 // Instructions that break non-throwing assumption.
1308 [SCCNodes](Instruction &I) {
1309 return InstrBreaksNonThrowing(I, SCCNodes);
1310 },
1311 [](Function &F) {
Nicola Zaghend34e60c2018-05-14 12:53:11 +00001312 LLVM_DEBUG(dbgs()
1313 << "Adding nounwind attr to fn " << F.getName() << "\n");
Fedor Sergeev6660fd02018-03-23 21:46:16 +00001314 F.setDoesNotThrow();
1315 ++NumNoUnwind;
1316 },
1317 /* RequiresExactDefinition= */ true});
1318
Brian Homerdingb4b21d82019-07-08 15:57:56 +00001319 if (!DisableNoFreeInference)
1320 // Request to infer nofree attribute for all the functions in the SCC if
1321 // every callsite within the SCC does not directly or indirectly free
1322 // memory (except for calls to functions within the SCC). Note that nofree
1323 // attribute suffers from derefinement - results may change depending on
1324 // how functions are optimized. Thus it can be inferred only from exact
1325 // definitions.
1326 AI.registerAttrInference(AttributeInferer::InferenceDescriptor{
1327 Attribute::NoFree,
1328 // Skip functions known not to free memory.
1329 [](const Function &F) { return F.doesNotFreeMemory(); },
1330 // Instructions that break non-deallocating assumption.
1331 [SCCNodes](Instruction &I) {
1332 return InstrBreaksNoFree(I, SCCNodes);
1333 },
1334 [](Function &F) {
1335 LLVM_DEBUG(dbgs()
1336 << "Adding nofree attr to fn " << F.getName() << "\n");
1337 F.setDoesNotFreeMemory();
1338 ++NumNoFree;
1339 },
1340 /* RequiresExactDefinition= */ true});
1341
Fedor Sergeev6660fd02018-03-23 21:46:16 +00001342 // Perform all the requested attribute inference actions.
1343 return AI.run(SCCNodes);
1344}
1345
James Molloy7e9bdd52015-11-12 10:55:20 +00001346static bool setDoesNotRecurse(Function &F) {
1347 if (F.doesNotRecurse())
1348 return false;
1349 F.setDoesNotRecurse();
1350 ++NumNoRecurse;
1351 return true;
1352}
1353
Chandler Carruth632d2082016-02-13 08:47:51 +00001354static bool addNoRecurseAttrs(const SCCNodeSet &SCCNodes) {
James Molloy7e9bdd52015-11-12 10:55:20 +00001355 // Try and identify functions that do not recurse.
1356
1357 // If the SCC contains multiple nodes we know for sure there is recursion.
Chandler Carruth632d2082016-02-13 08:47:51 +00001358 if (SCCNodes.size() != 1)
James Molloy7e9bdd52015-11-12 10:55:20 +00001359 return false;
1360
Chandler Carruth632d2082016-02-13 08:47:51 +00001361 Function *F = *SCCNodes.begin();
Vivek Pandya11cb15f2019-06-10 04:16:04 +00001362 if (!F || !F->hasExactDefinition() || F->doesNotRecurse())
James Molloy7e9bdd52015-11-12 10:55:20 +00001363 return false;
1364
1365 // If all of the calls in F are identifiable and are to norecurse functions, F
1366 // is norecurse. This check also detects self-recursion as F is not currently
1367 // marked norecurse, so any called from F to F will not be marked norecurse.
Christian Bruel4ead99b2018-12-05 16:48:00 +00001368 for (auto &BB : *F)
1369 for (auto &I : BB.instructionsWithoutDebug())
1370 if (auto CS = CallSite(&I)) {
1371 Function *Callee = CS.getCalledFunction();
1372 if (!Callee || Callee == F || !Callee->doesNotRecurse())
1373 // Function calls a potentially recursive function.
1374 return false;
1375 }
James Molloy7e9bdd52015-11-12 10:55:20 +00001376
Chandler Carruth632d2082016-02-13 08:47:51 +00001377 // Every call was to a non-recursive function other than this function, and
1378 // we have no indirect recursion as the SCC size is one. This function cannot
1379 // recurse.
1380 return setDoesNotRecurse(*F);
James Molloy7e9bdd52015-11-12 10:55:20 +00001381}
1382
Johannes Doerfertbed4bab2018-08-01 16:37:51 +00001383template <typename AARGetterT>
Brian Homerdingb4b21d82019-07-08 15:57:56 +00001384static bool deriveAttrsInPostOrder(SCCNodeSet &SCCNodes,
1385 AARGetterT &&AARGetter,
Johannes Doerfertbed4bab2018-08-01 16:37:51 +00001386 bool HasUnknownCall) {
1387 bool Changed = false;
1388
1389 // Bail if the SCC only contains optnone functions.
1390 if (SCCNodes.empty())
1391 return Changed;
1392
1393 Changed |= addArgumentReturnedAttrs(SCCNodes);
1394 Changed |= addReadAttrs(SCCNodes, AARGetter);
1395 Changed |= addArgumentAttrs(SCCNodes);
1396
1397 // If we have no external nodes participating in the SCC, we can deduce some
1398 // more precise attributes as well.
1399 if (!HasUnknownCall) {
1400 Changed |= addNoAliasAttrs(SCCNodes);
1401 Changed |= addNonNullAttrs(SCCNodes);
1402 Changed |= inferAttrsFromFunctionBodies(SCCNodes);
1403 Changed |= addNoRecurseAttrs(SCCNodes);
1404 }
1405
1406 return Changed;
1407}
1408
Chandler Carruthb47f8012016-03-11 11:05:24 +00001409PreservedAnalyses PostOrderFunctionAttrsPass::run(LazyCallGraph::SCC &C,
Chandler Carruth88823462016-08-24 09:37:14 +00001410 CGSCCAnalysisManager &AM,
1411 LazyCallGraph &CG,
1412 CGSCCUpdateResult &) {
Chandler Carruth9c4ed172016-02-18 11:03:11 +00001413 FunctionAnalysisManager &FAM =
Chandler Carruth88823462016-08-24 09:37:14 +00001414 AM.getResult<FunctionAnalysisManagerCGSCCProxy>(C, CG).getManager();
Chandler Carruth9c4ed172016-02-18 11:03:11 +00001415
Chandler Carruth9c4ed172016-02-18 11:03:11 +00001416 // We pass a lambda into functions to wire them up to the analysis manager
1417 // for getting function analyses.
1418 auto AARGetter = [&](Function &F) -> AAResults & {
1419 return FAM.getResult<AAManager>(F);
1420 };
1421
1422 // Fill SCCNodes with the elements of the SCC. Also track whether there are
1423 // any external or opt-none nodes that will prevent us from optimizing any
1424 // part of the SCC.
1425 SCCNodeSet SCCNodes;
1426 bool HasUnknownCall = false;
1427 for (LazyCallGraph::Node &N : C) {
1428 Function &F = N.getFunction();
Evandro Menezes85bd3972019-04-04 22:40:06 +00001429 if (F.hasOptNone() || F.hasFnAttribute(Attribute::Naked)) {
Chandler Carruth9c4ed172016-02-18 11:03:11 +00001430 // Treat any function we're trying not to optimize as if it were an
1431 // indirect call and omit it from the node set used below.
1432 HasUnknownCall = true;
1433 continue;
1434 }
1435 // Track whether any functions in this SCC have an unknown call edge.
1436 // Note: if this is ever a performance hit, we can common it with
1437 // subsequent routines which also do scans over the instructions of the
1438 // function.
1439 if (!HasUnknownCall)
1440 for (Instruction &I : instructions(F))
1441 if (auto CS = CallSite(&I))
1442 if (!CS.getCalledFunction()) {
1443 HasUnknownCall = true;
1444 break;
1445 }
1446
1447 SCCNodes.insert(&F);
1448 }
1449
Johannes Doerfertbed4bab2018-08-01 16:37:51 +00001450 if (deriveAttrsInPostOrder(SCCNodes, AARGetter, HasUnknownCall))
1451 return PreservedAnalyses::none();
Chandler Carruth9c4ed172016-02-18 11:03:11 +00001452
Johannes Doerfertbed4bab2018-08-01 16:37:51 +00001453 return PreservedAnalyses::all();
Chandler Carruth9c4ed172016-02-18 11:03:11 +00001454}
1455
1456namespace {
Eugene Zelenkof27d1612017-10-19 21:21:30 +00001457
Chandler Carruth9c4ed172016-02-18 11:03:11 +00001458struct PostOrderFunctionAttrsLegacyPass : public CallGraphSCCPass {
Eugene Zelenkof27d1612017-10-19 21:21:30 +00001459 // Pass identification, replacement for typeid
1460 static char ID;
1461
Chandler Carruth9c4ed172016-02-18 11:03:11 +00001462 PostOrderFunctionAttrsLegacyPass() : CallGraphSCCPass(ID) {
Chad Rosier611b73b2016-11-07 16:28:04 +00001463 initializePostOrderFunctionAttrsLegacyPassPass(
1464 *PassRegistry::getPassRegistry());
Chandler Carruth9c4ed172016-02-18 11:03:11 +00001465 }
1466
1467 bool runOnSCC(CallGraphSCC &SCC) override;
1468
1469 void getAnalysisUsage(AnalysisUsage &AU) const override {
1470 AU.setPreservesCFG();
Daniel Jasperaec2fa32016-12-19 08:22:17 +00001471 AU.addRequired<AssumptionCacheTracker>();
Chandler Carruth12884f72016-03-02 15:56:53 +00001472 getAAResultsAnalysisUsage(AU);
Chandler Carruth9c4ed172016-02-18 11:03:11 +00001473 CallGraphSCCPass::getAnalysisUsage(AU);
1474 }
Chandler Carruth9c4ed172016-02-18 11:03:11 +00001475};
Eugene Zelenkof27d1612017-10-19 21:21:30 +00001476
1477} // end anonymous namespace
Chandler Carruth9c4ed172016-02-18 11:03:11 +00001478
1479char PostOrderFunctionAttrsLegacyPass::ID = 0;
1480INITIALIZE_PASS_BEGIN(PostOrderFunctionAttrsLegacyPass, "functionattrs",
1481 "Deduce function attributes", false, false)
Daniel Jasperaec2fa32016-12-19 08:22:17 +00001482INITIALIZE_PASS_DEPENDENCY(AssumptionCacheTracker)
Chandler Carruth9c4ed172016-02-18 11:03:11 +00001483INITIALIZE_PASS_DEPENDENCY(CallGraphWrapperPass)
Chandler Carruth9c4ed172016-02-18 11:03:11 +00001484INITIALIZE_PASS_END(PostOrderFunctionAttrsLegacyPass, "functionattrs",
1485 "Deduce function attributes", false, false)
1486
Chad Rosier611b73b2016-11-07 16:28:04 +00001487Pass *llvm::createPostOrderFunctionAttrsLegacyPass() {
1488 return new PostOrderFunctionAttrsLegacyPass();
1489}
Chandler Carruth9c4ed172016-02-18 11:03:11 +00001490
Sean Silva997cbea2016-07-03 03:35:03 +00001491template <typename AARGetterT>
1492static bool runImpl(CallGraphSCC &SCC, AARGetterT AARGetter) {
Chandler Carruthc518ebd2015-10-29 18:29:15 +00001493
1494 // Fill SCCNodes with the elements of the SCC. Used for quickly looking up
1495 // whether a given CallGraphNode is in this SCC. Also track whether there are
1496 // any external or opt-none nodes that will prevent us from optimizing any
1497 // part of the SCC.
1498 SCCNodeSet SCCNodes;
1499 bool ExternalNode = false;
Benjamin Kramer135f7352016-06-26 12:28:59 +00001500 for (CallGraphNode *I : SCC) {
1501 Function *F = I->getFunction();
Evandro Menezes85bd3972019-04-04 22:40:06 +00001502 if (!F || F->hasOptNone() || F->hasFnAttribute(Attribute::Naked)) {
Chandler Carruthc518ebd2015-10-29 18:29:15 +00001503 // External node or function we're trying not to optimize - we both avoid
1504 // transform them and avoid leveraging information they provide.
1505 ExternalNode = true;
1506 continue;
1507 }
1508
1509 SCCNodes.insert(F);
1510 }
1511
Johannes Doerfertbed4bab2018-08-01 16:37:51 +00001512 return deriveAttrsInPostOrder(SCCNodes, AARGetter, ExternalNode);
James Molloy7e9bdd52015-11-12 10:55:20 +00001513}
Chandler Carruthc518ebd2015-10-29 18:29:15 +00001514
Sean Silva997cbea2016-07-03 03:35:03 +00001515bool PostOrderFunctionAttrsLegacyPass::runOnSCC(CallGraphSCC &SCC) {
1516 if (skipSCC(SCC))
1517 return false;
Peter Collingbournecea1e4e2017-02-09 23:11:52 +00001518 return runImpl(SCC, LegacyAARGetter(*this));
Sean Silva997cbea2016-07-03 03:35:03 +00001519}
1520
Chandler Carruth1926b702016-01-08 10:55:52 +00001521namespace {
Eugene Zelenkof27d1612017-10-19 21:21:30 +00001522
Sean Silvaf5080192016-06-12 07:48:51 +00001523struct ReversePostOrderFunctionAttrsLegacyPass : public ModulePass {
Eugene Zelenkof27d1612017-10-19 21:21:30 +00001524 // Pass identification, replacement for typeid
1525 static char ID;
1526
Sean Silvaf5080192016-06-12 07:48:51 +00001527 ReversePostOrderFunctionAttrsLegacyPass() : ModulePass(ID) {
Chad Rosier611b73b2016-11-07 16:28:04 +00001528 initializeReversePostOrderFunctionAttrsLegacyPassPass(
1529 *PassRegistry::getPassRegistry());
Chandler Carruth1926b702016-01-08 10:55:52 +00001530 }
1531
1532 bool runOnModule(Module &M) override;
1533
1534 void getAnalysisUsage(AnalysisUsage &AU) const override {
1535 AU.setPreservesCFG();
1536 AU.addRequired<CallGraphWrapperPass>();
Mehdi Amini0ddf4042016-05-02 18:03:33 +00001537 AU.addPreserved<CallGraphWrapperPass>();
Chandler Carruth1926b702016-01-08 10:55:52 +00001538 }
1539};
Eugene Zelenkof27d1612017-10-19 21:21:30 +00001540
1541} // end anonymous namespace
Chandler Carruth1926b702016-01-08 10:55:52 +00001542
Sean Silvaf5080192016-06-12 07:48:51 +00001543char ReversePostOrderFunctionAttrsLegacyPass::ID = 0;
Eugene Zelenkof27d1612017-10-19 21:21:30 +00001544
Sean Silvaf5080192016-06-12 07:48:51 +00001545INITIALIZE_PASS_BEGIN(ReversePostOrderFunctionAttrsLegacyPass, "rpo-functionattrs",
Chandler Carruth1926b702016-01-08 10:55:52 +00001546 "Deduce function attributes in RPO", false, false)
1547INITIALIZE_PASS_DEPENDENCY(CallGraphWrapperPass)
Sean Silvaf5080192016-06-12 07:48:51 +00001548INITIALIZE_PASS_END(ReversePostOrderFunctionAttrsLegacyPass, "rpo-functionattrs",
Chandler Carruth1926b702016-01-08 10:55:52 +00001549 "Deduce function attributes in RPO", false, false)
1550
1551Pass *llvm::createReversePostOrderFunctionAttrsPass() {
Sean Silvaf5080192016-06-12 07:48:51 +00001552 return new ReversePostOrderFunctionAttrsLegacyPass();
Chandler Carruth1926b702016-01-08 10:55:52 +00001553}
1554
1555static bool addNoRecurseAttrsTopDown(Function &F) {
1556 // We check the preconditions for the function prior to calling this to avoid
1557 // the cost of building up a reversible post-order list. We assert them here
1558 // to make sure none of the invariants this relies on were violated.
1559 assert(!F.isDeclaration() && "Cannot deduce norecurse without a definition!");
1560 assert(!F.doesNotRecurse() &&
1561 "This function has already been deduced as norecurs!");
1562 assert(F.hasInternalLinkage() &&
1563 "Can only do top-down deduction for internal linkage functions!");
1564
1565 // If F is internal and all of its uses are calls from a non-recursive
1566 // functions, then none of its calls could in fact recurse without going
1567 // through a function marked norecurse, and so we can mark this function too
1568 // as norecurse. Note that the uses must actually be calls -- otherwise
1569 // a pointer to this function could be returned from a norecurse function but
1570 // this function could be recursively (indirectly) called. Note that this
1571 // also detects if F is directly recursive as F is not yet marked as
1572 // a norecurse function.
1573 for (auto *U : F.users()) {
1574 auto *I = dyn_cast<Instruction>(U);
1575 if (!I)
1576 return false;
1577 CallSite CS(I);
1578 if (!CS || !CS.getParent()->getParent()->doesNotRecurse())
1579 return false;
1580 }
1581 return setDoesNotRecurse(F);
1582}
1583
Sean Silvaadc79392016-06-12 05:44:51 +00001584static bool deduceFunctionAttributeInRPO(Module &M, CallGraph &CG) {
Chandler Carruth1926b702016-01-08 10:55:52 +00001585 // We only have a post-order SCC traversal (because SCCs are inherently
1586 // discovered in post-order), so we accumulate them in a vector and then walk
1587 // it in reverse. This is simpler than using the RPO iterator infrastructure
1588 // because we need to combine SCC detection and the PO walk of the call
1589 // graph. We can also cheat egregiously because we're primarily interested in
1590 // synthesizing norecurse and so we can only save the singular SCCs as SCCs
1591 // with multiple functions in them will clearly be recursive.
Chandler Carruth1926b702016-01-08 10:55:52 +00001592 SmallVector<Function *, 16> Worklist;
1593 for (scc_iterator<CallGraph *> I = scc_begin(&CG); !I.isAtEnd(); ++I) {
1594 if (I->size() != 1)
1595 continue;
1596
1597 Function *F = I->front()->getFunction();
1598 if (F && !F->isDeclaration() && !F->doesNotRecurse() &&
1599 F->hasInternalLinkage())
1600 Worklist.push_back(F);
1601 }
1602
James Molloy7e9bdd52015-11-12 10:55:20 +00001603 bool Changed = false;
Eugene Zelenkof27d1612017-10-19 21:21:30 +00001604 for (auto *F : llvm::reverse(Worklist))
Chandler Carruth1926b702016-01-08 10:55:52 +00001605 Changed |= addNoRecurseAttrsTopDown(*F);
1606
Duncan Sands44c8cd92008-12-31 16:14:43 +00001607 return Changed;
1608}
Sean Silvaadc79392016-06-12 05:44:51 +00001609
Sean Silvaf5080192016-06-12 07:48:51 +00001610bool ReversePostOrderFunctionAttrsLegacyPass::runOnModule(Module &M) {
Sean Silvaadc79392016-06-12 05:44:51 +00001611 if (skipModule(M))
1612 return false;
1613
1614 auto &CG = getAnalysis<CallGraphWrapperPass>().getCallGraph();
1615
1616 return deduceFunctionAttributeInRPO(M, CG);
1617}
Sean Silvaf5080192016-06-12 07:48:51 +00001618
1619PreservedAnalyses
Sean Silvafd03ac62016-08-09 00:28:38 +00001620ReversePostOrderFunctionAttrsPass::run(Module &M, ModuleAnalysisManager &AM) {
Sean Silvaf5080192016-06-12 07:48:51 +00001621 auto &CG = AM.getResult<CallGraphAnalysis>(M);
1622
Chandler Carruth6acdca72017-01-24 12:55:57 +00001623 if (!deduceFunctionAttributeInRPO(M, CG))
Sean Silvaf5080192016-06-12 07:48:51 +00001624 return PreservedAnalyses::all();
Chandler Carruth6acdca72017-01-24 12:55:57 +00001625
Sean Silvaf5080192016-06-12 07:48:51 +00001626 PreservedAnalyses PA;
1627 PA.preserve<CallGraphAnalysis>();
1628 return PA;
1629}