blob: bb1ebda90849ef43ea426e24e8f13f94f7c9f197 [file] [log] [blame]
//===--- CodeGenTBAA.cpp - TBAA information for LLVM CodeGen --------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
Dan Gohman565cc442010-10-21 18:49:12 +000010// This is the code that manages TBAA information and defines the TBAA policy
11// for the optimizer to use. Relevant standards text includes:
Dan Gohman780658a2010-10-15 20:54:41 +000012//
13// C99 6.5p7
14// C++ [basic.lval] (p10 in n3126, p15 in some earlier versions)
Dan Gohman3d5aff52010-10-14 23:06:10 +000015//
16//===----------------------------------------------------------------------===//
17
18#include "CodeGenTBAA.h"
19#include "clang/AST/ASTContext.h"
Benjamin Kramer2fa67ef2012-12-01 15:09:41 +000020#include "clang/AST/Attr.h"
Peter Collingbourne14110472011-01-13 18:57:25 +000021#include "clang/AST/Mangle.h"
Benjamin Kramer2fa67ef2012-12-01 15:09:41 +000022#include "clang/AST/RecordLayout.h"
Kostya Serebryanyc9fe6052012-04-24 06:57:01 +000023#include "clang/Frontend/CodeGenOptions.h"
Manman Renb37a73d2013-04-04 21:53:22 +000024#include "llvm/ADT/SmallSet.h"
Chandler Carruth3b844ba2013-01-02 11:45:17 +000025#include "llvm/IR/Constants.h"
26#include "llvm/IR/LLVMContext.h"
27#include "llvm/IR/Metadata.h"
28#include "llvm/IR/Type.h"
Dan Gohman3d5aff52010-10-14 23:06:10 +000029using namespace clang;
30using namespace CodeGen;
31
32CodeGenTBAA::CodeGenTBAA(ASTContext &Ctx, llvm::LLVMContext& VMContext,
Kostya Serebryanyc9fe6052012-04-24 06:57:01 +000033 const CodeGenOptions &CGO,
Dan Gohman0b5c4fc2010-10-15 20:23:12 +000034 const LangOptions &Features, MangleContext &MContext)
Benjamin Kramerfacde172012-06-06 17:32:50 +000035 : Context(Ctx), CodeGenOpts(CGO), Features(Features), MContext(MContext),
Duncan Sands2d7cb062012-04-15 18:04:54 +000036 MDHelper(VMContext), Root(0), Char(0) {
Dan Gohman3d5aff52010-10-14 23:06:10 +000037}
38
39CodeGenTBAA::~CodeGenTBAA() {
40}
41
Dan Gohman224d7592010-10-25 21:48:30 +000042llvm::MDNode *CodeGenTBAA::getRoot() {
43 // Define the root of the tree. This identifies the tree, so that
44 // if our LLVM IR is linked with LLVM IR from a different front-end
45 // (or a different version of this front-end), their TBAA trees will
46 // remain distinct, and the optimizer will treat them conservatively.
47 if (!Root)
Duncan Sands60c77072012-04-16 16:29:47 +000048 Root = MDHelper.createTBAARoot("Simple C/C++ TBAA");
Dan Gohman224d7592010-10-25 21:48:30 +000049
50 return Root;
51}
52
Manman Renca835182013-04-11 23:02:56 +000053// For struct-path aware TBAA, the scalar type has the same format as
54// the struct type: name, offset, pointer to another node in the type DAG.
55// For scalar TBAA, the scalar type is the same as the scalar tag:
56// name and a parent pointer.
57llvm::MDNode *CodeGenTBAA::createTBAAScalarType(StringRef Name,
58 llvm::MDNode *Parent) {
59 if (CodeGenOpts.StructPathTBAA)
60 return MDHelper.createTBAAScalarTypeNode(Name, 0, Parent);
61 else
62 return MDHelper.createTBAANode(Name, Parent);
63}
64
Dan Gohman224d7592010-10-25 21:48:30 +000065llvm::MDNode *CodeGenTBAA::getChar() {
66 // Define the root of the tree for user-accessible memory. C and C++
67 // give special powers to char and certain similar types. However,
68 // these special powers only cover user-accessible memory, and doesn't
69 // include things like vtables.
70 if (!Char)
Manman Renca835182013-04-11 23:02:56 +000071 Char = createTBAAScalarType("omnipotent char", getRoot());
Dan Gohman224d7592010-10-25 21:48:30 +000072
73 return Char;
74}
75
Dan Gohman2ea7e732010-12-13 23:51:08 +000076static bool TypeHasMayAlias(QualType QTy) {
77 // Tagged types have declarations, and therefore may have attributes.
78 if (const TagType *TTy = dyn_cast<TagType>(QTy))
79 return TTy->getDecl()->hasAttr<MayAliasAttr>();
80
81 // Typedef types have declarations, and therefore may have attributes.
82 if (const TypedefType *TTy = dyn_cast<TypedefType>(QTy)) {
83 if (TTy->getDecl()->hasAttr<MayAliasAttr>())
84 return true;
85 // Also, their underlying types may have relevant attributes.
86 return TypeHasMayAlias(TTy->desugar());
87 }
88
89 return false;
90}
91
Dan Gohman3d5aff52010-10-14 23:06:10 +000092llvm::MDNode *
93CodeGenTBAA::getTBAAInfo(QualType QTy) {
Kostya Serebryanyc9fe6052012-04-24 06:57:01 +000094 // At -O0 TBAA is not emitted for regular types.
95 if (CodeGenOpts.OptimizationLevel == 0 || CodeGenOpts.RelaxedAliasing)
96 return NULL;
97
Dan Gohman2ea7e732010-12-13 23:51:08 +000098 // If the type has the may_alias attribute (even on a typedef), it is
99 // effectively in the general char alias class.
100 if (TypeHasMayAlias(QTy))
101 return getChar();
102
John McCallf4c73712011-01-19 06:33:43 +0000103 const Type *Ty = Context.getCanonicalType(QTy).getTypePtr();
Dan Gohman3d5aff52010-10-14 23:06:10 +0000104
105 if (llvm::MDNode *N = MetadataCache[Ty])
106 return N;
107
Dan Gohman565cc442010-10-21 18:49:12 +0000108 // Handle builtin types.
Dan Gohman9af2f832010-10-14 23:39:00 +0000109 if (const BuiltinType *BTy = dyn_cast<BuiltinType>(Ty)) {
Dan Gohman3d5aff52010-10-14 23:06:10 +0000110 switch (BTy->getKind()) {
Dan Gohman85623482010-10-15 17:52:03 +0000111 // Character types are special and can alias anything.
112 // In C++, this technically only includes "char" and "unsigned char",
113 // and not "signed char". In C, it includes all three. For now,
Dan Gohman0a531982010-10-15 20:24:10 +0000114 // the risk of exploiting this detail in C++ seems likely to outweigh
Dan Gohman85623482010-10-15 17:52:03 +0000115 // the benefit.
Dan Gohman3d5aff52010-10-14 23:06:10 +0000116 case BuiltinType::Char_U:
117 case BuiltinType::Char_S:
118 case BuiltinType::UChar:
119 case BuiltinType::SChar:
Dan Gohman224d7592010-10-25 21:48:30 +0000120 return getChar();
Dan Gohman9af2f832010-10-14 23:39:00 +0000121
122 // Unsigned types can alias their corresponding signed types.
123 case BuiltinType::UShort:
124 return getTBAAInfo(Context.ShortTy);
125 case BuiltinType::UInt:
126 return getTBAAInfo(Context.IntTy);
127 case BuiltinType::ULong:
128 return getTBAAInfo(Context.LongTy);
129 case BuiltinType::ULongLong:
130 return getTBAAInfo(Context.LongLongTy);
131 case BuiltinType::UInt128:
132 return getTBAAInfo(Context.Int128Ty);
133
Dan Gohman2f8c21d2010-10-15 20:24:53 +0000134 // Treat all other builtin types as distinct types. This includes
135 // treating wchar_t, char16_t, and char32_t as distinct from their
136 // "underlying types".
Dan Gohman3d5aff52010-10-14 23:06:10 +0000137 default:
138 return MetadataCache[Ty] =
Manman Renca835182013-04-11 23:02:56 +0000139 createTBAAScalarType(BTy->getName(Features), getChar());
Dan Gohman3d5aff52010-10-14 23:06:10 +0000140 }
141 }
142
Dan Gohman565cc442010-10-21 18:49:12 +0000143 // Handle pointers.
Dan Gohmandc491112010-10-15 20:26:20 +0000144 // TODO: Implement C++'s type "similarity" and consider dis-"similar"
145 // pointers distinct.
Dan Gohmanc1028f42010-10-15 00:01:39 +0000146 if (Ty->isPointerType())
Manman Renca835182013-04-11 23:02:56 +0000147 return MetadataCache[Ty] = createTBAAScalarType("any pointer",
148 getChar());
Dan Gohmanc1028f42010-10-15 00:01:39 +0000149
Dan Gohman0b5c4fc2010-10-15 20:23:12 +0000150 // Enum types are distinct types. In C++ they have "underlying types",
151 // however they aren't related for TBAA.
152 if (const EnumType *ETy = dyn_cast<EnumType>(Ty)) {
Sylvestre Ledruf3477c12012-09-27 10:16:10 +0000153 // In C mode, two anonymous enums are compatible iff their members
Dan Gohman0b5c4fc2010-10-15 20:23:12 +0000154 // are the same -- see C99 6.2.7p1. For now, be conservative. We could
155 // theoretically implement this by combining information about all the
156 // members into a single identifying MDNode.
157 if (!Features.CPlusPlus &&
Richard Smith162e1c12011-04-15 14:24:37 +0000158 ETy->getDecl()->getTypedefNameForAnonDecl())
Dan Gohman224d7592010-10-25 21:48:30 +0000159 return MetadataCache[Ty] = getChar();
Dan Gohman0b5c4fc2010-10-15 20:23:12 +0000160
161 // In C++ mode, types have linkage, so we can rely on the ODR and
162 // on their mangled names, if they're external.
163 // TODO: Is there a way to get a program-wide unique name for a
164 // decl with local linkage or no linkage?
165 if (Features.CPlusPlus &&
166 ETy->getDecl()->getLinkage() != ExternalLinkage)
Dan Gohman224d7592010-10-25 21:48:30 +0000167 return MetadataCache[Ty] = getChar();
Dan Gohman0b5c4fc2010-10-15 20:23:12 +0000168
169 // TODO: This is using the RTTI name. Is there a better way to get
170 // a unique string for a type?
Dylan Noblesmithf7ccbad2012-02-05 02:13:05 +0000171 SmallString<256> OutName;
Rafael Espindolaf0be9792011-02-11 02:52:17 +0000172 llvm::raw_svector_ostream Out(OutName);
173 MContext.mangleCXXRTTIName(QualType(ETy, 0), Out);
174 Out.flush();
Manman Renca835182013-04-11 23:02:56 +0000175 return MetadataCache[Ty] = createTBAAScalarType(OutName, getChar());
Dan Gohman0b5c4fc2010-10-15 20:23:12 +0000176 }
177
Dan Gohman9af2f832010-10-14 23:39:00 +0000178 // For now, handle any other kind of type conservatively.
Dan Gohman224d7592010-10-25 21:48:30 +0000179 return MetadataCache[Ty] = getChar();
Dan Gohman3d5aff52010-10-14 23:06:10 +0000180}
Kostya Serebryany8cb4a072012-03-26 17:03:51 +0000181
182llvm::MDNode *CodeGenTBAA::getTBAAInfoForVTablePtr() {
Manman Renca835182013-04-11 23:02:56 +0000183 return createTBAAScalarType("vtable pointer", getRoot());
Kostya Serebryany8cb4a072012-03-26 17:03:51 +0000184}
Dan Gohmanb22c7dc2012-09-28 21:58:29 +0000185
186bool
187CodeGenTBAA::CollectFields(uint64_t BaseOffset,
188 QualType QTy,
189 SmallVectorImpl<llvm::MDBuilder::TBAAStructField> &
190 Fields,
191 bool MayAlias) {
192 /* Things not handled yet include: C++ base classes, bitfields, */
193
194 if (const RecordType *TTy = QTy->getAs<RecordType>()) {
195 const RecordDecl *RD = TTy->getDecl()->getDefinition();
196 if (RD->hasFlexibleArrayMember())
197 return false;
198
199 // TODO: Handle C++ base classes.
200 if (const CXXRecordDecl *Decl = dyn_cast<CXXRecordDecl>(RD))
201 if (Decl->bases_begin() != Decl->bases_end())
202 return false;
203
204 const ASTRecordLayout &Layout = Context.getASTRecordLayout(RD);
205
206 unsigned idx = 0;
207 for (RecordDecl::field_iterator i = RD->field_begin(),
208 e = RD->field_end(); i != e; ++i, ++idx) {
209 uint64_t Offset = BaseOffset +
210 Layout.getFieldOffset(idx) / Context.getCharWidth();
211 QualType FieldQTy = i->getType();
212 if (!CollectFields(Offset, FieldQTy, Fields,
213 MayAlias || TypeHasMayAlias(FieldQTy)))
214 return false;
215 }
216 return true;
217 }
218
219 /* Otherwise, treat whatever it is as a field. */
220 uint64_t Offset = BaseOffset;
221 uint64_t Size = Context.getTypeSizeInChars(QTy).getQuantity();
222 llvm::MDNode *TBAAInfo = MayAlias ? getChar() : getTBAAInfo(QTy);
223 Fields.push_back(llvm::MDBuilder::TBAAStructField(Offset, Size, TBAAInfo));
224 return true;
225}
226
227llvm::MDNode *
228CodeGenTBAA::getTBAAStructInfo(QualType QTy) {
229 const Type *Ty = Context.getCanonicalType(QTy).getTypePtr();
230
231 if (llvm::MDNode *N = StructMetadataCache[Ty])
232 return N;
233
234 SmallVector<llvm::MDBuilder::TBAAStructField, 4> Fields;
235 if (CollectFields(0, QTy, Fields, TypeHasMayAlias(QTy)))
236 return MDHelper.createTBAAStructNode(Fields);
237
238 // For now, handle any other kind of type conservatively.
239 return StructMetadataCache[Ty] = NULL;
240}
Manman Renb37a73d2013-04-04 21:53:22 +0000241
242/// Check if the given type can be handled by path-aware TBAA.
243static bool isTBAAPathStruct(QualType QTy) {
244 if (const RecordType *TTy = QTy->getAs<RecordType>()) {
245 const RecordDecl *RD = TTy->getDecl()->getDefinition();
246 // RD can be struct, union, class, interface or enum.
247 // For now, we only handle struct.
248 if (RD->isStruct() && !RD->hasFlexibleArrayMember())
249 return true;
250 }
251 return false;
252}
253
254llvm::MDNode *
255CodeGenTBAA::getTBAAStructTypeInfo(QualType QTy) {
256 const Type *Ty = Context.getCanonicalType(QTy).getTypePtr();
257 assert(isTBAAPathStruct(QTy));
258
259 if (llvm::MDNode *N = StructTypeMetadataCache[Ty])
260 return N;
261
262 if (const RecordType *TTy = QTy->getAs<RecordType>()) {
263 const RecordDecl *RD = TTy->getDecl()->getDefinition();
264
265 const ASTRecordLayout &Layout = Context.getASTRecordLayout(RD);
266 SmallVector <std::pair<uint64_t, llvm::MDNode*>, 4> Fields;
Manman Renb37a73d2013-04-04 21:53:22 +0000267 unsigned idx = 0;
268 for (RecordDecl::field_iterator i = RD->field_begin(),
269 e = RD->field_end(); i != e; ++i, ++idx) {
270 QualType FieldQTy = i->getType();
271 llvm::MDNode *FieldNode;
272 if (isTBAAPathStruct(FieldQTy))
273 FieldNode = getTBAAStructTypeInfo(FieldQTy);
Manman Renca835182013-04-11 23:02:56 +0000274 else
Manman Renb37a73d2013-04-04 21:53:22 +0000275 FieldNode = getTBAAInfo(FieldQTy);
Manman Renb37a73d2013-04-04 21:53:22 +0000276 if (!FieldNode)
277 return StructTypeMetadataCache[Ty] = NULL;
278 Fields.push_back(std::make_pair(
279 Layout.getFieldOffset(idx) / Context.getCharWidth(), FieldNode));
280 }
281
282 // TODO: This is using the RTTI name. Is there a better way to get
283 // a unique string for a type?
284 SmallString<256> OutName;
285 llvm::raw_svector_ostream Out(OutName);
286 MContext.mangleCXXRTTIName(QualType(Ty, 0), Out);
287 Out.flush();
288 // Create the struct type node with a vector of pairs (offset, type).
289 return StructTypeMetadataCache[Ty] =
290 MDHelper.createTBAAStructTypeNode(OutName, Fields);
291 }
292
293 return StructMetadataCache[Ty] = NULL;
294}
295
296llvm::MDNode *
297CodeGenTBAA::getTBAAStructTagInfo(QualType BaseQTy, llvm::MDNode *AccessNode,
298 uint64_t Offset) {
299 if (!CodeGenOpts.StructPathTBAA)
300 return AccessNode;
301
302 const Type *BTy = Context.getCanonicalType(BaseQTy).getTypePtr();
303 TBAAPathTag PathTag = TBAAPathTag(BTy, AccessNode, Offset);
304 if (llvm::MDNode *N = StructTagMetadataCache[PathTag])
305 return N;
306
307 llvm::MDNode *BNode = 0;
308 if (isTBAAPathStruct(BaseQTy))
309 BNode = getTBAAStructTypeInfo(BaseQTy);
310 if (!BNode)
Manman Renca835182013-04-11 23:02:56 +0000311 return StructTagMetadataCache[PathTag] =
312 MDHelper.createTBAAStructTagNode(AccessNode, AccessNode, 0);
Manman Renb37a73d2013-04-04 21:53:22 +0000313
314 return StructTagMetadataCache[PathTag] =
315 MDHelper.createTBAAStructTagNode(BNode, AccessNode, Offset);
316}
Manman Renca835182013-04-11 23:02:56 +0000317
318llvm::MDNode *
319CodeGenTBAA::getTBAAScalarTagInfo(llvm::MDNode *AccessNode) {
320 if (llvm::MDNode *N = ScalarTagMetadataCache[AccessNode])
321 return N;
322
323 return ScalarTagMetadataCache[AccessNode] =
324 MDHelper.createTBAAStructTagNode(AccessNode, AccessNode, 0);
325}