blob: c4296c3f1c7bd829e58ca641cf77d508fb38eb15 [file] [log] [blame]
Ted Kremenek8fbc88e2007-12-04 22:42:20 +00001///===--- FileManager.cpp - File System Probing and Caching ----------------===//
Reid Spencer5f016e22007-07-11 17:01:13 +00002//
3// The LLVM Compiler Infrastructure
4//
Chris Lattner0bc735f2007-12-29 19:59:25 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Reid Spencer5f016e22007-07-11 17:01:13 +00007//
8//===----------------------------------------------------------------------===//
9//
10// This file implements the FileManager interface.
11//
12//===----------------------------------------------------------------------===//
13//
14// TODO: This should index all interesting directories with dirent calls.
15// getdirentries ?
16// opendir/readdir_r/closedir ?
17//
18//===----------------------------------------------------------------------===//
19
20#include "clang/Basic/FileManager.h"
21#include "llvm/ADT/SmallString.h"
Chris Lattnerd57a7ef2009-08-23 22:45:33 +000022#include "llvm/Support/raw_ostream.h"
Douglas Gregor4fed3f42009-04-27 18:38:38 +000023#include "llvm/System/Path.h"
Ted Kremenek6bb816a2008-02-24 03:15:25 +000024#include "llvm/Config/config.h"
Benjamin Kramer458fb102009-09-05 09:49:39 +000025#include <map>
26#include <set>
27#include <string>
Reid Spencer5f016e22007-07-11 17:01:13 +000028using namespace clang;
29
30// FIXME: Enhance libsystem to support inode and other fields.
31#include <sys/stat.h>
32
// Supply the POSIX S_ISDIR test when building with MSVC and it has not already
// been defined.  The argument is parenthesized so that an expression such as
// S_ISDIR(a | b) expands as intended, and the file-type bits are isolated with
// _S_IFMT before being compared against _S_IFDIR, so the result is 0 or 1.
#if defined(_MSC_VER) && !defined(S_ISDIR)
#define S_ISDIR(s) (((s) & _S_IFMT) == _S_IFDIR)
#endif
Reid Spencer5f016e22007-07-11 17:01:13 +000036
/// NON_EXISTENT_DIR - Sentinel pointer value, different from null, that marks
/// a directory name which has been looked up and found not to exist on disk.
#define NON_EXISTENT_DIR \
  reinterpret_cast<DirectoryEntry*>(static_cast<intptr_t>(-1))
Reid Spencer5f016e22007-07-11 17:01:13 +000040
Ted Kremenekcb8d58b2009-01-28 00:27:31 +000041//===----------------------------------------------------------------------===//
42// Windows.
43//===----------------------------------------------------------------------===//
44
Ted Kremenek6bb816a2008-02-24 03:15:25 +000045#ifdef LLVM_ON_WIN32
46
/// IS_DIR_SEPARATOR_CHAR - Nonzero if \p x is a path separator.  In this
/// (LLVM_ON_WIN32) branch both '/' and '\\' are accepted.
#define IS_DIR_SEPARATOR_CHAR(x) (((x) == '/') || ((x) == '\\'))
48
49namespace {
Mike Stump1eb44332009-09-09 15:08:12 +000050 static std::string GetFullPath(const char *relPath) {
Ted Kremenek6bb816a2008-02-24 03:15:25 +000051 char *absPathStrPtr = _fullpath(NULL, relPath, 0);
52 assert(absPathStrPtr && "_fullpath() returned NULL!");
53
54 std::string absPath(absPathStrPtr);
55
56 free(absPathStrPtr);
57 return absPath;
58 }
59}
60
61class FileManager::UniqueDirContainer {
62 /// UniqueDirs - Cache from full path to existing directories/files.
63 ///
Mike Stump1eb44332009-09-09 15:08:12 +000064 llvm::StringMap<DirectoryEntry> UniqueDirs;
Ted Kremenek6bb816a2008-02-24 03:15:25 +000065
66public:
67 DirectoryEntry &getDirectory(const char *Name, struct stat &StatBuf) {
68 std::string FullPath(GetFullPath(Name));
69 return UniqueDirs.GetOrCreateValue(
70 FullPath.c_str(),
71 FullPath.c_str() + FullPath.size()
72 ).getValue();
73 }
Mike Stump1eb44332009-09-09 15:08:12 +000074
Ted Kremenek6bb816a2008-02-24 03:15:25 +000075 size_t size() { return UniqueDirs.size(); }
76};
77
78class FileManager::UniqueFileContainer {
79 /// UniqueFiles - Cache from full path to existing directories/files.
80 ///
Ted Kremenek75368892009-01-28 01:01:07 +000081 llvm::StringMap<FileEntry, llvm::BumpPtrAllocator> UniqueFiles;
Ted Kremenek6bb816a2008-02-24 03:15:25 +000082
83public:
84 FileEntry &getFile(const char *Name, struct stat &StatBuf) {
85 std::string FullPath(GetFullPath(Name));
86 return UniqueFiles.GetOrCreateValue(
87 FullPath.c_str(),
88 FullPath.c_str() + FullPath.size()
89 ).getValue();
90 }
91
92 size_t size() { return UniqueFiles.size(); }
93};
94
Ted Kremenekcb8d58b2009-01-28 00:27:31 +000095//===----------------------------------------------------------------------===//
96// Unix-like Systems.
97//===----------------------------------------------------------------------===//
98
Ted Kremenek6bb816a2008-02-24 03:15:25 +000099#else
100
/// IS_DIR_SEPARATOR_CHAR - Nonzero if \p x is a path separator.  In this
/// (non-Windows) branch only '/' qualifies.
#define IS_DIR_SEPARATOR_CHAR(x) ('/' == (x))
102
103class FileManager::UniqueDirContainer {
104 /// UniqueDirs - Cache from ID's to existing directories/files.
105 ///
Mike Stump1eb44332009-09-09 15:08:12 +0000106 std::map<std::pair<dev_t, ino_t>, DirectoryEntry> UniqueDirs;
Ted Kremenek6bb816a2008-02-24 03:15:25 +0000107
108public:
109 DirectoryEntry &getDirectory(const char *Name, struct stat &StatBuf) {
110 return UniqueDirs[std::make_pair(StatBuf.st_dev, StatBuf.st_ino)];
111 }
112
113 size_t size() { return UniqueDirs.size(); }
114};
115
116class FileManager::UniqueFileContainer {
117 /// UniqueFiles - Cache from ID's to existing directories/files.
118 ///
119 std::set<FileEntry> UniqueFiles;
120
121public:
122 FileEntry &getFile(const char *Name, struct stat &StatBuf) {
123 return
124 const_cast<FileEntry&>(
125 *UniqueFiles.insert(FileEntry(StatBuf.st_dev,
Ted Kremenek96438f32009-02-12 03:17:57 +0000126 StatBuf.st_ino,
127 StatBuf.st_mode)).first);
Ted Kremenek6bb816a2008-02-24 03:15:25 +0000128 }
129
130 size_t size() { return UniqueFiles.size(); }
131};
132
133#endif
134
Ted Kremenekcb8d58b2009-01-28 00:27:31 +0000135//===----------------------------------------------------------------------===//
136// Common logic.
137//===----------------------------------------------------------------------===//
Ted Kremenek6bb816a2008-02-24 03:15:25 +0000138
Ted Kremenek96438f32009-02-12 03:17:57 +0000139FileManager::FileManager()
Ted Kremenekfc7052d2009-02-12 00:39:05 +0000140 : UniqueDirs(*new UniqueDirContainer),
141 UniqueFiles(*new UniqueFileContainer),
Ted Kremenek96438f32009-02-12 03:17:57 +0000142 DirEntries(64), FileEntries(64), NextFileUID(0) {
Ted Kremenek6bb816a2008-02-24 03:15:25 +0000143 NumDirLookups = NumFileLookups = 0;
144 NumDirCacheMisses = NumFileCacheMisses = 0;
145}
146
147FileManager::~FileManager() {
148 delete &UniqueDirs;
149 delete &UniqueFiles;
Douglas Gregor057e5672009-12-02 18:12:28 +0000150 for (llvm::SmallVectorImpl<FileEntry *>::iterator
151 V = VirtualFileEntries.begin(),
152 VEnd = VirtualFileEntries.end();
153 V != VEnd;
154 ++V)
155 delete *V;
Ted Kremenek6bb816a2008-02-24 03:15:25 +0000156}
157
Douglas Gregor52e71082009-10-16 18:18:30 +0000158void FileManager::addStatCache(StatSysCallCache *statCache, bool AtBeginning) {
159 assert(statCache && "No stat cache provided?");
160 if (AtBeginning || StatCache.get() == 0) {
161 statCache->setNextStatCache(StatCache.take());
162 StatCache.reset(statCache);
163 return;
164 }
165
166 StatSysCallCache *LastCache = StatCache.get();
167 while (LastCache->getNextStatCache())
168 LastCache = LastCache->getNextStatCache();
169
170 LastCache->setNextStatCache(statCache);
171}
172
173void FileManager::removeStatCache(StatSysCallCache *statCache) {
174 if (!statCache)
175 return;
176
177 if (StatCache.get() == statCache) {
178 // This is the first stat cache.
179 StatCache.reset(StatCache->takeNextStatCache());
180 return;
181 }
182
183 // Find the stat cache in the list.
184 StatSysCallCache *PrevCache = StatCache.get();
185 while (PrevCache && PrevCache->getNextStatCache() != statCache)
186 PrevCache = PrevCache->getNextStatCache();
187 if (PrevCache)
188 PrevCache->setNextStatCache(statCache->getNextStatCache());
189 else
190 assert(false && "Stat cache not found for removal");
191}
192
Douglas Gregor057e5672009-12-02 18:12:28 +0000193/// \brief Retrieve the directory that the given file name resides in.
194static const DirectoryEntry *getDirectoryFromFile(FileManager &FileMgr,
195 const char *NameStart,
196 const char *NameEnd) {
197 // Figure out what directory it is in. If the string contains a / in it,
198 // strip off everything after it.
199 // FIXME: this logic should be in sys::Path.
200 const char *SlashPos = NameEnd-1;
201 while (SlashPos >= NameStart && !IS_DIR_SEPARATOR_CHAR(SlashPos[0]))
202 --SlashPos;
203 // Ignore duplicate //'s.
204 while (SlashPos > NameStart && IS_DIR_SEPARATOR_CHAR(SlashPos[-1]))
205 --SlashPos;
206
207 if (SlashPos < NameStart) {
208 // Use the current directory if file has no path component.
209 const char *Name = ".";
210 return FileMgr.getDirectory(Name, Name+1);
211 } else if (SlashPos == NameEnd-1)
212 return 0; // If filename ends with a /, it's a directory.
213 else
214 return FileMgr.getDirectory(NameStart, SlashPos);
215}
216
Reid Spencer5f016e22007-07-11 17:01:13 +0000217/// getDirectory - Lookup, cache, and verify the specified directory. This
218/// returns null if the directory doesn't exist.
Mike Stump1eb44332009-09-09 15:08:12 +0000219///
Reid Spencer5f016e22007-07-11 17:01:13 +0000220const DirectoryEntry *FileManager::getDirectory(const char *NameStart,
221 const char *NameEnd) {
John Thompson9a6ac542009-12-18 14:18:21 +0000222 // stat doesn't like trailing separators (at least on Windows).
223 if (((NameEnd - NameStart) > 1) &&
224 ((*(NameEnd - 1) == '/') || (*(NameEnd - 1) == '\\')))
225 NameEnd--;
226
Reid Spencer5f016e22007-07-11 17:01:13 +0000227 ++NumDirLookups;
228 llvm::StringMapEntry<DirectoryEntry *> &NamedDirEnt =
229 DirEntries.GetOrCreateValue(NameStart, NameEnd);
Mike Stump1eb44332009-09-09 15:08:12 +0000230
Reid Spencer5f016e22007-07-11 17:01:13 +0000231 // See if there is already an entry in the map.
232 if (NamedDirEnt.getValue())
Ted Kremenek3d2da3d2008-01-11 20:42:05 +0000233 return NamedDirEnt.getValue() == NON_EXISTENT_DIR
Reid Spencer5f016e22007-07-11 17:01:13 +0000234 ? 0 : NamedDirEnt.getValue();
Mike Stump1eb44332009-09-09 15:08:12 +0000235
Reid Spencer5f016e22007-07-11 17:01:13 +0000236 ++NumDirCacheMisses;
Mike Stump1eb44332009-09-09 15:08:12 +0000237
Reid Spencer5f016e22007-07-11 17:01:13 +0000238 // By default, initialize it to invalid.
Ted Kremenek3d2da3d2008-01-11 20:42:05 +0000239 NamedDirEnt.setValue(NON_EXISTENT_DIR);
Mike Stump1eb44332009-09-09 15:08:12 +0000240
Reid Spencer5f016e22007-07-11 17:01:13 +0000241 // Get the null-terminated directory name as stored as the key of the
242 // DirEntries map.
243 const char *InterndDirName = NamedDirEnt.getKeyData();
Mike Stump1eb44332009-09-09 15:08:12 +0000244
Reid Spencer5f016e22007-07-11 17:01:13 +0000245 // Check to see if the directory exists.
246 struct stat StatBuf;
Ted Kremenekfc7052d2009-02-12 00:39:05 +0000247 if (stat_cached(InterndDirName, &StatBuf) || // Error stat'ing.
Reid Spencer5f016e22007-07-11 17:01:13 +0000248 !S_ISDIR(StatBuf.st_mode)) // Not a directory?
249 return 0;
Ted Kremenek6bb816a2008-02-24 03:15:25 +0000250
Reid Spencer5f016e22007-07-11 17:01:13 +0000251 // It exists. See if we have already opened a directory with the same inode.
Mike Stump1eb44332009-09-09 15:08:12 +0000252 // This occurs when one dir is symlinked to another, for example.
Ted Kremenek6bb816a2008-02-24 03:15:25 +0000253 DirectoryEntry &UDE = UniqueDirs.getDirectory(InterndDirName, StatBuf);
Mike Stump1eb44332009-09-09 15:08:12 +0000254
Reid Spencer5f016e22007-07-11 17:01:13 +0000255 NamedDirEnt.setValue(&UDE);
256 if (UDE.getName()) // Already have an entry with this inode, return it.
257 return &UDE;
Mike Stump1eb44332009-09-09 15:08:12 +0000258
Reid Spencer5f016e22007-07-11 17:01:13 +0000259 // Otherwise, we don't have this directory yet, add it. We use the string
260 // key from the DirEntries map as the string.
261 UDE.Name = InterndDirName;
262 return &UDE;
263}
264
/// NON_EXISTENT_FILE - Sentinel pointer value, different from null, that marks
/// a filename which has been looked up and found not to exist on disk.
#define NON_EXISTENT_FILE \
  reinterpret_cast<FileEntry*>(static_cast<intptr_t>(-1))
Reid Spencer5f016e22007-07-11 17:01:13 +0000268
269/// getFile - Lookup, cache, and verify the specified file. This returns null
270/// if the file doesn't exist.
Mike Stump1eb44332009-09-09 15:08:12 +0000271///
Reid Spencer5f016e22007-07-11 17:01:13 +0000272const FileEntry *FileManager::getFile(const char *NameStart,
273 const char *NameEnd) {
274 ++NumFileLookups;
Mike Stump1eb44332009-09-09 15:08:12 +0000275
Reid Spencer5f016e22007-07-11 17:01:13 +0000276 // See if there is already an entry in the map.
277 llvm::StringMapEntry<FileEntry *> &NamedFileEnt =
278 FileEntries.GetOrCreateValue(NameStart, NameEnd);
279
280 // See if there is already an entry in the map.
281 if (NamedFileEnt.getValue())
Ted Kremenek3d2da3d2008-01-11 20:42:05 +0000282 return NamedFileEnt.getValue() == NON_EXISTENT_FILE
Reid Spencer5f016e22007-07-11 17:01:13 +0000283 ? 0 : NamedFileEnt.getValue();
Mike Stump1eb44332009-09-09 15:08:12 +0000284
Reid Spencer5f016e22007-07-11 17:01:13 +0000285 ++NumFileCacheMisses;
286
287 // By default, initialize it to invalid.
Ted Kremenek3d2da3d2008-01-11 20:42:05 +0000288 NamedFileEnt.setValue(NON_EXISTENT_FILE);
Reid Spencer5f016e22007-07-11 17:01:13 +0000289
Mike Stump1eb44332009-09-09 15:08:12 +0000290
Reid Spencer5f016e22007-07-11 17:01:13 +0000291 // Get the null-terminated file name as stored as the key of the
292 // FileEntries map.
293 const char *InterndFileName = NamedFileEnt.getKeyData();
Mike Stump1eb44332009-09-09 15:08:12 +0000294
Douglas Gregor057e5672009-12-02 18:12:28 +0000295 const DirectoryEntry *DirInfo
296 = getDirectoryFromFile(*this, NameStart, NameEnd);
297 if (DirInfo == 0) // Directory doesn't exist, file can't exist.
298 return 0;
299
Reid Spencer5f016e22007-07-11 17:01:13 +0000300 // FIXME: Use the directory info to prune this, before doing the stat syscall.
301 // FIXME: This will reduce the # syscalls.
Mike Stump1eb44332009-09-09 15:08:12 +0000302
Reid Spencer5f016e22007-07-11 17:01:13 +0000303 // Nope, there isn't. Check to see if the file exists.
304 struct stat StatBuf;
Benjamin Kramer6cb7c1a2009-08-23 12:08:50 +0000305 //llvm::errs() << "STATING: " << Filename;
Ted Kremenekfc7052d2009-02-12 00:39:05 +0000306 if (stat_cached(InterndFileName, &StatBuf) || // Error stat'ing.
307 S_ISDIR(StatBuf.st_mode)) { // A directory?
Reid Spencer5f016e22007-07-11 17:01:13 +0000308 // If this file doesn't exist, we leave a null in FileEntries for this path.
Benjamin Kramer6cb7c1a2009-08-23 12:08:50 +0000309 //llvm::errs() << ": Not existing\n";
Reid Spencer5f016e22007-07-11 17:01:13 +0000310 return 0;
311 }
Benjamin Kramer6cb7c1a2009-08-23 12:08:50 +0000312 //llvm::errs() << ": exists\n";
Mike Stump1eb44332009-09-09 15:08:12 +0000313
Ted Kremenekbca6d122007-12-18 22:29:39 +0000314 // It exists. See if we have already opened a file with the same inode.
Reid Spencer5f016e22007-07-11 17:01:13 +0000315 // This occurs when one dir is symlinked to another, for example.
Ted Kremenek6bb816a2008-02-24 03:15:25 +0000316 FileEntry &UFE = UniqueFiles.getFile(InterndFileName, StatBuf);
Mike Stump1eb44332009-09-09 15:08:12 +0000317
Reid Spencer5f016e22007-07-11 17:01:13 +0000318 NamedFileEnt.setValue(&UFE);
319 if (UFE.getName()) // Already have an entry with this inode, return it.
320 return &UFE;
321
322 // Otherwise, we don't have this directory yet, add it.
323 // FIXME: Change the name to be a char* that points back to the 'FileEntries'
324 // key.
325 UFE.Name = InterndFileName;
326 UFE.Size = StatBuf.st_size;
327 UFE.ModTime = StatBuf.st_mtime;
328 UFE.Dir = DirInfo;
329 UFE.UID = NextFileUID++;
330 return &UFE;
331}
332
Douglas Gregor057e5672009-12-02 18:12:28 +0000333const FileEntry *
334FileManager::getVirtualFile(const llvm::StringRef &Filename,
335 off_t Size, time_t ModificationTime) {
336 const char *NameStart = Filename.begin(), *NameEnd = Filename.end();
337
338 ++NumFileLookups;
339
340 // See if there is already an entry in the map.
341 llvm::StringMapEntry<FileEntry *> &NamedFileEnt =
342 FileEntries.GetOrCreateValue(NameStart, NameEnd);
343
344 // See if there is already an entry in the map.
345 if (NamedFileEnt.getValue())
346 return NamedFileEnt.getValue() == NON_EXISTENT_FILE
347 ? 0 : NamedFileEnt.getValue();
348
349 ++NumFileCacheMisses;
350
351 // By default, initialize it to invalid.
352 NamedFileEnt.setValue(NON_EXISTENT_FILE);
353
354 const DirectoryEntry *DirInfo
355 = getDirectoryFromFile(*this, NameStart, NameEnd);
356 if (DirInfo == 0) // Directory doesn't exist, file can't exist.
357 return 0;
358
359 FileEntry *UFE = new FileEntry();
360 VirtualFileEntries.push_back(UFE);
361 NamedFileEnt.setValue(UFE);
362
363 UFE->Name = NamedFileEnt.getKeyData();
364 UFE->Size = Size;
365 UFE->ModTime = ModificationTime;
366 UFE->Dir = DirInfo;
367 UFE->UID = NextFileUID++;
368 return UFE;
369}
370
Reid Spencer5f016e22007-07-11 17:01:13 +0000371void FileManager::PrintStats() const {
Benjamin Kramer6cb7c1a2009-08-23 12:08:50 +0000372 llvm::errs() << "\n*** File Manager Stats:\n";
373 llvm::errs() << UniqueFiles.size() << " files found, "
374 << UniqueDirs.size() << " dirs found.\n";
375 llvm::errs() << NumDirLookups << " dir lookups, "
376 << NumDirCacheMisses << " dir cache misses.\n";
377 llvm::errs() << NumFileLookups << " file lookups, "
378 << NumFileCacheMisses << " file cache misses.\n";
Mike Stump1eb44332009-09-09 15:08:12 +0000379
Benjamin Kramer6cb7c1a2009-08-23 12:08:50 +0000380 //llvm::errs() << PagesMapped << BytesOfPagesMapped << FSLookups;
Reid Spencer5f016e22007-07-11 17:01:13 +0000381}
Douglas Gregor4fed3f42009-04-27 18:38:38 +0000382
383int MemorizeStatCalls::stat(const char *path, struct stat *buf) {
Douglas Gregor52e71082009-10-16 18:18:30 +0000384 int result = StatSysCallCache::stat(path, buf);
385
Daniel Dunbar475ddb42009-12-11 00:27:20 +0000386 // Do not cache failed stats, it is easy to construct common inconsistent
387 // situations if we do, and they are not important for PCH performance (which
388 // currently only needs the stats to construct the initial FileManager
389 // entries).
390 if (result != 0)
391 return result;
392
393 // Cache file 'stat' results and directories with absolutely paths.
394 if (!S_ISDIR(buf->st_mode) || llvm::sys::Path(path).isAbsolute())
Douglas Gregor4fed3f42009-04-27 18:38:38 +0000395 StatCalls[path] = StatResult(result, *buf);
Mike Stump1eb44332009-09-09 15:08:12 +0000396
397 return result;
Douglas Gregor4fed3f42009-04-27 18:38:38 +0000398}