FileManager.cpp revision 475ddb4547ce35706ce1ff54b14bdcfdc51954c2
1///===--- FileManager.cpp - File System Probing and Caching ----------------===// 2// 3// The LLVM Compiler Infrastructure 4// 5// This file is distributed under the University of Illinois Open Source 6// License. See LICENSE.TXT for details. 7// 8//===----------------------------------------------------------------------===// 9// 10// This file implements the FileManager interface. 11// 12//===----------------------------------------------------------------------===// 13// 14// TODO: This should index all interesting directories with dirent calls. 15// getdirentries ? 16// opendir/readdir_r/closedir ? 17// 18//===----------------------------------------------------------------------===// 19 20#include "clang/Basic/FileManager.h" 21#include "llvm/ADT/SmallString.h" 22#include "llvm/Support/raw_ostream.h" 23#include "llvm/System/Path.h" 24#include "llvm/Config/config.h" 25#include <map> 26#include <set> 27#include <string> 28using namespace clang; 29 30// FIXME: Enhance libsystem to support inode and other fields. 31#include <sys/stat.h> 32 33#if defined(_MSC_VER) 34#define S_ISDIR(s) (_S_IFDIR & s) 35#endif 36 37/// NON_EXISTENT_DIR - A special value distinct from null that is used to 38/// represent a dir name that doesn't exist on the disk. 39#define NON_EXISTENT_DIR reinterpret_cast<DirectoryEntry*>((intptr_t)-1) 40 41//===----------------------------------------------------------------------===// 42// Windows. 43//===----------------------------------------------------------------------===// 44 45#ifdef LLVM_ON_WIN32 46 47#define IS_DIR_SEPARATOR_CHAR(x) ((x) == '/' || (x) == '\\') 48 49namespace { 50 static std::string GetFullPath(const char *relPath) { 51 char *absPathStrPtr = _fullpath(NULL, relPath, 0); 52 assert(absPathStrPtr && "_fullpath() returned NULL!"); 53 54 std::string absPath(absPathStrPtr); 55 56 free(absPathStrPtr); 57 return absPath; 58 } 59} 60 61class FileManager::UniqueDirContainer { 62 /// UniqueDirs - Cache from full path to existing directories/files. 63 /// 64 llvm::StringMap<DirectoryEntry> UniqueDirs; 65 66public: 67 DirectoryEntry &getDirectory(const char *Name, struct stat &StatBuf) { 68 std::string FullPath(GetFullPath(Name)); 69 return UniqueDirs.GetOrCreateValue( 70 FullPath.c_str(), 71 FullPath.c_str() + FullPath.size() 72 ).getValue(); 73 } 74 75 size_t size() { return UniqueDirs.size(); } 76}; 77 78class FileManager::UniqueFileContainer { 79 /// UniqueFiles - Cache from full path to existing directories/files. 80 /// 81 llvm::StringMap<FileEntry, llvm::BumpPtrAllocator> UniqueFiles; 82 83public: 84 FileEntry &getFile(const char *Name, struct stat &StatBuf) { 85 std::string FullPath(GetFullPath(Name)); 86 return UniqueFiles.GetOrCreateValue( 87 FullPath.c_str(), 88 FullPath.c_str() + FullPath.size() 89 ).getValue(); 90 } 91 92 size_t size() { return UniqueFiles.size(); } 93}; 94 95//===----------------------------------------------------------------------===// 96// Unix-like Systems. 97//===----------------------------------------------------------------------===// 98 99#else 100 101#define IS_DIR_SEPARATOR_CHAR(x) ((x) == '/') 102 103class FileManager::UniqueDirContainer { 104 /// UniqueDirs - Cache from ID's to existing directories/files. 105 /// 106 std::map<std::pair<dev_t, ino_t>, DirectoryEntry> UniqueDirs; 107 108public: 109 DirectoryEntry &getDirectory(const char *Name, struct stat &StatBuf) { 110 return UniqueDirs[std::make_pair(StatBuf.st_dev, StatBuf.st_ino)]; 111 } 112 113 size_t size() { return UniqueDirs.size(); } 114}; 115 116class FileManager::UniqueFileContainer { 117 /// UniqueFiles - Cache from ID's to existing directories/files. 118 /// 119 std::set<FileEntry> UniqueFiles; 120 121public: 122 FileEntry &getFile(const char *Name, struct stat &StatBuf) { 123 return 124 const_cast<FileEntry&>( 125 *UniqueFiles.insert(FileEntry(StatBuf.st_dev, 126 StatBuf.st_ino, 127 StatBuf.st_mode)).first); 128 } 129 130 size_t size() { return UniqueFiles.size(); } 131}; 132 133#endif 134 135//===----------------------------------------------------------------------===// 136// Common logic. 137//===----------------------------------------------------------------------===// 138 139FileManager::FileManager() 140 : UniqueDirs(*new UniqueDirContainer), 141 UniqueFiles(*new UniqueFileContainer), 142 DirEntries(64), FileEntries(64), NextFileUID(0) { 143 NumDirLookups = NumFileLookups = 0; 144 NumDirCacheMisses = NumFileCacheMisses = 0; 145} 146 147FileManager::~FileManager() { 148 delete &UniqueDirs; 149 delete &UniqueFiles; 150 for (llvm::SmallVectorImpl<FileEntry *>::iterator 151 V = VirtualFileEntries.begin(), 152 VEnd = VirtualFileEntries.end(); 153 V != VEnd; 154 ++V) 155 delete *V; 156} 157 158void FileManager::addStatCache(StatSysCallCache *statCache, bool AtBeginning) { 159 assert(statCache && "No stat cache provided?"); 160 if (AtBeginning || StatCache.get() == 0) { 161 statCache->setNextStatCache(StatCache.take()); 162 StatCache.reset(statCache); 163 return; 164 } 165 166 StatSysCallCache *LastCache = StatCache.get(); 167 while (LastCache->getNextStatCache()) 168 LastCache = LastCache->getNextStatCache(); 169 170 LastCache->setNextStatCache(statCache); 171} 172 173void FileManager::removeStatCache(StatSysCallCache *statCache) { 174 if (!statCache) 175 return; 176 177 if (StatCache.get() == statCache) { 178 // This is the first stat cache. 179 StatCache.reset(StatCache->takeNextStatCache()); 180 return; 181 } 182 183 // Find the stat cache in the list. 184 StatSysCallCache *PrevCache = StatCache.get(); 185 while (PrevCache && PrevCache->getNextStatCache() != statCache) 186 PrevCache = PrevCache->getNextStatCache(); 187 if (PrevCache) 188 PrevCache->setNextStatCache(statCache->getNextStatCache()); 189 else 190 assert(false && "Stat cache not found for removal"); 191} 192 193/// \brief Retrieve the directory that the given file name resides in. 194static const DirectoryEntry *getDirectoryFromFile(FileManager &FileMgr, 195 const char *NameStart, 196 const char *NameEnd) { 197 // Figure out what directory it is in. If the string contains a / in it, 198 // strip off everything after it. 199 // FIXME: this logic should be in sys::Path. 200 const char *SlashPos = NameEnd-1; 201 while (SlashPos >= NameStart && !IS_DIR_SEPARATOR_CHAR(SlashPos[0])) 202 --SlashPos; 203 // Ignore duplicate //'s. 204 while (SlashPos > NameStart && IS_DIR_SEPARATOR_CHAR(SlashPos[-1])) 205 --SlashPos; 206 207 if (SlashPos < NameStart) { 208 // Use the current directory if file has no path component. 209 const char *Name = "."; 210 return FileMgr.getDirectory(Name, Name+1); 211 } else if (SlashPos == NameEnd-1) 212 return 0; // If filename ends with a /, it's a directory. 213 else 214 return FileMgr.getDirectory(NameStart, SlashPos); 215} 216 217/// getDirectory - Lookup, cache, and verify the specified directory. This 218/// returns null if the directory doesn't exist. 219/// 220const DirectoryEntry *FileManager::getDirectory(const char *NameStart, 221 const char *NameEnd) { 222 ++NumDirLookups; 223 llvm::StringMapEntry<DirectoryEntry *> &NamedDirEnt = 224 DirEntries.GetOrCreateValue(NameStart, NameEnd); 225 226 // See if there is already an entry in the map. 227 if (NamedDirEnt.getValue()) 228 return NamedDirEnt.getValue() == NON_EXISTENT_DIR 229 ? 0 : NamedDirEnt.getValue(); 230 231 ++NumDirCacheMisses; 232 233 // By default, initialize it to invalid. 234 NamedDirEnt.setValue(NON_EXISTENT_DIR); 235 236 // Get the null-terminated directory name as stored as the key of the 237 // DirEntries map. 238 const char *InterndDirName = NamedDirEnt.getKeyData(); 239 240 // Check to see if the directory exists. 241 struct stat StatBuf; 242 if (stat_cached(InterndDirName, &StatBuf) || // Error stat'ing. 243 !S_ISDIR(StatBuf.st_mode)) // Not a directory? 244 return 0; 245 246 // It exists. See if we have already opened a directory with the same inode. 247 // This occurs when one dir is symlinked to another, for example. 248 DirectoryEntry &UDE = UniqueDirs.getDirectory(InterndDirName, StatBuf); 249 250 NamedDirEnt.setValue(&UDE); 251 if (UDE.getName()) // Already have an entry with this inode, return it. 252 return &UDE; 253 254 // Otherwise, we don't have this directory yet, add it. We use the string 255 // key from the DirEntries map as the string. 256 UDE.Name = InterndDirName; 257 return &UDE; 258} 259 260/// NON_EXISTENT_FILE - A special value distinct from null that is used to 261/// represent a filename that doesn't exist on the disk. 262#define NON_EXISTENT_FILE reinterpret_cast<FileEntry*>((intptr_t)-1) 263 264/// getFile - Lookup, cache, and verify the specified file. This returns null 265/// if the file doesn't exist. 266/// 267const FileEntry *FileManager::getFile(const char *NameStart, 268 const char *NameEnd) { 269 ++NumFileLookups; 270 271 // See if there is already an entry in the map. 272 llvm::StringMapEntry<FileEntry *> &NamedFileEnt = 273 FileEntries.GetOrCreateValue(NameStart, NameEnd); 274 275 // See if there is already an entry in the map. 276 if (NamedFileEnt.getValue()) 277 return NamedFileEnt.getValue() == NON_EXISTENT_FILE 278 ? 0 : NamedFileEnt.getValue(); 279 280 ++NumFileCacheMisses; 281 282 // By default, initialize it to invalid. 283 NamedFileEnt.setValue(NON_EXISTENT_FILE); 284 285 286 // Get the null-terminated file name as stored as the key of the 287 // FileEntries map. 288 const char *InterndFileName = NamedFileEnt.getKeyData(); 289 290 const DirectoryEntry *DirInfo 291 = getDirectoryFromFile(*this, NameStart, NameEnd); 292 if (DirInfo == 0) // Directory doesn't exist, file can't exist. 293 return 0; 294 295 // FIXME: Use the directory info to prune this, before doing the stat syscall. 296 // FIXME: This will reduce the # syscalls. 297 298 // Nope, there isn't. Check to see if the file exists. 299 struct stat StatBuf; 300 //llvm::errs() << "STATING: " << Filename; 301 if (stat_cached(InterndFileName, &StatBuf) || // Error stat'ing. 302 S_ISDIR(StatBuf.st_mode)) { // A directory? 303 // If this file doesn't exist, we leave a null in FileEntries for this path. 304 //llvm::errs() << ": Not existing\n"; 305 return 0; 306 } 307 //llvm::errs() << ": exists\n"; 308 309 // It exists. See if we have already opened a file with the same inode. 310 // This occurs when one dir is symlinked to another, for example. 311 FileEntry &UFE = UniqueFiles.getFile(InterndFileName, StatBuf); 312 313 NamedFileEnt.setValue(&UFE); 314 if (UFE.getName()) // Already have an entry with this inode, return it. 315 return &UFE; 316 317 // Otherwise, we don't have this directory yet, add it. 318 // FIXME: Change the name to be a char* that points back to the 'FileEntries' 319 // key. 320 UFE.Name = InterndFileName; 321 UFE.Size = StatBuf.st_size; 322 UFE.ModTime = StatBuf.st_mtime; 323 UFE.Dir = DirInfo; 324 UFE.UID = NextFileUID++; 325 return &UFE; 326} 327 328const FileEntry * 329FileManager::getVirtualFile(const llvm::StringRef &Filename, 330 off_t Size, time_t ModificationTime) { 331 const char *NameStart = Filename.begin(), *NameEnd = Filename.end(); 332 333 ++NumFileLookups; 334 335 // See if there is already an entry in the map. 336 llvm::StringMapEntry<FileEntry *> &NamedFileEnt = 337 FileEntries.GetOrCreateValue(NameStart, NameEnd); 338 339 // See if there is already an entry in the map. 340 if (NamedFileEnt.getValue()) 341 return NamedFileEnt.getValue() == NON_EXISTENT_FILE 342 ? 0 : NamedFileEnt.getValue(); 343 344 ++NumFileCacheMisses; 345 346 // By default, initialize it to invalid. 347 NamedFileEnt.setValue(NON_EXISTENT_FILE); 348 349 const DirectoryEntry *DirInfo 350 = getDirectoryFromFile(*this, NameStart, NameEnd); 351 if (DirInfo == 0) // Directory doesn't exist, file can't exist. 352 return 0; 353 354 FileEntry *UFE = new FileEntry(); 355 VirtualFileEntries.push_back(UFE); 356 NamedFileEnt.setValue(UFE); 357 358 UFE->Name = NamedFileEnt.getKeyData(); 359 UFE->Size = Size; 360 UFE->ModTime = ModificationTime; 361 UFE->Dir = DirInfo; 362 UFE->UID = NextFileUID++; 363 return UFE; 364} 365 366void FileManager::PrintStats() const { 367 llvm::errs() << "\n*** File Manager Stats:\n"; 368 llvm::errs() << UniqueFiles.size() << " files found, " 369 << UniqueDirs.size() << " dirs found.\n"; 370 llvm::errs() << NumDirLookups << " dir lookups, " 371 << NumDirCacheMisses << " dir cache misses.\n"; 372 llvm::errs() << NumFileLookups << " file lookups, " 373 << NumFileCacheMisses << " file cache misses.\n"; 374 375 //llvm::errs() << PagesMapped << BytesOfPagesMapped << FSLookups; 376} 377 378int MemorizeStatCalls::stat(const char *path, struct stat *buf) { 379 int result = StatSysCallCache::stat(path, buf); 380 381 // Do not cache failed stats, it is easy to construct common inconsistent 382 // situations if we do, and they are not important for PCH performance (which 383 // currently only needs the stats to construct the initial FileManager 384 // entries). 385 if (result != 0) 386 return result; 387 388 // Cache file 'stat' results and directories with absolutely paths. 389 if (!S_ISDIR(buf->st_mode) || llvm::sys::Path(path).isAbsolute()) 390 StatCalls[path] = StatResult(result, *buf); 391 392 return result; 393} 394