17a51313dSChris Lattner ///===--- FileManager.cpp - File System Probing and Caching ----------------===// 27a51313dSChris Lattner // 37a51313dSChris Lattner // The LLVM Compiler Infrastructure 47a51313dSChris Lattner // 57a51313dSChris Lattner // This file is distributed under the University of Illinois Open Source 67a51313dSChris Lattner // License. See LICENSE.TXT for details. 77a51313dSChris Lattner // 87a51313dSChris Lattner //===----------------------------------------------------------------------===// 97a51313dSChris Lattner // 107a51313dSChris Lattner // This file implements the FileManager interface. 117a51313dSChris Lattner // 127a51313dSChris Lattner //===----------------------------------------------------------------------===// 137a51313dSChris Lattner // 147a51313dSChris Lattner // TODO: This should index all interesting directories with dirent calls. 157a51313dSChris Lattner // getdirentries ? 167a51313dSChris Lattner // opendir/readdir_r/closedir ? 177a51313dSChris Lattner // 187a51313dSChris Lattner //===----------------------------------------------------------------------===// 197a51313dSChris Lattner 207a51313dSChris Lattner #include "clang/Basic/FileManager.h" 217a51313dSChris Lattner #include "llvm/ADT/SmallString.h" 223441b4f7SChris Lattner #include "llvm/Support/raw_ostream.h" 23c5046832SDouglas Gregor #include "llvm/System/Path.h" 247a51313dSChris Lattner #include "llvm/Config/config.h" 2526db6481SBenjamin Kramer #include <map> 2626db6481SBenjamin Kramer #include <set> 2726db6481SBenjamin Kramer #include <string> 287a51313dSChris Lattner using namespace clang; 297a51313dSChris Lattner 307a51313dSChris Lattner // FIXME: Enhance libsystem to support inode and other fields. 317a51313dSChris Lattner #include <sys/stat.h> 327a51313dSChris Lattner 337a51313dSChris Lattner #if defined(_MSC_VER) 34882018b8SChris Lattner #define S_ISDIR(s) (_S_IFDIR & s) 357a51313dSChris Lattner #endif 367a51313dSChris Lattner 377a51313dSChris Lattner /// NON_EXISTENT_DIR - A special value distinct from null that is used to 387a51313dSChris Lattner /// represent a dir name that doesn't exist on the disk. 397a51313dSChris Lattner #define NON_EXISTENT_DIR reinterpret_cast<DirectoryEntry*>((intptr_t)-1) 407a51313dSChris Lattner 415c04bd81STed Kremenek //===----------------------------------------------------------------------===// 425c04bd81STed Kremenek // Windows. 435c04bd81STed Kremenek //===----------------------------------------------------------------------===// 445c04bd81STed Kremenek 457a51313dSChris Lattner #ifdef LLVM_ON_WIN32 467a51313dSChris Lattner 477a51313dSChris Lattner #define IS_DIR_SEPARATOR_CHAR(x) ((x) == '/' || (x) == '\\') 487a51313dSChris Lattner 497a51313dSChris Lattner namespace { 5011289f42SMike Stump static std::string GetFullPath(const char *relPath) { 517a51313dSChris Lattner char *absPathStrPtr = _fullpath(NULL, relPath, 0); 527a51313dSChris Lattner assert(absPathStrPtr && "_fullpath() returned NULL!"); 537a51313dSChris Lattner 547a51313dSChris Lattner std::string absPath(absPathStrPtr); 557a51313dSChris Lattner 567a51313dSChris Lattner free(absPathStrPtr); 577a51313dSChris Lattner return absPath; 587a51313dSChris Lattner } 597a51313dSChris Lattner } 607a51313dSChris Lattner 617a51313dSChris Lattner class FileManager::UniqueDirContainer { 627a51313dSChris Lattner /// UniqueDirs - Cache from full path to existing directories/files. 637a51313dSChris Lattner /// 647a51313dSChris Lattner llvm::StringMap<DirectoryEntry> UniqueDirs; 657a51313dSChris Lattner 667a51313dSChris Lattner public: 677a51313dSChris Lattner DirectoryEntry &getDirectory(const char *Name, struct stat &StatBuf) { 687a51313dSChris Lattner std::string FullPath(GetFullPath(Name)); 697a51313dSChris Lattner return UniqueDirs.GetOrCreateValue( 707a51313dSChris Lattner FullPath.c_str(), 717a51313dSChris Lattner FullPath.c_str() + FullPath.size() 727a51313dSChris Lattner ).getValue(); 737a51313dSChris Lattner } 747a51313dSChris Lattner 757a51313dSChris Lattner size_t size() { return UniqueDirs.size(); } 767a51313dSChris Lattner }; 777a51313dSChris Lattner 787a51313dSChris Lattner class FileManager::UniqueFileContainer { 797a51313dSChris Lattner /// UniqueFiles - Cache from full path to existing directories/files. 807a51313dSChris Lattner /// 811502b7e2STed Kremenek llvm::StringMap<FileEntry, llvm::BumpPtrAllocator> UniqueFiles; 827a51313dSChris Lattner 837a51313dSChris Lattner public: 847a51313dSChris Lattner FileEntry &getFile(const char *Name, struct stat &StatBuf) { 857a51313dSChris Lattner std::string FullPath(GetFullPath(Name)); 867a51313dSChris Lattner return UniqueFiles.GetOrCreateValue( 877a51313dSChris Lattner FullPath.c_str(), 887a51313dSChris Lattner FullPath.c_str() + FullPath.size() 897a51313dSChris Lattner ).getValue(); 907a51313dSChris Lattner } 917a51313dSChris Lattner 927a51313dSChris Lattner size_t size() { return UniqueFiles.size(); } 937a51313dSChris Lattner }; 947a51313dSChris Lattner 955c04bd81STed Kremenek //===----------------------------------------------------------------------===// 965c04bd81STed Kremenek // Unix-like Systems. 975c04bd81STed Kremenek //===----------------------------------------------------------------------===// 985c04bd81STed Kremenek 997a51313dSChris Lattner #else 1007a51313dSChris Lattner 1017a51313dSChris Lattner #define IS_DIR_SEPARATOR_CHAR(x) ((x) == '/') 1027a51313dSChris Lattner 1037a51313dSChris Lattner class FileManager::UniqueDirContainer { 1047a51313dSChris Lattner /// UniqueDirs - Cache from ID's to existing directories/files. 1057a51313dSChris Lattner /// 1067a51313dSChris Lattner std::map<std::pair<dev_t, ino_t>, DirectoryEntry> UniqueDirs; 1077a51313dSChris Lattner 1087a51313dSChris Lattner public: 1097a51313dSChris Lattner DirectoryEntry &getDirectory(const char *Name, struct stat &StatBuf) { 1107a51313dSChris Lattner return UniqueDirs[std::make_pair(StatBuf.st_dev, StatBuf.st_ino)]; 1117a51313dSChris Lattner } 1127a51313dSChris Lattner 1137a51313dSChris Lattner size_t size() { return UniqueDirs.size(); } 1147a51313dSChris Lattner }; 1157a51313dSChris Lattner 1167a51313dSChris Lattner class FileManager::UniqueFileContainer { 1177a51313dSChris Lattner /// UniqueFiles - Cache from ID's to existing directories/files. 1187a51313dSChris Lattner /// 1197a51313dSChris Lattner std::set<FileEntry> UniqueFiles; 1207a51313dSChris Lattner 1217a51313dSChris Lattner public: 1227a51313dSChris Lattner FileEntry &getFile(const char *Name, struct stat &StatBuf) { 1237a51313dSChris Lattner return 1247a51313dSChris Lattner const_cast<FileEntry&>( 1257a51313dSChris Lattner *UniqueFiles.insert(FileEntry(StatBuf.st_dev, 1265d7e2e17STed Kremenek StatBuf.st_ino, 1275d7e2e17STed Kremenek StatBuf.st_mode)).first); 1287a51313dSChris Lattner } 1297a51313dSChris Lattner 1307a51313dSChris Lattner size_t size() { return UniqueFiles.size(); } 1317a51313dSChris Lattner }; 1327a51313dSChris Lattner 1337a51313dSChris Lattner #endif 1347a51313dSChris Lattner 1355c04bd81STed Kremenek //===----------------------------------------------------------------------===// 1365c04bd81STed Kremenek // Common logic. 1375c04bd81STed Kremenek //===----------------------------------------------------------------------===// 1387a51313dSChris Lattner 1395d7e2e17STed Kremenek FileManager::FileManager() 140c8b740eaSTed Kremenek : UniqueDirs(*new UniqueDirContainer), 1417a51313dSChris Lattner UniqueFiles(*new UniqueFileContainer), 1425d7e2e17STed Kremenek DirEntries(64), FileEntries(64), NextFileUID(0) { 1437a51313dSChris Lattner NumDirLookups = NumFileLookups = 0; 1447a51313dSChris Lattner NumDirCacheMisses = NumFileCacheMisses = 0; 1457a51313dSChris Lattner } 1467a51313dSChris Lattner 1477a51313dSChris Lattner FileManager::~FileManager() { 1487a51313dSChris Lattner delete &UniqueDirs; 1497a51313dSChris Lattner delete &UniqueFiles; 1507a51313dSChris Lattner } 1517a51313dSChris Lattner 1527a51313dSChris Lattner /// getDirectory - Lookup, cache, and verify the specified directory. This 1537a51313dSChris Lattner /// returns null if the directory doesn't exist. 1547a51313dSChris Lattner /// 1557a51313dSChris Lattner const DirectoryEntry *FileManager::getDirectory(const char *NameStart, 1567a51313dSChris Lattner const char *NameEnd) { 1577a51313dSChris Lattner ++NumDirLookups; 1587a51313dSChris Lattner llvm::StringMapEntry<DirectoryEntry *> &NamedDirEnt = 1597a51313dSChris Lattner DirEntries.GetOrCreateValue(NameStart, NameEnd); 1607a51313dSChris Lattner 1617a51313dSChris Lattner // See if there is already an entry in the map. 1627a51313dSChris Lattner if (NamedDirEnt.getValue()) 1637a51313dSChris Lattner return NamedDirEnt.getValue() == NON_EXISTENT_DIR 1647a51313dSChris Lattner ? 0 : NamedDirEnt.getValue(); 1657a51313dSChris Lattner 1667a51313dSChris Lattner ++NumDirCacheMisses; 1677a51313dSChris Lattner 1687a51313dSChris Lattner // By default, initialize it to invalid. 1697a51313dSChris Lattner NamedDirEnt.setValue(NON_EXISTENT_DIR); 1707a51313dSChris Lattner 1717a51313dSChris Lattner // Get the null-terminated directory name as stored as the key of the 1727a51313dSChris Lattner // DirEntries map. 1737a51313dSChris Lattner const char *InterndDirName = NamedDirEnt.getKeyData(); 1747a51313dSChris Lattner 1757a51313dSChris Lattner // Check to see if the directory exists. 1767a51313dSChris Lattner struct stat StatBuf; 177c8b740eaSTed Kremenek if (stat_cached(InterndDirName, &StatBuf) || // Error stat'ing. 1787a51313dSChris Lattner !S_ISDIR(StatBuf.st_mode)) // Not a directory? 1797a51313dSChris Lattner return 0; 1807a51313dSChris Lattner 1817a51313dSChris Lattner // It exists. See if we have already opened a directory with the same inode. 1827a51313dSChris Lattner // This occurs when one dir is symlinked to another, for example. 1837a51313dSChris Lattner DirectoryEntry &UDE = UniqueDirs.getDirectory(InterndDirName, StatBuf); 1847a51313dSChris Lattner 1857a51313dSChris Lattner NamedDirEnt.setValue(&UDE); 1867a51313dSChris Lattner if (UDE.getName()) // Already have an entry with this inode, return it. 1877a51313dSChris Lattner return &UDE; 1887a51313dSChris Lattner 1897a51313dSChris Lattner // Otherwise, we don't have this directory yet, add it. We use the string 1907a51313dSChris Lattner // key from the DirEntries map as the string. 1917a51313dSChris Lattner UDE.Name = InterndDirName; 1927a51313dSChris Lattner return &UDE; 1937a51313dSChris Lattner } 1947a51313dSChris Lattner 1957a51313dSChris Lattner /// NON_EXISTENT_FILE - A special value distinct from null that is used to 1967a51313dSChris Lattner /// represent a filename that doesn't exist on the disk. 1977a51313dSChris Lattner #define NON_EXISTENT_FILE reinterpret_cast<FileEntry*>((intptr_t)-1) 1987a51313dSChris Lattner 1997a51313dSChris Lattner /// getFile - Lookup, cache, and verify the specified file. This returns null 2007a51313dSChris Lattner /// if the file doesn't exist. 2017a51313dSChris Lattner /// 2027a51313dSChris Lattner const FileEntry *FileManager::getFile(const char *NameStart, 2037a51313dSChris Lattner const char *NameEnd) { 2047a51313dSChris Lattner ++NumFileLookups; 2057a51313dSChris Lattner 2067a51313dSChris Lattner // See if there is already an entry in the map. 2077a51313dSChris Lattner llvm::StringMapEntry<FileEntry *> &NamedFileEnt = 2087a51313dSChris Lattner FileEntries.GetOrCreateValue(NameStart, NameEnd); 2097a51313dSChris Lattner 2107a51313dSChris Lattner // See if there is already an entry in the map. 2117a51313dSChris Lattner if (NamedFileEnt.getValue()) 2127a51313dSChris Lattner return NamedFileEnt.getValue() == NON_EXISTENT_FILE 2137a51313dSChris Lattner ? 0 : NamedFileEnt.getValue(); 2147a51313dSChris Lattner 2157a51313dSChris Lattner ++NumFileCacheMisses; 2167a51313dSChris Lattner 2177a51313dSChris Lattner // By default, initialize it to invalid. 2187a51313dSChris Lattner NamedFileEnt.setValue(NON_EXISTENT_FILE); 2197a51313dSChris Lattner 2207a51313dSChris Lattner // Figure out what directory it is in. If the string contains a / in it, 2217a51313dSChris Lattner // strip off everything after it. 2227a51313dSChris Lattner // FIXME: this logic should be in sys::Path. 2237a51313dSChris Lattner const char *SlashPos = NameEnd-1; 2247a51313dSChris Lattner while (SlashPos >= NameStart && !IS_DIR_SEPARATOR_CHAR(SlashPos[0])) 2257a51313dSChris Lattner --SlashPos; 22691f5ff6bSChris Lattner // Ignore duplicate //'s. 22791f5ff6bSChris Lattner while (SlashPos > NameStart && IS_DIR_SEPARATOR_CHAR(SlashPos[-1])) 22891f5ff6bSChris Lattner --SlashPos; 2297a51313dSChris Lattner 2307a51313dSChris Lattner const DirectoryEntry *DirInfo; 2317a51313dSChris Lattner if (SlashPos < NameStart) { 2327a51313dSChris Lattner // Use the current directory if file has no path component. 2337a51313dSChris Lattner const char *Name = "."; 2347a51313dSChris Lattner DirInfo = getDirectory(Name, Name+1); 2357a51313dSChris Lattner } else if (SlashPos == NameEnd-1) 2367a51313dSChris Lattner return 0; // If filename ends with a /, it's a directory. 2377a51313dSChris Lattner else 2387a51313dSChris Lattner DirInfo = getDirectory(NameStart, SlashPos); 2397a51313dSChris Lattner 2407a51313dSChris Lattner if (DirInfo == 0) // Directory doesn't exist, file can't exist. 2417a51313dSChris Lattner return 0; 2427a51313dSChris Lattner 2437a51313dSChris Lattner // Get the null-terminated file name as stored as the key of the 2447a51313dSChris Lattner // FileEntries map. 2457a51313dSChris Lattner const char *InterndFileName = NamedFileEnt.getKeyData(); 2467a51313dSChris Lattner 2477a51313dSChris Lattner // FIXME: Use the directory info to prune this, before doing the stat syscall. 2487a51313dSChris Lattner // FIXME: This will reduce the # syscalls. 2497a51313dSChris Lattner 2507a51313dSChris Lattner // Nope, there isn't. Check to see if the file exists. 2517a51313dSChris Lattner struct stat StatBuf; 25289b422c1SBenjamin Kramer //llvm::errs() << "STATING: " << Filename; 253c8b740eaSTed Kremenek if (stat_cached(InterndFileName, &StatBuf) || // Error stat'ing. 2547a51313dSChris Lattner S_ISDIR(StatBuf.st_mode)) { // A directory? 2557a51313dSChris Lattner // If this file doesn't exist, we leave a null in FileEntries for this path. 25689b422c1SBenjamin Kramer //llvm::errs() << ": Not existing\n"; 2577a51313dSChris Lattner return 0; 2587a51313dSChris Lattner } 25989b422c1SBenjamin Kramer //llvm::errs() << ": exists\n"; 2607a51313dSChris Lattner 2617a51313dSChris Lattner // It exists. See if we have already opened a file with the same inode. 2627a51313dSChris Lattner // This occurs when one dir is symlinked to another, for example. 2637a51313dSChris Lattner FileEntry &UFE = UniqueFiles.getFile(InterndFileName, StatBuf); 2647a51313dSChris Lattner 2657a51313dSChris Lattner NamedFileEnt.setValue(&UFE); 2667a51313dSChris Lattner if (UFE.getName()) // Already have an entry with this inode, return it. 2677a51313dSChris Lattner return &UFE; 2687a51313dSChris Lattner 2697a51313dSChris Lattner // Otherwise, we don't have this directory yet, add it. 2707a51313dSChris Lattner // FIXME: Change the name to be a char* that points back to the 'FileEntries' 2717a51313dSChris Lattner // key. 2727a51313dSChris Lattner UFE.Name = InterndFileName; 2737a51313dSChris Lattner UFE.Size = StatBuf.st_size; 2747a51313dSChris Lattner UFE.ModTime = StatBuf.st_mtime; 2757a51313dSChris Lattner UFE.Dir = DirInfo; 2767a51313dSChris Lattner UFE.UID = NextFileUID++; 2777a51313dSChris Lattner return &UFE; 2787a51313dSChris Lattner } 2797a51313dSChris Lattner 2807a51313dSChris Lattner void FileManager::PrintStats() const { 28189b422c1SBenjamin Kramer llvm::errs() << "\n*** File Manager Stats:\n"; 28289b422c1SBenjamin Kramer llvm::errs() << UniqueFiles.size() << " files found, " 2837a51313dSChris Lattner << UniqueDirs.size() << " dirs found.\n"; 28489b422c1SBenjamin Kramer llvm::errs() << NumDirLookups << " dir lookups, " 2857a51313dSChris Lattner << NumDirCacheMisses << " dir cache misses.\n"; 28689b422c1SBenjamin Kramer llvm::errs() << NumFileLookups << " file lookups, " 2877a51313dSChris Lattner << NumFileCacheMisses << " file cache misses.\n"; 2887a51313dSChris Lattner 28989b422c1SBenjamin Kramer //llvm::errs() << PagesMapped << BytesOfPagesMapped << FSLookups; 2907a51313dSChris Lattner } 291c5046832SDouglas Gregor 292c5046832SDouglas Gregor int MemorizeStatCalls::stat(const char *path, struct stat *buf) { 293c5046832SDouglas Gregor int result = ::stat(path, buf); 294c5046832SDouglas Gregor 295c5046832SDouglas Gregor if (result != 0) { 296c5046832SDouglas Gregor // Cache failed 'stat' results. 297c5046832SDouglas Gregor struct stat empty; 298*01ce06fbSChris Lattner memset(&empty, 0, sizeof(empty)); 299c5046832SDouglas Gregor StatCalls[path] = StatResult(result, empty); 300c5046832SDouglas Gregor } 301c5046832SDouglas Gregor else if (!S_ISDIR(buf->st_mode) || llvm::sys::Path(path).isAbsolute()) { 302c5046832SDouglas Gregor // Cache file 'stat' results and directories with absolutely 303c5046832SDouglas Gregor // paths. 304c5046832SDouglas Gregor StatCalls[path] = StatResult(result, *buf); 305c5046832SDouglas Gregor } 306c5046832SDouglas Gregor 307c5046832SDouglas Gregor return result; 308c5046832SDouglas Gregor } 309