17a51313dSChris Lattner ///===--- FileManager.cpp - File System Probing and Caching ----------------===// 27a51313dSChris Lattner // 37a51313dSChris Lattner // The LLVM Compiler Infrastructure 47a51313dSChris Lattner // 57a51313dSChris Lattner // This file is distributed under the University of Illinois Open Source 67a51313dSChris Lattner // License. See LICENSE.TXT for details. 77a51313dSChris Lattner // 87a51313dSChris Lattner //===----------------------------------------------------------------------===// 97a51313dSChris Lattner // 107a51313dSChris Lattner // This file implements the FileManager interface. 117a51313dSChris Lattner // 127a51313dSChris Lattner //===----------------------------------------------------------------------===// 137a51313dSChris Lattner // 147a51313dSChris Lattner // TODO: This should index all interesting directories with dirent calls. 157a51313dSChris Lattner // getdirentries ? 167a51313dSChris Lattner // opendir/readdir_r/closedir ? 177a51313dSChris Lattner // 187a51313dSChris Lattner //===----------------------------------------------------------------------===// 197a51313dSChris Lattner 207a51313dSChris Lattner #include "clang/Basic/FileManager.h" 217a51313dSChris Lattner #include "llvm/ADT/SmallString.h" 22c5046832SDouglas Gregor #include "llvm/System/Path.h" 237a51313dSChris Lattner #include "llvm/Support/Streams.h" 247a51313dSChris Lattner #include "llvm/Config/config.h" 257a51313dSChris Lattner using namespace clang; 267a51313dSChris Lattner 277a51313dSChris Lattner // FIXME: Enhance libsystem to support inode and other fields. 287a51313dSChris Lattner #include <sys/stat.h> 297a51313dSChris Lattner 307a51313dSChris Lattner #if defined(_MSC_VER) 31882018b8SChris Lattner #define S_ISDIR(s) (_S_IFDIR & s) 327a51313dSChris Lattner #endif 337a51313dSChris Lattner 347a51313dSChris Lattner /// NON_EXISTENT_DIR - A special value distinct from null that is used to 357a51313dSChris Lattner /// represent a dir name that doesn't exist on the disk. 367a51313dSChris Lattner #define NON_EXISTENT_DIR reinterpret_cast<DirectoryEntry*>((intptr_t)-1) 377a51313dSChris Lattner 385c04bd81STed Kremenek //===----------------------------------------------------------------------===// 395c04bd81STed Kremenek // Windows. 405c04bd81STed Kremenek //===----------------------------------------------------------------------===// 415c04bd81STed Kremenek 427a51313dSChris Lattner #ifdef LLVM_ON_WIN32 437a51313dSChris Lattner 447a51313dSChris Lattner #define IS_DIR_SEPARATOR_CHAR(x) ((x) == '/' || (x) == '\\') 457a51313dSChris Lattner 467a51313dSChris Lattner namespace { 477a51313dSChris Lattner static std::string GetFullPath(const char *relPath) 487a51313dSChris Lattner { 497a51313dSChris Lattner char *absPathStrPtr = _fullpath(NULL, relPath, 0); 507a51313dSChris Lattner assert(absPathStrPtr && "_fullpath() returned NULL!"); 517a51313dSChris Lattner 527a51313dSChris Lattner std::string absPath(absPathStrPtr); 537a51313dSChris Lattner 547a51313dSChris Lattner free(absPathStrPtr); 557a51313dSChris Lattner return absPath; 567a51313dSChris Lattner } 577a51313dSChris Lattner } 587a51313dSChris Lattner 597a51313dSChris Lattner class FileManager::UniqueDirContainer { 607a51313dSChris Lattner /// UniqueDirs - Cache from full path to existing directories/files. 617a51313dSChris Lattner /// 627a51313dSChris Lattner llvm::StringMap<DirectoryEntry> UniqueDirs; 637a51313dSChris Lattner 647a51313dSChris Lattner public: 657a51313dSChris Lattner DirectoryEntry &getDirectory(const char *Name, struct stat &StatBuf) { 667a51313dSChris Lattner std::string FullPath(GetFullPath(Name)); 677a51313dSChris Lattner return UniqueDirs.GetOrCreateValue( 687a51313dSChris Lattner FullPath.c_str(), 697a51313dSChris Lattner FullPath.c_str() + FullPath.size() 707a51313dSChris Lattner ).getValue(); 717a51313dSChris Lattner } 727a51313dSChris Lattner 737a51313dSChris Lattner size_t size() { return UniqueDirs.size(); } 747a51313dSChris Lattner }; 757a51313dSChris Lattner 767a51313dSChris Lattner class FileManager::UniqueFileContainer { 777a51313dSChris Lattner /// UniqueFiles - Cache from full path to existing directories/files. 787a51313dSChris Lattner /// 791502b7e2STed Kremenek llvm::StringMap<FileEntry, llvm::BumpPtrAllocator> UniqueFiles; 807a51313dSChris Lattner 817a51313dSChris Lattner public: 827a51313dSChris Lattner FileEntry &getFile(const char *Name, struct stat &StatBuf) { 837a51313dSChris Lattner std::string FullPath(GetFullPath(Name)); 847a51313dSChris Lattner return UniqueFiles.GetOrCreateValue( 857a51313dSChris Lattner FullPath.c_str(), 867a51313dSChris Lattner FullPath.c_str() + FullPath.size() 877a51313dSChris Lattner ).getValue(); 887a51313dSChris Lattner } 897a51313dSChris Lattner 907a51313dSChris Lattner size_t size() { return UniqueFiles.size(); } 917a51313dSChris Lattner }; 927a51313dSChris Lattner 935c04bd81STed Kremenek //===----------------------------------------------------------------------===// 945c04bd81STed Kremenek // Unix-like Systems. 955c04bd81STed Kremenek //===----------------------------------------------------------------------===// 965c04bd81STed Kremenek 977a51313dSChris Lattner #else 987a51313dSChris Lattner 997a51313dSChris Lattner #define IS_DIR_SEPARATOR_CHAR(x) ((x) == '/') 1007a51313dSChris Lattner 1017a51313dSChris Lattner class FileManager::UniqueDirContainer { 1027a51313dSChris Lattner /// UniqueDirs - Cache from ID's to existing directories/files. 1037a51313dSChris Lattner /// 1047a51313dSChris Lattner std::map<std::pair<dev_t, ino_t>, DirectoryEntry> UniqueDirs; 1057a51313dSChris Lattner 1067a51313dSChris Lattner public: 1077a51313dSChris Lattner DirectoryEntry &getDirectory(const char *Name, struct stat &StatBuf) { 1087a51313dSChris Lattner return UniqueDirs[std::make_pair(StatBuf.st_dev, StatBuf.st_ino)]; 1097a51313dSChris Lattner } 1107a51313dSChris Lattner 1117a51313dSChris Lattner size_t size() { return UniqueDirs.size(); } 1127a51313dSChris Lattner }; 1137a51313dSChris Lattner 1147a51313dSChris Lattner class FileManager::UniqueFileContainer { 1157a51313dSChris Lattner /// UniqueFiles - Cache from ID's to existing directories/files. 1167a51313dSChris Lattner /// 1177a51313dSChris Lattner std::set<FileEntry> UniqueFiles; 1187a51313dSChris Lattner 1197a51313dSChris Lattner public: 1207a51313dSChris Lattner FileEntry &getFile(const char *Name, struct stat &StatBuf) { 1217a51313dSChris Lattner return 1227a51313dSChris Lattner const_cast<FileEntry&>( 1237a51313dSChris Lattner *UniqueFiles.insert(FileEntry(StatBuf.st_dev, 1245d7e2e17STed Kremenek StatBuf.st_ino, 1255d7e2e17STed Kremenek StatBuf.st_mode)).first); 1267a51313dSChris Lattner } 1277a51313dSChris Lattner 1287a51313dSChris Lattner size_t size() { return UniqueFiles.size(); } 1297a51313dSChris Lattner }; 1307a51313dSChris Lattner 1317a51313dSChris Lattner #endif 1327a51313dSChris Lattner 1335c04bd81STed Kremenek //===----------------------------------------------------------------------===// 1345c04bd81STed Kremenek // Common logic. 1355c04bd81STed Kremenek //===----------------------------------------------------------------------===// 1367a51313dSChris Lattner 1375d7e2e17STed Kremenek FileManager::FileManager() 138c8b740eaSTed Kremenek : UniqueDirs(*new UniqueDirContainer), 1397a51313dSChris Lattner UniqueFiles(*new UniqueFileContainer), 1405d7e2e17STed Kremenek DirEntries(64), FileEntries(64), NextFileUID(0) { 1417a51313dSChris Lattner NumDirLookups = NumFileLookups = 0; 1427a51313dSChris Lattner NumDirCacheMisses = NumFileCacheMisses = 0; 1437a51313dSChris Lattner } 1447a51313dSChris Lattner 1457a51313dSChris Lattner FileManager::~FileManager() { 1467a51313dSChris Lattner delete &UniqueDirs; 1477a51313dSChris Lattner delete &UniqueFiles; 1487a51313dSChris Lattner } 1497a51313dSChris Lattner 1507a51313dSChris Lattner /// getDirectory - Lookup, cache, and verify the specified directory. This 1517a51313dSChris Lattner /// returns null if the directory doesn't exist. 1527a51313dSChris Lattner /// 1537a51313dSChris Lattner const DirectoryEntry *FileManager::getDirectory(const char *NameStart, 1547a51313dSChris Lattner const char *NameEnd) { 1557a51313dSChris Lattner ++NumDirLookups; 1567a51313dSChris Lattner llvm::StringMapEntry<DirectoryEntry *> &NamedDirEnt = 1577a51313dSChris Lattner DirEntries.GetOrCreateValue(NameStart, NameEnd); 1587a51313dSChris Lattner 1597a51313dSChris Lattner // See if there is already an entry in the map. 1607a51313dSChris Lattner if (NamedDirEnt.getValue()) 1617a51313dSChris Lattner return NamedDirEnt.getValue() == NON_EXISTENT_DIR 1627a51313dSChris Lattner ? 0 : NamedDirEnt.getValue(); 1637a51313dSChris Lattner 1647a51313dSChris Lattner ++NumDirCacheMisses; 1657a51313dSChris Lattner 1667a51313dSChris Lattner // By default, initialize it to invalid. 1677a51313dSChris Lattner NamedDirEnt.setValue(NON_EXISTENT_DIR); 1687a51313dSChris Lattner 1697a51313dSChris Lattner // Get the null-terminated directory name as stored as the key of the 1707a51313dSChris Lattner // DirEntries map. 1717a51313dSChris Lattner const char *InterndDirName = NamedDirEnt.getKeyData(); 1727a51313dSChris Lattner 1737a51313dSChris Lattner // Check to see if the directory exists. 1747a51313dSChris Lattner struct stat StatBuf; 175c8b740eaSTed Kremenek if (stat_cached(InterndDirName, &StatBuf) || // Error stat'ing. 1767a51313dSChris Lattner !S_ISDIR(StatBuf.st_mode)) // Not a directory? 1777a51313dSChris Lattner return 0; 1787a51313dSChris Lattner 1797a51313dSChris Lattner // It exists. See if we have already opened a directory with the same inode. 1807a51313dSChris Lattner // This occurs when one dir is symlinked to another, for example. 1817a51313dSChris Lattner DirectoryEntry &UDE = UniqueDirs.getDirectory(InterndDirName, StatBuf); 1827a51313dSChris Lattner 1837a51313dSChris Lattner NamedDirEnt.setValue(&UDE); 1847a51313dSChris Lattner if (UDE.getName()) // Already have an entry with this inode, return it. 1857a51313dSChris Lattner return &UDE; 1867a51313dSChris Lattner 1877a51313dSChris Lattner // Otherwise, we don't have this directory yet, add it. We use the string 1887a51313dSChris Lattner // key from the DirEntries map as the string. 1897a51313dSChris Lattner UDE.Name = InterndDirName; 1907a51313dSChris Lattner return &UDE; 1917a51313dSChris Lattner } 1927a51313dSChris Lattner 1937a51313dSChris Lattner /// NON_EXISTENT_FILE - A special value distinct from null that is used to 1947a51313dSChris Lattner /// represent a filename that doesn't exist on the disk. 1957a51313dSChris Lattner #define NON_EXISTENT_FILE reinterpret_cast<FileEntry*>((intptr_t)-1) 1967a51313dSChris Lattner 1977a51313dSChris Lattner /// getFile - Lookup, cache, and verify the specified file. This returns null 1987a51313dSChris Lattner /// if the file doesn't exist. 1997a51313dSChris Lattner /// 2007a51313dSChris Lattner const FileEntry *FileManager::getFile(const char *NameStart, 2017a51313dSChris Lattner const char *NameEnd) { 2027a51313dSChris Lattner ++NumFileLookups; 2037a51313dSChris Lattner 2047a51313dSChris Lattner // See if there is already an entry in the map. 2057a51313dSChris Lattner llvm::StringMapEntry<FileEntry *> &NamedFileEnt = 2067a51313dSChris Lattner FileEntries.GetOrCreateValue(NameStart, NameEnd); 2077a51313dSChris Lattner 2087a51313dSChris Lattner // See if there is already an entry in the map. 2097a51313dSChris Lattner if (NamedFileEnt.getValue()) 2107a51313dSChris Lattner return NamedFileEnt.getValue() == NON_EXISTENT_FILE 2117a51313dSChris Lattner ? 0 : NamedFileEnt.getValue(); 2127a51313dSChris Lattner 2137a51313dSChris Lattner ++NumFileCacheMisses; 2147a51313dSChris Lattner 2157a51313dSChris Lattner // By default, initialize it to invalid. 2167a51313dSChris Lattner NamedFileEnt.setValue(NON_EXISTENT_FILE); 2177a51313dSChris Lattner 2187a51313dSChris Lattner // Figure out what directory it is in. If the string contains a / in it, 2197a51313dSChris Lattner // strip off everything after it. 2207a51313dSChris Lattner // FIXME: this logic should be in sys::Path. 2217a51313dSChris Lattner const char *SlashPos = NameEnd-1; 2227a51313dSChris Lattner while (SlashPos >= NameStart && !IS_DIR_SEPARATOR_CHAR(SlashPos[0])) 2237a51313dSChris Lattner --SlashPos; 224*91f5ff6bSChris Lattner // Ignore duplicate //'s. 225*91f5ff6bSChris Lattner while (SlashPos > NameStart && IS_DIR_SEPARATOR_CHAR(SlashPos[-1])) 226*91f5ff6bSChris Lattner --SlashPos; 2277a51313dSChris Lattner 2287a51313dSChris Lattner const DirectoryEntry *DirInfo; 2297a51313dSChris Lattner if (SlashPos < NameStart) { 2307a51313dSChris Lattner // Use the current directory if file has no path component. 2317a51313dSChris Lattner const char *Name = "."; 2327a51313dSChris Lattner DirInfo = getDirectory(Name, Name+1); 2337a51313dSChris Lattner } else if (SlashPos == NameEnd-1) 2347a51313dSChris Lattner return 0; // If filename ends with a /, it's a directory. 2357a51313dSChris Lattner else 2367a51313dSChris Lattner DirInfo = getDirectory(NameStart, SlashPos); 2377a51313dSChris Lattner 2387a51313dSChris Lattner if (DirInfo == 0) // Directory doesn't exist, file can't exist. 2397a51313dSChris Lattner return 0; 2407a51313dSChris Lattner 2417a51313dSChris Lattner // Get the null-terminated file name as stored as the key of the 2427a51313dSChris Lattner // FileEntries map. 2437a51313dSChris Lattner const char *InterndFileName = NamedFileEnt.getKeyData(); 2447a51313dSChris Lattner 2457a51313dSChris Lattner // FIXME: Use the directory info to prune this, before doing the stat syscall. 2467a51313dSChris Lattner // FIXME: This will reduce the # syscalls. 2477a51313dSChris Lattner 2487a51313dSChris Lattner // Nope, there isn't. Check to see if the file exists. 2497a51313dSChris Lattner struct stat StatBuf; 2507a51313dSChris Lattner //llvm::cerr << "STATING: " << Filename; 251c8b740eaSTed Kremenek if (stat_cached(InterndFileName, &StatBuf) || // Error stat'ing. 2527a51313dSChris Lattner S_ISDIR(StatBuf.st_mode)) { // A directory? 2537a51313dSChris Lattner // If this file doesn't exist, we leave a null in FileEntries for this path. 2547a51313dSChris Lattner //llvm::cerr << ": Not existing\n"; 2557a51313dSChris Lattner return 0; 2567a51313dSChris Lattner } 2577a51313dSChris Lattner //llvm::cerr << ": exists\n"; 2587a51313dSChris Lattner 2597a51313dSChris Lattner // It exists. See if we have already opened a file with the same inode. 2607a51313dSChris Lattner // This occurs when one dir is symlinked to another, for example. 2617a51313dSChris Lattner FileEntry &UFE = UniqueFiles.getFile(InterndFileName, StatBuf); 2627a51313dSChris Lattner 2637a51313dSChris Lattner NamedFileEnt.setValue(&UFE); 2647a51313dSChris Lattner if (UFE.getName()) // Already have an entry with this inode, return it. 2657a51313dSChris Lattner return &UFE; 2667a51313dSChris Lattner 2677a51313dSChris Lattner // Otherwise, we don't have this directory yet, add it. 2687a51313dSChris Lattner // FIXME: Change the name to be a char* that points back to the 'FileEntries' 2697a51313dSChris Lattner // key. 2707a51313dSChris Lattner UFE.Name = InterndFileName; 2717a51313dSChris Lattner UFE.Size = StatBuf.st_size; 2727a51313dSChris Lattner UFE.ModTime = StatBuf.st_mtime; 2737a51313dSChris Lattner UFE.Dir = DirInfo; 2747a51313dSChris Lattner UFE.UID = NextFileUID++; 2757a51313dSChris Lattner return &UFE; 2767a51313dSChris Lattner } 2777a51313dSChris Lattner 2787a51313dSChris Lattner void FileManager::PrintStats() const { 2797a51313dSChris Lattner llvm::cerr << "\n*** File Manager Stats:\n"; 2807a51313dSChris Lattner llvm::cerr << UniqueFiles.size() << " files found, " 2817a51313dSChris Lattner << UniqueDirs.size() << " dirs found.\n"; 2827a51313dSChris Lattner llvm::cerr << NumDirLookups << " dir lookups, " 2837a51313dSChris Lattner << NumDirCacheMisses << " dir cache misses.\n"; 2847a51313dSChris Lattner llvm::cerr << NumFileLookups << " file lookups, " 2857a51313dSChris Lattner << NumFileCacheMisses << " file cache misses.\n"; 2867a51313dSChris Lattner 2877a51313dSChris Lattner //llvm::cerr << PagesMapped << BytesOfPagesMapped << FSLookups; 2887a51313dSChris Lattner } 289c5046832SDouglas Gregor 290c5046832SDouglas Gregor int MemorizeStatCalls::stat(const char *path, struct stat *buf) { 291c5046832SDouglas Gregor int result = ::stat(path, buf); 292c5046832SDouglas Gregor 293c5046832SDouglas Gregor if (result != 0) { 294c5046832SDouglas Gregor // Cache failed 'stat' results. 295c5046832SDouglas Gregor struct stat empty; 296c5046832SDouglas Gregor StatCalls[path] = StatResult(result, empty); 297c5046832SDouglas Gregor } 298c5046832SDouglas Gregor else if (!S_ISDIR(buf->st_mode) || llvm::sys::Path(path).isAbsolute()) { 299c5046832SDouglas Gregor // Cache file 'stat' results and directories with absolutely 300c5046832SDouglas Gregor // paths. 301c5046832SDouglas Gregor StatCalls[path] = StatResult(result, *buf); 302c5046832SDouglas Gregor } 303c5046832SDouglas Gregor 304c5046832SDouglas Gregor return result; 305c5046832SDouglas Gregor } 306