17a51313dSChris Lattner ///===--- FileManager.cpp - File System Probing and Caching ----------------===// 27a51313dSChris Lattner // 37a51313dSChris Lattner // The LLVM Compiler Infrastructure 47a51313dSChris Lattner // 57a51313dSChris Lattner // This file is distributed under the University of Illinois Open Source 67a51313dSChris Lattner // License. See LICENSE.TXT for details. 77a51313dSChris Lattner // 87a51313dSChris Lattner //===----------------------------------------------------------------------===// 97a51313dSChris Lattner // 107a51313dSChris Lattner // This file implements the FileManager interface. 117a51313dSChris Lattner // 127a51313dSChris Lattner //===----------------------------------------------------------------------===// 137a51313dSChris Lattner // 147a51313dSChris Lattner // TODO: This should index all interesting directories with dirent calls. 157a51313dSChris Lattner // getdirentries ? 167a51313dSChris Lattner // opendir/readdir_r/closedir ? 177a51313dSChris Lattner // 187a51313dSChris Lattner //===----------------------------------------------------------------------===// 197a51313dSChris Lattner 207a51313dSChris Lattner #include "clang/Basic/FileManager.h" 217a51313dSChris Lattner #include "llvm/ADT/SmallString.h" 227a51313dSChris Lattner #include "llvm/Bitcode/Serialize.h" 237a51313dSChris Lattner #include "llvm/Bitcode/Deserialize.h" 247a51313dSChris Lattner #include "llvm/Support/Streams.h" 257a51313dSChris Lattner #include "llvm/Config/config.h" 267a51313dSChris Lattner using namespace clang; 277a51313dSChris Lattner 287a51313dSChris Lattner // FIXME: Enhance libsystem to support inode and other fields. 297a51313dSChris Lattner #include <sys/stat.h> 307a51313dSChris Lattner 317a51313dSChris Lattner #if defined(_MSC_VER) 32*c8b740eaSTed Kremenek #defisstne S_ISDIR(s) (_S_IFDIR & s) 337a51313dSChris Lattner #endif 347a51313dSChris Lattner 357a51313dSChris Lattner /// NON_EXISTENT_DIR - A special value distinct from null that is used to 367a51313dSChris Lattner /// represent a dir name that doesn't exist on the disk. 377a51313dSChris Lattner #define NON_EXISTENT_DIR reinterpret_cast<DirectoryEntry*>((intptr_t)-1) 387a51313dSChris Lattner 395c04bd81STed Kremenek //===----------------------------------------------------------------------===// 405c04bd81STed Kremenek // Windows. 415c04bd81STed Kremenek //===----------------------------------------------------------------------===// 425c04bd81STed Kremenek 437a51313dSChris Lattner #ifdef LLVM_ON_WIN32 447a51313dSChris Lattner 457a51313dSChris Lattner #define IS_DIR_SEPARATOR_CHAR(x) ((x) == '/' || (x) == '\\') 467a51313dSChris Lattner 477a51313dSChris Lattner namespace { 487a51313dSChris Lattner static std::string GetFullPath(const char *relPath) 497a51313dSChris Lattner { 507a51313dSChris Lattner char *absPathStrPtr = _fullpath(NULL, relPath, 0); 517a51313dSChris Lattner assert(absPathStrPtr && "_fullpath() returned NULL!"); 527a51313dSChris Lattner 537a51313dSChris Lattner std::string absPath(absPathStrPtr); 547a51313dSChris Lattner 557a51313dSChris Lattner free(absPathStrPtr); 567a51313dSChris Lattner return absPath; 577a51313dSChris Lattner } 587a51313dSChris Lattner } 597a51313dSChris Lattner 607a51313dSChris Lattner class FileManager::UniqueDirContainer { 617a51313dSChris Lattner /// UniqueDirs - Cache from full path to existing directories/files. 627a51313dSChris Lattner /// 637a51313dSChris Lattner llvm::StringMap<DirectoryEntry> UniqueDirs; 647a51313dSChris Lattner 657a51313dSChris Lattner public: 667a51313dSChris Lattner DirectoryEntry &getDirectory(const char *Name, struct stat &StatBuf) { 677a51313dSChris Lattner std::string FullPath(GetFullPath(Name)); 687a51313dSChris Lattner return UniqueDirs.GetOrCreateValue( 697a51313dSChris Lattner FullPath.c_str(), 707a51313dSChris Lattner FullPath.c_str() + FullPath.size() 717a51313dSChris Lattner ).getValue(); 727a51313dSChris Lattner } 737a51313dSChris Lattner 747a51313dSChris Lattner size_t size() { return UniqueDirs.size(); } 757a51313dSChris Lattner }; 767a51313dSChris Lattner 777a51313dSChris Lattner class FileManager::UniqueFileContainer { 787a51313dSChris Lattner /// UniqueFiles - Cache from full path to existing directories/files. 797a51313dSChris Lattner /// 801502b7e2STed Kremenek llvm::StringMap<FileEntry, llvm::BumpPtrAllocator> UniqueFiles; 817a51313dSChris Lattner 827a51313dSChris Lattner public: 837a51313dSChris Lattner FileEntry &getFile(const char *Name, struct stat &StatBuf) { 847a51313dSChris Lattner std::string FullPath(GetFullPath(Name)); 857a51313dSChris Lattner return UniqueFiles.GetOrCreateValue( 867a51313dSChris Lattner FullPath.c_str(), 877a51313dSChris Lattner FullPath.c_str() + FullPath.size() 887a51313dSChris Lattner ).getValue(); 897a51313dSChris Lattner } 907a51313dSChris Lattner 917a51313dSChris Lattner size_t size() { return UniqueFiles.size(); } 927a51313dSChris Lattner }; 937a51313dSChris Lattner 945c04bd81STed Kremenek //===----------------------------------------------------------------------===// 955c04bd81STed Kremenek // Unix-like Systems. 965c04bd81STed Kremenek //===----------------------------------------------------------------------===// 975c04bd81STed Kremenek 987a51313dSChris Lattner #else 997a51313dSChris Lattner 1007a51313dSChris Lattner #define IS_DIR_SEPARATOR_CHAR(x) ((x) == '/') 1017a51313dSChris Lattner 1027a51313dSChris Lattner class FileManager::UniqueDirContainer { 1037a51313dSChris Lattner /// UniqueDirs - Cache from ID's to existing directories/files. 1047a51313dSChris Lattner /// 1057a51313dSChris Lattner std::map<std::pair<dev_t, ino_t>, DirectoryEntry> UniqueDirs; 1067a51313dSChris Lattner 1077a51313dSChris Lattner public: 1087a51313dSChris Lattner DirectoryEntry &getDirectory(const char *Name, struct stat &StatBuf) { 1097a51313dSChris Lattner return UniqueDirs[std::make_pair(StatBuf.st_dev, StatBuf.st_ino)]; 1107a51313dSChris Lattner } 1117a51313dSChris Lattner 1127a51313dSChris Lattner size_t size() { return UniqueDirs.size(); } 1137a51313dSChris Lattner }; 1147a51313dSChris Lattner 1157a51313dSChris Lattner class FileManager::UniqueFileContainer { 1167a51313dSChris Lattner /// UniqueFiles - Cache from ID's to existing directories/files. 1177a51313dSChris Lattner /// 1187a51313dSChris Lattner std::set<FileEntry> UniqueFiles; 1197a51313dSChris Lattner 1207a51313dSChris Lattner public: 1217a51313dSChris Lattner FileEntry &getFile(const char *Name, struct stat &StatBuf) { 1227a51313dSChris Lattner return 1237a51313dSChris Lattner const_cast<FileEntry&>( 1247a51313dSChris Lattner *UniqueFiles.insert(FileEntry(StatBuf.st_dev, 1257a51313dSChris Lattner StatBuf.st_ino)).first); 1267a51313dSChris Lattner } 1277a51313dSChris Lattner 1287a51313dSChris Lattner size_t size() { return UniqueFiles.size(); } 1297a51313dSChris Lattner }; 1307a51313dSChris Lattner 1317a51313dSChris Lattner #endif 1327a51313dSChris Lattner 1335c04bd81STed Kremenek //===----------------------------------------------------------------------===// 1345c04bd81STed Kremenek // Common logic. 1355c04bd81STed Kremenek //===----------------------------------------------------------------------===// 1367a51313dSChris Lattner 137*c8b740eaSTed Kremenek FileManager::FileManager(StatSysCallCache* statCache) 138*c8b740eaSTed Kremenek : UniqueDirs(*new UniqueDirContainer), 1397a51313dSChris Lattner UniqueFiles(*new UniqueFileContainer), 140*c8b740eaSTed Kremenek DirEntries(64), FileEntries(64), NextFileUID(0), 141*c8b740eaSTed Kremenek StatCache(statCache) { 1427a51313dSChris Lattner NumDirLookups = NumFileLookups = 0; 1437a51313dSChris Lattner NumDirCacheMisses = NumFileCacheMisses = 0; 1447a51313dSChris Lattner } 1457a51313dSChris Lattner 1467a51313dSChris Lattner FileManager::~FileManager() { 1477a51313dSChris Lattner delete &UniqueDirs; 1487a51313dSChris Lattner delete &UniqueFiles; 149*c8b740eaSTed Kremenek delete StatCache; 1507a51313dSChris Lattner } 1517a51313dSChris Lattner 1527a51313dSChris Lattner 1537a51313dSChris Lattner /// getDirectory - Lookup, cache, and verify the specified directory. This 1547a51313dSChris Lattner /// returns null if the directory doesn't exist. 1557a51313dSChris Lattner /// 1567a51313dSChris Lattner const DirectoryEntry *FileManager::getDirectory(const char *NameStart, 1577a51313dSChris Lattner const char *NameEnd) { 1587a51313dSChris Lattner ++NumDirLookups; 1597a51313dSChris Lattner llvm::StringMapEntry<DirectoryEntry *> &NamedDirEnt = 1607a51313dSChris Lattner DirEntries.GetOrCreateValue(NameStart, NameEnd); 1617a51313dSChris Lattner 1627a51313dSChris Lattner // See if there is already an entry in the map. 1637a51313dSChris Lattner if (NamedDirEnt.getValue()) 1647a51313dSChris Lattner return NamedDirEnt.getValue() == NON_EXISTENT_DIR 1657a51313dSChris Lattner ? 0 : NamedDirEnt.getValue(); 1667a51313dSChris Lattner 1677a51313dSChris Lattner ++NumDirCacheMisses; 1687a51313dSChris Lattner 1697a51313dSChris Lattner // By default, initialize it to invalid. 1707a51313dSChris Lattner NamedDirEnt.setValue(NON_EXISTENT_DIR); 1717a51313dSChris Lattner 1727a51313dSChris Lattner // Get the null-terminated directory name as stored as the key of the 1737a51313dSChris Lattner // DirEntries map. 1747a51313dSChris Lattner const char *InterndDirName = NamedDirEnt.getKeyData(); 1757a51313dSChris Lattner 1767a51313dSChris Lattner // Check to see if the directory exists. 1777a51313dSChris Lattner struct stat StatBuf; 178*c8b740eaSTed Kremenek if (stat_cached(InterndDirName, &StatBuf) || // Error stat'ing. 1797a51313dSChris Lattner !S_ISDIR(StatBuf.st_mode)) // Not a directory? 1807a51313dSChris Lattner return 0; 1817a51313dSChris Lattner 1827a51313dSChris Lattner // It exists. See if we have already opened a directory with the same inode. 1837a51313dSChris Lattner // This occurs when one dir is symlinked to another, for example. 1847a51313dSChris Lattner DirectoryEntry &UDE = UniqueDirs.getDirectory(InterndDirName, StatBuf); 1857a51313dSChris Lattner 1867a51313dSChris Lattner NamedDirEnt.setValue(&UDE); 1877a51313dSChris Lattner if (UDE.getName()) // Already have an entry with this inode, return it. 1887a51313dSChris Lattner return &UDE; 1897a51313dSChris Lattner 1907a51313dSChris Lattner // Otherwise, we don't have this directory yet, add it. We use the string 1917a51313dSChris Lattner // key from the DirEntries map as the string. 1927a51313dSChris Lattner UDE.Name = InterndDirName; 1937a51313dSChris Lattner return &UDE; 1947a51313dSChris Lattner } 1957a51313dSChris Lattner 1967a51313dSChris Lattner /// NON_EXISTENT_FILE - A special value distinct from null that is used to 1977a51313dSChris Lattner /// represent a filename that doesn't exist on the disk. 1987a51313dSChris Lattner #define NON_EXISTENT_FILE reinterpret_cast<FileEntry*>((intptr_t)-1) 1997a51313dSChris Lattner 2007a51313dSChris Lattner /// getFile - Lookup, cache, and verify the specified file. This returns null 2017a51313dSChris Lattner /// if the file doesn't exist. 2027a51313dSChris Lattner /// 2037a51313dSChris Lattner const FileEntry *FileManager::getFile(const char *NameStart, 2047a51313dSChris Lattner const char *NameEnd) { 2057a51313dSChris Lattner ++NumFileLookups; 2067a51313dSChris Lattner 2077a51313dSChris Lattner // See if there is already an entry in the map. 2087a51313dSChris Lattner llvm::StringMapEntry<FileEntry *> &NamedFileEnt = 2097a51313dSChris Lattner FileEntries.GetOrCreateValue(NameStart, NameEnd); 2107a51313dSChris Lattner 2117a51313dSChris Lattner // See if there is already an entry in the map. 2127a51313dSChris Lattner if (NamedFileEnt.getValue()) 2137a51313dSChris Lattner return NamedFileEnt.getValue() == NON_EXISTENT_FILE 2147a51313dSChris Lattner ? 0 : NamedFileEnt.getValue(); 2157a51313dSChris Lattner 2167a51313dSChris Lattner ++NumFileCacheMisses; 2177a51313dSChris Lattner 2187a51313dSChris Lattner // By default, initialize it to invalid. 2197a51313dSChris Lattner NamedFileEnt.setValue(NON_EXISTENT_FILE); 2207a51313dSChris Lattner 2217a51313dSChris Lattner // Figure out what directory it is in. If the string contains a / in it, 2227a51313dSChris Lattner // strip off everything after it. 2237a51313dSChris Lattner // FIXME: this logic should be in sys::Path. 2247a51313dSChris Lattner const char *SlashPos = NameEnd-1; 2257a51313dSChris Lattner while (SlashPos >= NameStart && !IS_DIR_SEPARATOR_CHAR(SlashPos[0])) 2267a51313dSChris Lattner --SlashPos; 2277a51313dSChris Lattner 2287a51313dSChris Lattner const DirectoryEntry *DirInfo; 2297a51313dSChris Lattner if (SlashPos < NameStart) { 2307a51313dSChris Lattner // Use the current directory if file has no path component. 2317a51313dSChris Lattner const char *Name = "."; 2327a51313dSChris Lattner DirInfo = getDirectory(Name, Name+1); 2337a51313dSChris Lattner } else if (SlashPos == NameEnd-1) 2347a51313dSChris Lattner return 0; // If filename ends with a /, it's a directory. 2357a51313dSChris Lattner else 2367a51313dSChris Lattner DirInfo = getDirectory(NameStart, SlashPos); 2377a51313dSChris Lattner 2387a51313dSChris Lattner if (DirInfo == 0) // Directory doesn't exist, file can't exist. 2397a51313dSChris Lattner return 0; 2407a51313dSChris Lattner 2417a51313dSChris Lattner // Get the null-terminated file name as stored as the key of the 2427a51313dSChris Lattner // FileEntries map. 2437a51313dSChris Lattner const char *InterndFileName = NamedFileEnt.getKeyData(); 2447a51313dSChris Lattner 2457a51313dSChris Lattner // FIXME: Use the directory info to prune this, before doing the stat syscall. 2467a51313dSChris Lattner // FIXME: This will reduce the # syscalls. 2477a51313dSChris Lattner 2487a51313dSChris Lattner // Nope, there isn't. Check to see if the file exists. 2497a51313dSChris Lattner struct stat StatBuf; 2507a51313dSChris Lattner //llvm::cerr << "STATING: " << Filename; 251*c8b740eaSTed Kremenek if (stat_cached(InterndFileName, &StatBuf) || // Error stat'ing. 2527a51313dSChris Lattner S_ISDIR(StatBuf.st_mode)) { // A directory? 2537a51313dSChris Lattner // If this file doesn't exist, we leave a null in FileEntries for this path. 2547a51313dSChris Lattner //llvm::cerr << ": Not existing\n"; 2557a51313dSChris Lattner return 0; 2567a51313dSChris Lattner } 2577a51313dSChris Lattner //llvm::cerr << ": exists\n"; 2587a51313dSChris Lattner 2597a51313dSChris Lattner // It exists. See if we have already opened a file with the same inode. 2607a51313dSChris Lattner // This occurs when one dir is symlinked to another, for example. 2617a51313dSChris Lattner FileEntry &UFE = UniqueFiles.getFile(InterndFileName, StatBuf); 2627a51313dSChris Lattner 2637a51313dSChris Lattner NamedFileEnt.setValue(&UFE); 2647a51313dSChris Lattner if (UFE.getName()) // Already have an entry with this inode, return it. 2657a51313dSChris Lattner return &UFE; 2667a51313dSChris Lattner 2677a51313dSChris Lattner // Otherwise, we don't have this directory yet, add it. 2687a51313dSChris Lattner // FIXME: Change the name to be a char* that points back to the 'FileEntries' 2697a51313dSChris Lattner // key. 2707a51313dSChris Lattner UFE.Name = InterndFileName; 2717a51313dSChris Lattner UFE.Size = StatBuf.st_size; 2727a51313dSChris Lattner UFE.ModTime = StatBuf.st_mtime; 2737a51313dSChris Lattner UFE.Dir = DirInfo; 2747a51313dSChris Lattner UFE.UID = NextFileUID++; 2757a51313dSChris Lattner return &UFE; 2767a51313dSChris Lattner } 2777a51313dSChris Lattner 2787a51313dSChris Lattner void FileManager::PrintStats() const { 2797a51313dSChris Lattner llvm::cerr << "\n*** File Manager Stats:\n"; 2807a51313dSChris Lattner llvm::cerr << UniqueFiles.size() << " files found, " 2817a51313dSChris Lattner << UniqueDirs.size() << " dirs found.\n"; 2827a51313dSChris Lattner llvm::cerr << NumDirLookups << " dir lookups, " 2837a51313dSChris Lattner << NumDirCacheMisses << " dir cache misses.\n"; 2847a51313dSChris Lattner llvm::cerr << NumFileLookups << " file lookups, " 2857a51313dSChris Lattner << NumFileCacheMisses << " file cache misses.\n"; 2867a51313dSChris Lattner 2877a51313dSChris Lattner //llvm::cerr << PagesMapped << BytesOfPagesMapped << FSLookups; 2887a51313dSChris Lattner } 289