17a51313dSChris Lattner ///===--- FileManager.cpp - File System Probing and Caching ----------------===//
27a51313dSChris Lattner //
37a51313dSChris Lattner //                     The LLVM Compiler Infrastructure
47a51313dSChris Lattner //
57a51313dSChris Lattner // This file is distributed under the University of Illinois Open Source
67a51313dSChris Lattner // License. See LICENSE.TXT for details.
77a51313dSChris Lattner //
87a51313dSChris Lattner //===----------------------------------------------------------------------===//
97a51313dSChris Lattner //
107a51313dSChris Lattner //  This file implements the FileManager interface.
117a51313dSChris Lattner //
127a51313dSChris Lattner //===----------------------------------------------------------------------===//
137a51313dSChris Lattner //
147a51313dSChris Lattner // TODO: This should index all interesting directories with dirent calls.
157a51313dSChris Lattner //  getdirentries ?
167a51313dSChris Lattner //  opendir/readdir_r/closedir ?
177a51313dSChris Lattner //
187a51313dSChris Lattner //===----------------------------------------------------------------------===//
197a51313dSChris Lattner 
207a51313dSChris Lattner #include "clang/Basic/FileManager.h"
217a51313dSChris Lattner #include "llvm/ADT/SmallString.h"
223441b4f7SChris Lattner #include "llvm/Support/raw_ostream.h"
23c5046832SDouglas Gregor #include "llvm/System/Path.h"
247a51313dSChris Lattner #include "llvm/Config/config.h"
2526db6481SBenjamin Kramer #include <map>
2626db6481SBenjamin Kramer #include <set>
2726db6481SBenjamin Kramer #include <string>
287a51313dSChris Lattner using namespace clang;
297a51313dSChris Lattner 
307a51313dSChris Lattner // FIXME: Enhance libsystem to support inode and other fields.
317a51313dSChris Lattner #include <sys/stat.h>
327a51313dSChris Lattner 
#if defined(_MSC_VER)
// This file tests st_mode with S_ISDIR; when building with MSVC we supply the
// macro ourselves.  The argument is parenthesized so that a compound
// expression (e.g. `a | b`) is masked as a whole instead of being split by
// operator precedence.
#define S_ISDIR(s) (_S_IFDIR & (s))
#endif
367a51313dSChris Lattner 
/// NON_EXISTENT_DIR - Sentinel DirectoryEntry pointer, distinct from null,
/// that stands for a directory name that does not exist on the disk.
#define NON_EXISTENT_DIR \
  reinterpret_cast<DirectoryEntry*>(static_cast<intptr_t>(-1))
407a51313dSChris Lattner 
415c04bd81STed Kremenek //===----------------------------------------------------------------------===//
425c04bd81STed Kremenek // Windows.
435c04bd81STed Kremenek //===----------------------------------------------------------------------===//
445c04bd81STed Kremenek 
457a51313dSChris Lattner #ifdef LLVM_ON_WIN32
467a51313dSChris Lattner 
477a51313dSChris Lattner #define IS_DIR_SEPARATOR_CHAR(x) ((x) == '/' || (x) == '\\')
487a51313dSChris Lattner 
497a51313dSChris Lattner namespace {
5011289f42SMike Stump   static std::string GetFullPath(const char *relPath) {
517a51313dSChris Lattner     char *absPathStrPtr = _fullpath(NULL, relPath, 0);
527a51313dSChris Lattner     assert(absPathStrPtr && "_fullpath() returned NULL!");
537a51313dSChris Lattner 
547a51313dSChris Lattner     std::string absPath(absPathStrPtr);
557a51313dSChris Lattner 
567a51313dSChris Lattner     free(absPathStrPtr);
577a51313dSChris Lattner     return absPath;
587a51313dSChris Lattner   }
597a51313dSChris Lattner }
607a51313dSChris Lattner 
617a51313dSChris Lattner class FileManager::UniqueDirContainer {
627a51313dSChris Lattner   /// UniqueDirs - Cache from full path to existing directories/files.
637a51313dSChris Lattner   ///
647a51313dSChris Lattner   llvm::StringMap<DirectoryEntry> UniqueDirs;
657a51313dSChris Lattner 
667a51313dSChris Lattner public:
677a51313dSChris Lattner   DirectoryEntry &getDirectory(const char *Name, struct stat &StatBuf) {
687a51313dSChris Lattner     std::string FullPath(GetFullPath(Name));
697a51313dSChris Lattner     return UniqueDirs.GetOrCreateValue(
707a51313dSChris Lattner                               FullPath.c_str(),
717a51313dSChris Lattner                               FullPath.c_str() + FullPath.size()
727a51313dSChris Lattner                                                                 ).getValue();
737a51313dSChris Lattner   }
747a51313dSChris Lattner 
757a51313dSChris Lattner   size_t size() { return UniqueDirs.size(); }
767a51313dSChris Lattner };
777a51313dSChris Lattner 
787a51313dSChris Lattner class FileManager::UniqueFileContainer {
797a51313dSChris Lattner   /// UniqueFiles - Cache from full path to existing directories/files.
807a51313dSChris Lattner   ///
811502b7e2STed Kremenek   llvm::StringMap<FileEntry, llvm::BumpPtrAllocator> UniqueFiles;
827a51313dSChris Lattner 
837a51313dSChris Lattner public:
847a51313dSChris Lattner   FileEntry &getFile(const char *Name, struct stat &StatBuf) {
857a51313dSChris Lattner     std::string FullPath(GetFullPath(Name));
867a51313dSChris Lattner     return UniqueFiles.GetOrCreateValue(
877a51313dSChris Lattner                                FullPath.c_str(),
887a51313dSChris Lattner                                FullPath.c_str() + FullPath.size()
897a51313dSChris Lattner                                                                  ).getValue();
907a51313dSChris Lattner   }
917a51313dSChris Lattner 
927a51313dSChris Lattner   size_t size() { return UniqueFiles.size(); }
937a51313dSChris Lattner };
947a51313dSChris Lattner 
955c04bd81STed Kremenek //===----------------------------------------------------------------------===//
965c04bd81STed Kremenek // Unix-like Systems.
975c04bd81STed Kremenek //===----------------------------------------------------------------------===//
985c04bd81STed Kremenek 
997a51313dSChris Lattner #else
1007a51313dSChris Lattner 
1017a51313dSChris Lattner #define IS_DIR_SEPARATOR_CHAR(x) ((x) == '/')
1027a51313dSChris Lattner 
1037a51313dSChris Lattner class FileManager::UniqueDirContainer {
1047a51313dSChris Lattner   /// UniqueDirs - Cache from ID's to existing directories/files.
1057a51313dSChris Lattner   ///
1067a51313dSChris Lattner   std::map<std::pair<dev_t, ino_t>, DirectoryEntry> UniqueDirs;
1077a51313dSChris Lattner 
1087a51313dSChris Lattner public:
1097a51313dSChris Lattner   DirectoryEntry &getDirectory(const char *Name, struct stat &StatBuf) {
1107a51313dSChris Lattner     return UniqueDirs[std::make_pair(StatBuf.st_dev, StatBuf.st_ino)];
1117a51313dSChris Lattner   }
1127a51313dSChris Lattner 
1137a51313dSChris Lattner   size_t size() { return UniqueDirs.size(); }
1147a51313dSChris Lattner };
1157a51313dSChris Lattner 
1167a51313dSChris Lattner class FileManager::UniqueFileContainer {
1177a51313dSChris Lattner   /// UniqueFiles - Cache from ID's to existing directories/files.
1187a51313dSChris Lattner   ///
1197a51313dSChris Lattner   std::set<FileEntry> UniqueFiles;
1207a51313dSChris Lattner 
1217a51313dSChris Lattner public:
1227a51313dSChris Lattner   FileEntry &getFile(const char *Name, struct stat &StatBuf) {
1237a51313dSChris Lattner     return
1247a51313dSChris Lattner       const_cast<FileEntry&>(
1257a51313dSChris Lattner                     *UniqueFiles.insert(FileEntry(StatBuf.st_dev,
1265d7e2e17STed Kremenek                                                   StatBuf.st_ino,
1275d7e2e17STed Kremenek                                                   StatBuf.st_mode)).first);
1287a51313dSChris Lattner   }
1297a51313dSChris Lattner 
1307a51313dSChris Lattner   size_t size() { return UniqueFiles.size(); }
1317a51313dSChris Lattner };
1327a51313dSChris Lattner 
1337a51313dSChris Lattner #endif
1347a51313dSChris Lattner 
1355c04bd81STed Kremenek //===----------------------------------------------------------------------===//
1365c04bd81STed Kremenek // Common logic.
1375c04bd81STed Kremenek //===----------------------------------------------------------------------===//
1387a51313dSChris Lattner 
1395d7e2e17STed Kremenek FileManager::FileManager()
140c8b740eaSTed Kremenek   : UniqueDirs(*new UniqueDirContainer),
1417a51313dSChris Lattner     UniqueFiles(*new UniqueFileContainer),
1425d7e2e17STed Kremenek     DirEntries(64), FileEntries(64), NextFileUID(0) {
1437a51313dSChris Lattner   NumDirLookups = NumFileLookups = 0;
1447a51313dSChris Lattner   NumDirCacheMisses = NumFileCacheMisses = 0;
1457a51313dSChris Lattner }
1467a51313dSChris Lattner 
1477a51313dSChris Lattner FileManager::~FileManager() {
1487a51313dSChris Lattner   delete &UniqueDirs;
1497a51313dSChris Lattner   delete &UniqueFiles;
1507a51313dSChris Lattner }
1517a51313dSChris Lattner 
152*d2eb58abSDouglas Gregor void FileManager::addStatCache(StatSysCallCache *statCache, bool AtBeginning) {
153*d2eb58abSDouglas Gregor   assert(statCache && "No stat cache provided?");
154*d2eb58abSDouglas Gregor   if (AtBeginning || StatCache.get() == 0) {
155*d2eb58abSDouglas Gregor     statCache->setNextStatCache(StatCache.take());
156*d2eb58abSDouglas Gregor     StatCache.reset(statCache);
157*d2eb58abSDouglas Gregor     return;
158*d2eb58abSDouglas Gregor   }
159*d2eb58abSDouglas Gregor 
160*d2eb58abSDouglas Gregor   StatSysCallCache *LastCache = StatCache.get();
161*d2eb58abSDouglas Gregor   while (LastCache->getNextStatCache())
162*d2eb58abSDouglas Gregor     LastCache = LastCache->getNextStatCache();
163*d2eb58abSDouglas Gregor 
164*d2eb58abSDouglas Gregor   LastCache->setNextStatCache(statCache);
165*d2eb58abSDouglas Gregor }
166*d2eb58abSDouglas Gregor 
167*d2eb58abSDouglas Gregor void FileManager::removeStatCache(StatSysCallCache *statCache) {
168*d2eb58abSDouglas Gregor   if (!statCache)
169*d2eb58abSDouglas Gregor     return;
170*d2eb58abSDouglas Gregor 
171*d2eb58abSDouglas Gregor   if (StatCache.get() == statCache) {
172*d2eb58abSDouglas Gregor     // This is the first stat cache.
173*d2eb58abSDouglas Gregor     StatCache.reset(StatCache->takeNextStatCache());
174*d2eb58abSDouglas Gregor     return;
175*d2eb58abSDouglas Gregor   }
176*d2eb58abSDouglas Gregor 
177*d2eb58abSDouglas Gregor   // Find the stat cache in the list.
178*d2eb58abSDouglas Gregor   StatSysCallCache *PrevCache = StatCache.get();
179*d2eb58abSDouglas Gregor   while (PrevCache && PrevCache->getNextStatCache() != statCache)
180*d2eb58abSDouglas Gregor     PrevCache = PrevCache->getNextStatCache();
181*d2eb58abSDouglas Gregor   if (PrevCache)
182*d2eb58abSDouglas Gregor     PrevCache->setNextStatCache(statCache->getNextStatCache());
183*d2eb58abSDouglas Gregor   else
184*d2eb58abSDouglas Gregor     assert(false && "Stat cache not found for removal");
185*d2eb58abSDouglas Gregor }
186*d2eb58abSDouglas Gregor 
1877a51313dSChris Lattner /// getDirectory - Lookup, cache, and verify the specified directory.  This
1887a51313dSChris Lattner /// returns null if the directory doesn't exist.
1897a51313dSChris Lattner ///
1907a51313dSChris Lattner const DirectoryEntry *FileManager::getDirectory(const char *NameStart,
1917a51313dSChris Lattner                                                 const char *NameEnd) {
1927a51313dSChris Lattner   ++NumDirLookups;
1937a51313dSChris Lattner   llvm::StringMapEntry<DirectoryEntry *> &NamedDirEnt =
1947a51313dSChris Lattner     DirEntries.GetOrCreateValue(NameStart, NameEnd);
1957a51313dSChris Lattner 
1967a51313dSChris Lattner   // See if there is already an entry in the map.
1977a51313dSChris Lattner   if (NamedDirEnt.getValue())
1987a51313dSChris Lattner     return NamedDirEnt.getValue() == NON_EXISTENT_DIR
1997a51313dSChris Lattner               ? 0 : NamedDirEnt.getValue();
2007a51313dSChris Lattner 
2017a51313dSChris Lattner   ++NumDirCacheMisses;
2027a51313dSChris Lattner 
2037a51313dSChris Lattner   // By default, initialize it to invalid.
2047a51313dSChris Lattner   NamedDirEnt.setValue(NON_EXISTENT_DIR);
2057a51313dSChris Lattner 
2067a51313dSChris Lattner   // Get the null-terminated directory name as stored as the key of the
2077a51313dSChris Lattner   // DirEntries map.
2087a51313dSChris Lattner   const char *InterndDirName = NamedDirEnt.getKeyData();
2097a51313dSChris Lattner 
2107a51313dSChris Lattner   // Check to see if the directory exists.
2117a51313dSChris Lattner   struct stat StatBuf;
212c8b740eaSTed Kremenek   if (stat_cached(InterndDirName, &StatBuf) ||   // Error stat'ing.
2137a51313dSChris Lattner       !S_ISDIR(StatBuf.st_mode))          // Not a directory?
2147a51313dSChris Lattner     return 0;
2157a51313dSChris Lattner 
2167a51313dSChris Lattner   // It exists.  See if we have already opened a directory with the same inode.
2177a51313dSChris Lattner   // This occurs when one dir is symlinked to another, for example.
2187a51313dSChris Lattner   DirectoryEntry &UDE = UniqueDirs.getDirectory(InterndDirName, StatBuf);
2197a51313dSChris Lattner 
2207a51313dSChris Lattner   NamedDirEnt.setValue(&UDE);
2217a51313dSChris Lattner   if (UDE.getName()) // Already have an entry with this inode, return it.
2227a51313dSChris Lattner     return &UDE;
2237a51313dSChris Lattner 
2247a51313dSChris Lattner   // Otherwise, we don't have this directory yet, add it.  We use the string
2257a51313dSChris Lattner   // key from the DirEntries map as the string.
2267a51313dSChris Lattner   UDE.Name  = InterndDirName;
2277a51313dSChris Lattner   return &UDE;
2287a51313dSChris Lattner }
2297a51313dSChris Lattner 
/// NON_EXISTENT_FILE - Sentinel FileEntry pointer, distinct from null, that
/// stands for a filename that does not exist on the disk.
#define NON_EXISTENT_FILE \
  reinterpret_cast<FileEntry*>(static_cast<intptr_t>(-1))
2337a51313dSChris Lattner 
2347a51313dSChris Lattner /// getFile - Lookup, cache, and verify the specified file.  This returns null
2357a51313dSChris Lattner /// if the file doesn't exist.
2367a51313dSChris Lattner ///
2377a51313dSChris Lattner const FileEntry *FileManager::getFile(const char *NameStart,
2387a51313dSChris Lattner                                       const char *NameEnd) {
2397a51313dSChris Lattner   ++NumFileLookups;
2407a51313dSChris Lattner 
2417a51313dSChris Lattner   // See if there is already an entry in the map.
2427a51313dSChris Lattner   llvm::StringMapEntry<FileEntry *> &NamedFileEnt =
2437a51313dSChris Lattner     FileEntries.GetOrCreateValue(NameStart, NameEnd);
2447a51313dSChris Lattner 
2457a51313dSChris Lattner   // See if there is already an entry in the map.
2467a51313dSChris Lattner   if (NamedFileEnt.getValue())
2477a51313dSChris Lattner     return NamedFileEnt.getValue() == NON_EXISTENT_FILE
2487a51313dSChris Lattner                  ? 0 : NamedFileEnt.getValue();
2497a51313dSChris Lattner 
2507a51313dSChris Lattner   ++NumFileCacheMisses;
2517a51313dSChris Lattner 
2527a51313dSChris Lattner   // By default, initialize it to invalid.
2537a51313dSChris Lattner   NamedFileEnt.setValue(NON_EXISTENT_FILE);
2547a51313dSChris Lattner 
2557a51313dSChris Lattner   // Figure out what directory it is in.   If the string contains a / in it,
2567a51313dSChris Lattner   // strip off everything after it.
2577a51313dSChris Lattner   // FIXME: this logic should be in sys::Path.
2587a51313dSChris Lattner   const char *SlashPos = NameEnd-1;
2597a51313dSChris Lattner   while (SlashPos >= NameStart && !IS_DIR_SEPARATOR_CHAR(SlashPos[0]))
2607a51313dSChris Lattner     --SlashPos;
26191f5ff6bSChris Lattner   // Ignore duplicate //'s.
26291f5ff6bSChris Lattner   while (SlashPos > NameStart && IS_DIR_SEPARATOR_CHAR(SlashPos[-1]))
26391f5ff6bSChris Lattner     --SlashPos;
2647a51313dSChris Lattner 
2657a51313dSChris Lattner   const DirectoryEntry *DirInfo;
2667a51313dSChris Lattner   if (SlashPos < NameStart) {
2677a51313dSChris Lattner     // Use the current directory if file has no path component.
2687a51313dSChris Lattner     const char *Name = ".";
2697a51313dSChris Lattner     DirInfo = getDirectory(Name, Name+1);
2707a51313dSChris Lattner   } else if (SlashPos == NameEnd-1)
2717a51313dSChris Lattner     return 0;       // If filename ends with a /, it's a directory.
2727a51313dSChris Lattner   else
2737a51313dSChris Lattner     DirInfo = getDirectory(NameStart, SlashPos);
2747a51313dSChris Lattner 
2757a51313dSChris Lattner   if (DirInfo == 0)  // Directory doesn't exist, file can't exist.
2767a51313dSChris Lattner     return 0;
2777a51313dSChris Lattner 
2787a51313dSChris Lattner   // Get the null-terminated file name as stored as the key of the
2797a51313dSChris Lattner   // FileEntries map.
2807a51313dSChris Lattner   const char *InterndFileName = NamedFileEnt.getKeyData();
2817a51313dSChris Lattner 
2827a51313dSChris Lattner   // FIXME: Use the directory info to prune this, before doing the stat syscall.
2837a51313dSChris Lattner   // FIXME: This will reduce the # syscalls.
2847a51313dSChris Lattner 
2857a51313dSChris Lattner   // Nope, there isn't.  Check to see if the file exists.
2867a51313dSChris Lattner   struct stat StatBuf;
28789b422c1SBenjamin Kramer   //llvm::errs() << "STATING: " << Filename;
288c8b740eaSTed Kremenek   if (stat_cached(InterndFileName, &StatBuf) ||   // Error stat'ing.
2897a51313dSChris Lattner         S_ISDIR(StatBuf.st_mode)) {           // A directory?
2907a51313dSChris Lattner     // If this file doesn't exist, we leave a null in FileEntries for this path.
29189b422c1SBenjamin Kramer     //llvm::errs() << ": Not existing\n";
2927a51313dSChris Lattner     return 0;
2937a51313dSChris Lattner   }
29489b422c1SBenjamin Kramer   //llvm::errs() << ": exists\n";
2957a51313dSChris Lattner 
2967a51313dSChris Lattner   // It exists.  See if we have already opened a file with the same inode.
2977a51313dSChris Lattner   // This occurs when one dir is symlinked to another, for example.
2987a51313dSChris Lattner   FileEntry &UFE = UniqueFiles.getFile(InterndFileName, StatBuf);
2997a51313dSChris Lattner 
3007a51313dSChris Lattner   NamedFileEnt.setValue(&UFE);
3017a51313dSChris Lattner   if (UFE.getName())  // Already have an entry with this inode, return it.
3027a51313dSChris Lattner     return &UFE;
3037a51313dSChris Lattner 
3047a51313dSChris Lattner   // Otherwise, we don't have this directory yet, add it.
3057a51313dSChris Lattner   // FIXME: Change the name to be a char* that points back to the 'FileEntries'
3067a51313dSChris Lattner   // key.
3077a51313dSChris Lattner   UFE.Name    = InterndFileName;
3087a51313dSChris Lattner   UFE.Size    = StatBuf.st_size;
3097a51313dSChris Lattner   UFE.ModTime = StatBuf.st_mtime;
3107a51313dSChris Lattner   UFE.Dir     = DirInfo;
3117a51313dSChris Lattner   UFE.UID     = NextFileUID++;
3127a51313dSChris Lattner   return &UFE;
3137a51313dSChris Lattner }
3147a51313dSChris Lattner 
3157a51313dSChris Lattner void FileManager::PrintStats() const {
31689b422c1SBenjamin Kramer   llvm::errs() << "\n*** File Manager Stats:\n";
31789b422c1SBenjamin Kramer   llvm::errs() << UniqueFiles.size() << " files found, "
3187a51313dSChris Lattner                << UniqueDirs.size() << " dirs found.\n";
31989b422c1SBenjamin Kramer   llvm::errs() << NumDirLookups << " dir lookups, "
3207a51313dSChris Lattner                << NumDirCacheMisses << " dir cache misses.\n";
32189b422c1SBenjamin Kramer   llvm::errs() << NumFileLookups << " file lookups, "
3227a51313dSChris Lattner                << NumFileCacheMisses << " file cache misses.\n";
3237a51313dSChris Lattner 
32489b422c1SBenjamin Kramer   //llvm::errs() << PagesMapped << BytesOfPagesMapped << FSLookups;
3257a51313dSChris Lattner }
326c5046832SDouglas Gregor 
327c5046832SDouglas Gregor int MemorizeStatCalls::stat(const char *path, struct stat *buf) {
328*d2eb58abSDouglas Gregor   int result = StatSysCallCache::stat(path, buf);
329c5046832SDouglas Gregor 
330c5046832SDouglas Gregor   if (result != 0) {
331c5046832SDouglas Gregor     // Cache failed 'stat' results.
332c5046832SDouglas Gregor     struct stat empty;
33301ce06fbSChris Lattner     memset(&empty, 0, sizeof(empty));
334c5046832SDouglas Gregor     StatCalls[path] = StatResult(result, empty);
335c5046832SDouglas Gregor   }
336c5046832SDouglas Gregor   else if (!S_ISDIR(buf->st_mode) || llvm::sys::Path(path).isAbsolute()) {
337c5046832SDouglas Gregor     // Cache file 'stat' results and directories with absolutely
338c5046832SDouglas Gregor     // paths.
339c5046832SDouglas Gregor     StatCalls[path] = StatResult(result, *buf);
340c5046832SDouglas Gregor   }
341c5046832SDouglas Gregor 
342c5046832SDouglas Gregor   return result;
343c5046832SDouglas Gregor }
344