<html><head><meta http-equiv="Content-Type" content="text/html; charset=us-ascii"></head><body style="word-wrap: break-word; -webkit-nbsp-mode: space; -webkit-line-break: after-white-space;"><br><div><div>On Jan 25, 2013, at 4:55 PM, Douglas Gregor &lt;<a href="mailto:dgregor@apple.com">dgregor@apple.com</a>&gt; wrote:</div><br class="Apple-interchange-newline"><blockquote type="cite"><div style="letter-spacing: normal; orphans: auto; text-align: start; text-indent: 0px; text-transform: none; white-space: normal; widows: auto; word-spacing: 0px; -webkit-text-size-adjust: auto; -webkit-text-stroke-width: 0px;">Author: dgregor<br>Date: Fri Jan 25 18:55:12 2013<br>New Revision: 173542<br><br>URL:<span class="Apple-converted-space"> </span><a href="http://llvm.org/viewvc/llvm-project?rev=173542&view=rev">http://llvm.org/viewvc/llvm-project?rev=173542&view=rev</a><br>Log:<br>Since we're stuck with realpath for the header &lt;-&gt; module mapping,<br>factor the realpath calls into FileManager::getCanonicalName() so we<br>can cache the results of this epically slow operation. 
5% speedup on<br>my modules test, and realpath drops out of the profile.<br><br>Modified:<br>   cfe/trunk/include/clang/Basic/FileManager.h<br>   cfe/trunk/lib/Basic/FileManager.cpp<br>   cfe/trunk/lib/Lex/HeaderSearch.cpp<br>   cfe/trunk/lib/Lex/ModuleMap.cpp<br><br>Modified: cfe/trunk/include/clang/Basic/FileManager.h<br>URL:<span class="Apple-converted-space"> </span><a href="http://llvm.org/viewvc/llvm-project/cfe/trunk/include/clang/Basic/FileManager.h?rev=173542&r1=173541&r2=173542&view=diff">http://llvm.org/viewvc/llvm-project/cfe/trunk/include/clang/Basic/FileManager.h?rev=173542&r1=173541&r2=173542&view=diff</a><br>==============================================================================<br>--- cfe/trunk/include/clang/Basic/FileManager.h (original)<br>+++ cfe/trunk/include/clang/Basic/FileManager.h Fri Jan 25 18:55:12 2013<br>@@ -17,6 +17,7 @@<br><br>#include "clang/Basic/FileSystemOptions.h"<br>#include "clang/Basic/LLVM.h"<br>+#include "llvm/ADT/DenseMap.h"<br>#include "llvm/ADT/IntrusiveRefCntPtr.h"<br>#include "llvm/ADT/OwningPtr.h"<br>#include "llvm/ADT/SmallVector.h"<br>@@ -152,6 +153,12 @@ class FileManager : public RefCountedBas<br>  /// \see SeenDirEntries<br>  llvm::StringMap&lt;FileEntry*, llvm::BumpPtrAllocator&gt; SeenFileEntries;<br><br>+  /// \brief The canonical names of directories.<br>+  llvm::DenseMap&lt;const DirectoryEntry *, llvm::StringRef&gt; CanonicalDirNames;<br>+<br>+  /// \brief Storage for canonical names that we have computed.<br>+  llvm::BumpPtrAllocator CanonicalNameStorage;<br>+<br>  /// \brief Each FileEntry we create is assigned a unique ID #.<br>  ///<br>  unsigned NextFileUID;<br>@@ -257,6 +264,13 @@ public:<br>  static void modifyFileEntry(FileEntry *File, off_t Size,<br>                              time_t ModificationTime);<br><br>+  /// \brief Retrieve the canonical name for a given directory.<br>+  ///<br>+  /// This is a very expensive operation, despite its results being cached,<br>+  /// and should only be used when 
the physical layout of the file system is<br>+  /// required, which is (almost) never.<br>+  StringRef getCanonicalName(const DirectoryEntry *Dir);<br>+<br>  void PrintStats() const;<br>};<br><br><br>Modified: cfe/trunk/lib/Basic/FileManager.cpp<br>URL:<span class="Apple-converted-space"> </span><a href="http://llvm.org/viewvc/llvm-project/cfe/trunk/lib/Basic/FileManager.cpp?rev=173542&r1=173541&r2=173542&view=diff">http://llvm.org/viewvc/llvm-project/cfe/trunk/lib/Basic/FileManager.cpp?rev=173542&r1=173541&r2=173542&view=diff</a><br>==============================================================================<br>--- cfe/trunk/lib/Basic/FileManager.cpp (original)<br>+++ cfe/trunk/lib/Basic/FileManager.cpp Fri Jan 25 18:55:12 2013<br>@@ -40,6 +40,11 @@<br>#define S_ISFIFO(x) (0)<br>#endif<br>#endif<br>+#if defined(LLVM_ON_UNIX)<br>+#if defined(__linux__)<br>+#include &lt;linux/limits.h&gt;<br>+#endif<br>+#endif<br>using namespace clang;<br><br>// FIXME: Enhance libsystem to support inode and other fields.<br>@@ -620,6 +625,29 @@ void FileManager::modifyFileEntry(FileEn<br>  File->ModTime = ModificationTime;<br>}<br><br>+StringRef FileManager::getCanonicalName(const DirectoryEntry *Dir) {<br>+  // FIXME: use llvm::sys::fs::canonical() when it gets implemented<br>+#ifdef LLVM_ON_UNIX<br>+  llvm::DenseMap&lt;const DirectoryEntry *, llvm::StringRef&gt;::iterator Known<br>+    = CanonicalDirNames.find(Dir);<br>+  if (Known != CanonicalDirNames.end())<br>+    return Known->second;<br>+<br>+  StringRef CanonicalName(Dir->getName());<br>+  char CanonicalNameBuf[PATH_MAX];<br>+  if (realpath(Dir->getName(), CanonicalNameBuf)) {<br>+    unsigned Len = strlen(CanonicalNameBuf);<br>+    char *Mem = static_cast&lt;char *&gt;(CanonicalNameStorage.Allocate(Len, 1));<br>+    memcpy(Mem, CanonicalNameBuf, Len);<br>+    CanonicalName = StringRef(Mem, Len);<br>+  }<br>+<br>+  CanonicalDirNames.insert(std::make_pair(Dir, CanonicalName));<br>+  return CanonicalName;<br>+#else<br>+  return 
StringRef(Dir->getName());<br>+#endif<br>+}<br><br>void FileManager::PrintStats() const {<br>  llvm::errs() &lt;&lt; "\n*** File Manager Stats:\n";<br><br>Modified: cfe/trunk/lib/Lex/HeaderSearch.cpp<br>URL:<span class="Apple-converted-space"> </span><a href="http://llvm.org/viewvc/llvm-project/cfe/trunk/lib/Lex/HeaderSearch.cpp?rev=173542&r1=173541&r2=173542&view=diff">http://llvm.org/viewvc/llvm-project/cfe/trunk/lib/Lex/HeaderSearch.cpp?rev=173542&r1=173541&r2=173542&view=diff</a><br>==============================================================================<br>--- cfe/trunk/lib/Lex/HeaderSearch.cpp (original)<br>+++ cfe/trunk/lib/Lex/HeaderSearch.cpp Fri Jan 25 18:55:12 2013<br>@@ -268,6 +268,10 @@ const FileEntry *DirectoryLookup::Lookup<br>  return Result;<br>}<br><br>+/// FIXME: HACK HACK HACK!<br>+static llvm::DenseMap&lt;const DirectoryEntry *, const DirectoryEntry *&gt;<br>+  TopFrameworkDirs;<br>+<br></div></blockquote><div><br></div><div>Hi Doug,</div><div>Is the TopFrameworkDirs map actually used?</div><div><br></div><div> Chad</div><div><br></div><br><blockquote type="cite"><div style="letter-spacing: normal; orphans: auto; text-align: start; text-indent: 0px; text-transform: none; white-space: normal; widows: auto; word-spacing: 0px; -webkit-text-size-adjust: auto; -webkit-text-stroke-width: 0px;">/// \brief Given a framework directory, find the top-most framework directory.<br>///<br>/// \param FileMgr The file manager to use for directory lookups.<br>@@ -280,7 +284,6 @@ getTopFrameworkDir(FileManager &FileMgr,<br>  assert(llvm::sys::path::extension(DirName) == ".framework" &&<br>         "Not a framework directory");<br><br>-#ifdef LLVM_ON_UNIX<br>  // Note: as an egregious but useful hack we use the real path here, because<br>  // frameworks moving between top-level frameworks to embedded frameworks tend<br>  // to be symlinked, and we base the logical structure of modules on the<br>@@ -295,12 +298,8 @@ getTopFrameworkDir(FileManager &FileMgr,<br>  //<br>  
// Similar issues occur when a top-level framework has moved into an<br>  // embedded framework.<br>-  char RealDirName[PATH_MAX];<br>-  if (realpath(DirName.str().c_str(), RealDirName))<br>-    DirName = RealDirName;<br>-#endif<br>-<br>  const DirectoryEntry *TopFrameworkDir = FileMgr.getDirectory(DirName);<br>+  DirName = FileMgr.getCanonicalName(TopFrameworkDir);<br>  do {<br>    // Get the parent directory name.<br>    DirName = llvm::sys::path::parent_path(DirName);<br><br>Modified: cfe/trunk/lib/Lex/ModuleMap.cpp<br>URL:<span class="Apple-converted-space"> </span><a href="http://llvm.org/viewvc/llvm-project/cfe/trunk/lib/Lex/ModuleMap.cpp?rev=173542&r1=173541&r2=173542&view=diff">http://llvm.org/viewvc/llvm-project/cfe/trunk/lib/Lex/ModuleMap.cpp?rev=173542&r1=173541&r2=173542&view=diff</a><br>==============================================================================<br>--- cfe/trunk/lib/Lex/ModuleMap.cpp (original)<br>+++ cfe/trunk/lib/Lex/ModuleMap.cpp Fri Jan 25 18:55:12 2013<br>@@ -163,20 +163,12 @@ Module *ModuleMap::findModuleForHeader(c<br><br>  const DirectoryEntry *Dir = File->getDir();<br>  SmallVector&lt;const DirectoryEntry *, 2&gt; SkippedDirs;<br>-#ifdef LLVM_ON_UNIX<br>+<br>  // Note: as an egregious but useful hack we use the real path here, because<br>  // frameworks moving from top-level frameworks to embedded frameworks tend<br>  // to be symlinked from the top-level location to the embedded location,<br>  // and we need to resolve lookups as if we had found the embedded location.<br>-  char RealDirName[PATH_MAX];<br>-  StringRef DirName;<br>-  if (realpath(Dir->getName(), RealDirName))<br>-    DirName = RealDirName;<br>-  else<br>-    DirName = Dir->getName();<br>-#else<br>-  StringRef DirName = Dir->getName();<br>-#endif<br>+  StringRef DirName = SourceMgr->getFileManager().getCanonicalName(Dir);<br><br>  // Keep walking up the directory hierarchy, looking for a directory with<br>  // an umbrella header.<br>@@ -420,16 +412,13 @@ 
ModuleMap::inferFrameworkModule(StringRe<br>  // a framework module, do so.<br>  if (!Parent) {<br>    // Determine whether we're allowed to infer a module map.<br>-    StringRef FrameworkDirName = FrameworkDir->getName();<br>-#ifdef LLVM_ON_UNIX<br>+<br>    // Note: as an egregious but useful hack we use the real path here, because<br>    // we might be looking at an embedded framework that symlinks out to a<br>    // top-level framework, and we need to infer as if we were naming the<br>    // top-level framework.<br>-    char RealFrameworkDirName[PATH_MAX];<br>-    if (realpath(FrameworkDir->getName(), RealFrameworkDirName))<br>-      FrameworkDirName = RealFrameworkDirName;<br>-#endif<br>+    StringRef FrameworkDirName<br>+      = SourceMgr->getFileManager().getCanonicalName(FrameworkDir);<br><br>    bool canInfer = false;<br>    if (llvm::sys::path::has_parent_path(FrameworkDirName)) {<br>@@ -527,29 +516,23 @@ ModuleMap::inferFrameworkModule(StringRe<br>      // check whether it is actually a subdirectory of the parent directory.<br>      // This will not be the case if the 'subframework' is actually a symlink<br>      // out to a top-level framework.<br>-#ifdef LLVM_ON_UNIX<br>-      char RealSubframeworkDirName[PATH_MAX];<br>-      if (realpath(Dir->path().c_str(), RealSubframeworkDirName)) {<br>-        StringRef SubframeworkDirName = RealSubframeworkDirName;<br>-<br>-        bool FoundParent = false;<br>-        do {<br>-          // Get the parent directory name.<br>-          SubframeworkDirName<br>-            = llvm::sys::path::parent_path(SubframeworkDirName);<br>-          if (SubframeworkDirName.empty())<br>-            break;<br>-<br>-          if (FileMgr.getDirectory(SubframeworkDirName) == FrameworkDir) {<br>-            FoundParent = true;<br>-            break;<br>-          }<br>-        } while (true);<br>+      StringRef SubframeworkDirName = FileMgr.getCanonicalName(SubframeworkDir);<br>+      bool FoundParent = false;<br>+      do {<br>+   
     // Get the parent directory name.<br>+        SubframeworkDirName<br>+          = llvm::sys::path::parent_path(SubframeworkDirName);<br>+        if (SubframeworkDirName.empty())<br>+          break;<br>+<br>+        if (FileMgr.getDirectory(SubframeworkDirName) == FrameworkDir) {<br>+          FoundParent = true;<br>+          break;<br>+        }<br>+      } while (true);<br><br>-        if (!FoundParent)<br>-          continue;<br>-      }<br>-#endif<br>+      if (!FoundParent)<br>+        continue;<br><br>      // FIXME: Do we want to warn about subframeworks without umbrella headers?<br>      SmallString<32> NameBuf;<br><br><br>_______________________________________________<br>cfe-commits mailing list<br><a href="mailto:cfe-commits@cs.uiuc.edu">cfe-commits@cs.uiuc.edu</a><br><a href="http://lists.cs.uiuc.edu/mailman/listinfo/cfe-commits">http://lists.cs.uiuc.edu/mailman/listinfo/cfe-commits</a></div></blockquote></div><br></body></html>