Home | History | Annotate | Download | only in Tooling
      1 //===--- FileMatchTrie.cpp - ----------------------------------------------===//
      2 //
      3 //                     The LLVM Compiler Infrastructure
      4 //
      5 // This file is distributed under the University of Illinois Open Source
      6 // License. See LICENSE.TXT for details.
      7 //
      8 //===----------------------------------------------------------------------===//
      9 //
     10 //  This file contains the implementation of a FileMatchTrie.
     11 //
     12 //===----------------------------------------------------------------------===//
     13 
     14 #include "clang/Tooling/FileMatchTrie.h"
     15 #include "llvm/ADT/StringMap.h"
     16 #include "llvm/Support/FileSystem.h"
     17 #include "llvm/Support/Path.h"
     18 #include "llvm/Support/raw_ostream.h"
     19 #include <sstream>
     20 using namespace clang;
     21 using namespace tooling;
     22 
     23 namespace {
     24 /// \brief Default \c PathComparator using \c llvm::sys::fs::equivalent().
     25 struct DefaultPathComparator : public PathComparator {
     26   bool equivalent(StringRef FileA, StringRef FileB) const override {
     27     return FileA == FileB || llvm::sys::fs::equivalent(FileA, FileB);
     28   }
     29 };
     30 }
     31 
     32 namespace clang {
     33 namespace tooling {
     34 /// \brief A node of the \c FileMatchTrie.
     35 ///
     36 /// Each node has storage for up to one path and a map mapping a path segment to
     37 /// child nodes. The trie starts with an empty root node.
     38 class FileMatchTrieNode {
     39 public:
     40   /// \brief Inserts 'NewPath' into this trie. \c ConsumedLength denotes
     41   /// the number of \c NewPath's trailing characters already consumed during
     42   /// recursion.
     43   ///
     44   /// An insert of a path
     45   /// 'p'starts at the root node and does the following:
     46   /// - If the node is empty, insert 'p' into its storage and abort.
     47   /// - If the node has a path 'p2' but no children, take the last path segment
     48   ///   's' of 'p2', put a new child into the map at 's' an insert the rest of
     49   ///   'p2' there.
     50   /// - Insert a new child for the last segment of 'p' and insert the rest of
     51   ///   'p' there.
     52   ///
     53   /// An insert operation is linear in the number of a path's segments.
     54   void insert(StringRef NewPath, unsigned ConsumedLength = 0) {
     55     // We cannot put relative paths into the FileMatchTrie as then a path can be
     56     // a postfix of another path, violating a core assumption of the trie.
     57     if (llvm::sys::path::is_relative(NewPath))
     58       return;
     59     if (Path.empty()) {
     60       // This is an empty leaf. Store NewPath and return.
     61       Path = NewPath;
     62       return;
     63     }
     64     if (Children.empty()) {
     65       // This is a leaf, ignore duplicate entry if 'Path' equals 'NewPath'.
     66       if (NewPath == Path)
     67           return;
     68       // Make this a node and create a child-leaf with 'Path'.
     69       StringRef Element(llvm::sys::path::filename(
     70           StringRef(Path).drop_back(ConsumedLength)));
     71       Children[Element].Path = Path;
     72     }
     73     StringRef Element(llvm::sys::path::filename(
     74           StringRef(NewPath).drop_back(ConsumedLength)));
     75     Children[Element].insert(NewPath, ConsumedLength + Element.size() + 1);
     76   }
     77 
     78   /// \brief Tries to find the node under this \c FileMatchTrieNode that best
     79   /// matches 'FileName'.
     80   ///
     81   /// If multiple paths fit 'FileName' equally well, \c IsAmbiguous is set to
     82   /// \c true and an empty string is returned. If no path fits 'FileName', an
     83   /// empty string is returned. \c ConsumedLength denotes the number of
     84   /// \c Filename's trailing characters already consumed during recursion.
     85   ///
     86   /// To find the best matching node for a given path 'p', the
     87   /// \c findEquivalent() function is called recursively for each path segment
     88   /// (back to fron) of 'p' until a node 'n' is reached that does not ..
     89   /// - .. have children. In this case it is checked
     90   ///   whether the stored path is equivalent to 'p'. If yes, the best match is
     91   ///   found. Otherwise continue with the parent node as if this node did not
     92   ///   exist.
     93   /// - .. a child matching the next path segment. In this case, all children of
     94   ///   'n' are an equally good match for 'p'. All children are of 'n' are found
     95   ///   recursively and their equivalence to 'p' is determined. If none are
     96   ///   equivalent, continue with the parent node as if 'n' didn't exist. If one
     97   ///   is equivalent, the best match is found. Otherwise, report and ambigiuity
     98   ///   error.
     99   StringRef findEquivalent(const PathComparator& Comparator,
    100                            StringRef FileName,
    101                            bool &IsAmbiguous,
    102                            unsigned ConsumedLength = 0) const {
    103     if (Children.empty()) {
    104       if (Comparator.equivalent(StringRef(Path), FileName))
    105         return StringRef(Path);
    106       return StringRef();
    107     }
    108     StringRef Element(llvm::sys::path::filename(FileName.drop_back(
    109         ConsumedLength)));
    110     llvm::StringMap<FileMatchTrieNode>::const_iterator MatchingChild =
    111         Children.find(Element);
    112     if (MatchingChild != Children.end()) {
    113       StringRef Result = MatchingChild->getValue().findEquivalent(
    114           Comparator, FileName, IsAmbiguous,
    115           ConsumedLength + Element.size() + 1);
    116       if (!Result.empty() || IsAmbiguous)
    117         return Result;
    118     }
    119     std::vector<StringRef> AllChildren;
    120     getAll(AllChildren, MatchingChild);
    121     StringRef Result;
    122     for (unsigned i = 0; i < AllChildren.size(); i++) {
    123       if (Comparator.equivalent(AllChildren[i], FileName)) {
    124         if (Result.empty()) {
    125           Result = AllChildren[i];
    126         } else {
    127           IsAmbiguous = true;
    128           return StringRef();
    129         }
    130       }
    131     }
    132     return Result;
    133   }
    134 
    135 private:
    136   /// \brief Gets all paths under this FileMatchTrieNode.
    137   void getAll(std::vector<StringRef> &Results,
    138               llvm::StringMap<FileMatchTrieNode>::const_iterator Except) const {
    139     if (Path.empty())
    140       return;
    141     if (Children.empty()) {
    142       Results.push_back(StringRef(Path));
    143       return;
    144     }
    145     for (llvm::StringMap<FileMatchTrieNode>::const_iterator
    146          It = Children.begin(), E = Children.end();
    147          It != E; ++It) {
    148       if (It == Except)
    149         continue;
    150       It->getValue().getAll(Results, Children.end());
    151     }
    152   }
    153 
    154   // The stored absolute path in this node. Only valid for leaf nodes, i.e.
    155   // nodes where Children.empty().
    156   std::string Path;
    157 
    158   // The children of this node stored in a map based on the next path segment.
    159   llvm::StringMap<FileMatchTrieNode> Children;
    160 };
    161 } // end namespace tooling
    162 } // end namespace clang
    163 
    164 FileMatchTrie::FileMatchTrie()
    165   : Root(new FileMatchTrieNode), Comparator(new DefaultPathComparator()) {}
    166 
    167 FileMatchTrie::FileMatchTrie(PathComparator *Comparator)
    168   : Root(new FileMatchTrieNode), Comparator(Comparator) {}
    169 
    170 FileMatchTrie::~FileMatchTrie() {
    171   delete Root;
    172 }
    173 
    174 void FileMatchTrie::insert(StringRef NewPath) {
    175   Root->insert(NewPath);
    176 }
    177 
    178 StringRef FileMatchTrie::findEquivalent(StringRef FileName,
    179                                         raw_ostream &Error) const {
    180   if (llvm::sys::path::is_relative(FileName)) {
    181     Error << "Cannot resolve relative paths";
    182     return StringRef();
    183   }
    184   bool IsAmbiguous = false;
    185   StringRef Result = Root->findEquivalent(*Comparator, FileName, IsAmbiguous);
    186   if (IsAmbiguous)
    187     Error << "Path is ambiguous";
    188   return Result;
    189 }
    190