Home | History | Annotate | Download | only in gn
      1 // Copyright (c) 2013 The Chromium Authors. All rights reserved.
      2 // Use of this source code is governed by a BSD-style license that can be
      3 // found in the LICENSE file.
      4 
      5 #include "tools/gn/pattern.h"
      6 
      7 #include "tools/gn/value.h"
      8 
      9 namespace {
     10 
     11 void ParsePattern(const std::string& s, std::vector<Pattern::Subrange>* out) {
     12   // Set when the last subrange is a literal so we can just append when we
     13   // find another literal.
     14   Pattern::Subrange* last_literal = NULL;
     15 
     16   for (size_t i = 0; i < s.size(); i++) {
     17     if (s[i] == '*') {
     18       // Don't allow two **.
     19       if (out->size() == 0 ||
     20           (*out)[out->size() - 1].type != Pattern::Subrange::ANYTHING)
     21         out->push_back(Pattern::Subrange(Pattern::Subrange::ANYTHING));
     22       last_literal = NULL;
     23     } else if (s[i] == '\\') {
     24       if (i < s.size() - 1 && s[i + 1] == 'b') {
     25         // "\b" means path boundary.
     26         i++;
     27         out->push_back(Pattern::Subrange(Pattern::Subrange::PATH_BOUNDARY));
     28         last_literal = NULL;
     29       } else {
     30         // Backslash + anything else means that literal char.
     31         if (!last_literal) {
     32           out->push_back(Pattern::Subrange(Pattern::Subrange::LITERAL));
     33           last_literal = &(*out)[out->size() - 1];
     34         }
     35         if (i < s.size() - 1) {
     36           i++;
     37           last_literal->literal.push_back(s[i]);
     38         } else {
     39           // Single backslash at end, use literal backslash.
     40           last_literal->literal.push_back('\\');
     41         }
     42       }
     43     } else {
     44       if (!last_literal) {
     45         out->push_back(Pattern::Subrange(Pattern::Subrange::LITERAL));
     46         last_literal = &(*out)[out->size() - 1];
     47       }
     48       last_literal->literal.push_back(s[i]);
     49     }
     50   }
     51 }
     52 
     53 }  // namespace
     54 
     55 Pattern::Pattern(const std::string& s) {
     56   ParsePattern(s, &subranges_);
     57   is_suffix_ =
     58       (subranges_.size() == 2 &&
     59        subranges_[0].type == Subrange::ANYTHING &&
     60        subranges_[1].type == Subrange::LITERAL);
     61 }
     62 
     63 Pattern::~Pattern() {
     64 }
     65 
     66 bool Pattern::MatchesString(const std::string& s) const {
     67   // Empty pattern matches only empty string.
     68   if (subranges_.empty())
     69     return s.empty();
     70 
     71   if (is_suffix_) {
     72     const std::string& suffix = subranges_[1].literal;
     73     if (suffix.size() > s.size())
     74       return false;  // Too short.
     75     return s.compare(s.size() - suffix.size(), suffix.size(), suffix) == 0;
     76   }
     77 
     78   return RecursiveMatch(s, 0, 0, true);
     79 }
     80 
     81 // We assume the number of ranges is small so recursive is always reasonable.
     82 // Could be optimized to only be recursive for *.
     83 bool Pattern::RecursiveMatch(const std::string& s,
     84                              size_t begin_char,
     85                              size_t subrange_index,
     86                              bool allow_implicit_path_boundary) const {
     87   if (subrange_index >= subranges_.size()) {
     88     // Hit the end of our subranges, the text should also be at the end for a
     89     // match.
     90     return begin_char == s.size();
     91   }
     92 
     93   const Subrange& sr = subranges_[subrange_index];
     94   switch (sr.type) {
     95     case Subrange::LITERAL: {
     96       if (s.size() - begin_char < sr.literal.size())
     97         return false;  // Not enough room.
     98       if (s.compare(begin_char, sr.literal.size(), sr.literal) != 0)
     99         return false;  // Literal doesn't match.
    100 
    101       // Recursively check the next one.
    102       return RecursiveMatch(s, begin_char + sr.literal.size(),
    103                             subrange_index + 1, true);
    104     }
    105 
    106     case Subrange::PATH_BOUNDARY: {
    107       // When we can accept an implicit path boundary, we have to check both
    108       // a match of the literal and the implicit one.
    109       if (allow_implicit_path_boundary &&
    110           (begin_char == 0 || begin_char == s.size())) {
    111         // At implicit path boundary, see if the rest of the pattern matches.
    112         if (RecursiveMatch(s, begin_char, subrange_index + 1, false))
    113           return true;
    114       }
    115 
    116       // Check for a literal "/".
    117       if (begin_char < s.size() && s[begin_char] == '/') {
    118         // At explicit boundary, see if the rest of the pattern matches.
    119         if (RecursiveMatch(s, begin_char + 1, subrange_index + 1, true))
    120           return true;
    121       }
    122       return false;
    123     }
    124 
    125     case Subrange::ANYTHING: {
    126       if (subrange_index == subranges_.size() - 1)
    127         return true;  // * at the end, consider it matching.
    128 
    129       size_t min_next_size = sr.MinSize();
    130 
    131       // We don't care about exactly what matched as long as there was a match,
    132       // so we can do this front-to-back. If we needed the match, we would
    133       // normally want "*" to be greedy so would work backwards.
    134       for (size_t i = begin_char; i < s.size() - min_next_size; i++) {
    135         // Note: this could probably be faster by detecting the type of the
    136         // next match in advance and checking for a match in this loop rather
    137         // than doing a full recursive call for each character.
    138         if (RecursiveMatch(s, i, subrange_index + 1, true))
    139           return true;
    140       }
    141       return false;
    142     }
    143 
    144     default:
    145       NOTREACHED();
    146   }
    147 
    148   return false;
    149 }
    150 
    151 PatternList::PatternList() {
    152 }
    153 
    154 PatternList::~PatternList() {
    155 }
    156 
    157 void PatternList::Append(const Pattern& pattern) {
    158   patterns_.push_back(pattern);
    159 }
    160 
    161 void PatternList::SetFromValue(const Value& v, Err* err) {
    162   patterns_.clear();
    163 
    164   if (v.type() != Value::LIST) {
    165     *err = Err(v.origin(), "This value must be a list.");
    166     return;
    167   }
    168 
    169   const std::vector<Value>& list = v.list_value();
    170   for (size_t i = 0; i < list.size(); i++) {
    171     if (!list[i].VerifyTypeIs(Value::STRING, err))
    172       return;
    173     patterns_.push_back(Pattern(list[i].string_value()));
    174   }
    175 }
    176 
    177 bool PatternList::MatchesString(const std::string& s) const {
    178   for (size_t i = 0; i < patterns_.size(); i++) {
    179     if (patterns_[i].MatchesString(s))
    180       return true;
    181   }
    182   return false;
    183 }
    184 
    185 bool PatternList::MatchesValue(const Value& v) const {
    186   if (v.type() == Value::STRING)
    187     return MatchesString(v.string_value());
    188   return false;
    189 }
    190