| // Copyright (c) 2013 The Chromium Authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style license that can be |
| // found in the LICENSE file. |
| |
| #include "tools/gn/pattern.h" |
| |
| #include "tools/gn/value.h" |
| |
| namespace { |
| |
| void ParsePattern(const std::string& s, std::vector<Pattern::Subrange>* out) { |
| // Set when the last subrange is a literal so we can just append when we |
| // find another literal. |
| Pattern::Subrange* last_literal = nullptr; |
| |
| for (size_t i = 0; i < s.size(); i++) { |
| if (s[i] == '*') { |
| // Don't allow two **. |
| if (out->size() == 0 || |
| (*out)[out->size() - 1].type != Pattern::Subrange::ANYTHING) |
| out->push_back(Pattern::Subrange(Pattern::Subrange::ANYTHING)); |
| last_literal = nullptr; |
| } else if (s[i] == '\\') { |
| if (i < s.size() - 1 && s[i + 1] == 'b') { |
| // "\b" means path boundary. |
| i++; |
| out->push_back(Pattern::Subrange(Pattern::Subrange::PATH_BOUNDARY)); |
| last_literal = nullptr; |
| } else { |
| // Backslash + anything else means that literal char. |
| if (!last_literal) { |
| out->push_back(Pattern::Subrange(Pattern::Subrange::LITERAL)); |
| last_literal = &(*out)[out->size() - 1]; |
| } |
| if (i < s.size() - 1) { |
| i++; |
| last_literal->literal.push_back(s[i]); |
| } else { |
| // Single backslash at end, use literal backslash. |
| last_literal->literal.push_back('\\'); |
| } |
| } |
| } else { |
| if (!last_literal) { |
| out->push_back(Pattern::Subrange(Pattern::Subrange::LITERAL)); |
| last_literal = &(*out)[out->size() - 1]; |
| } |
| last_literal->literal.push_back(s[i]); |
| } |
| } |
| } |
| |
| } // namespace |
| |
| Pattern::Pattern(const std::string& s) { |
| ParsePattern(s, &subranges_); |
| is_suffix_ = |
| (subranges_.size() == 2 && subranges_[0].type == Subrange::ANYTHING && |
| subranges_[1].type == Subrange::LITERAL); |
| } |
| |
| Pattern::Pattern(const Pattern& other) = default; |
| |
| Pattern::~Pattern() = default; |
| |
| bool Pattern::MatchesString(const std::string& s) const { |
| // Empty pattern matches only empty string. |
| if (subranges_.empty()) |
| return s.empty(); |
| |
| if (is_suffix_) { |
| const std::string& suffix = subranges_[1].literal; |
| if (suffix.size() > s.size()) |
| return false; // Too short. |
| return s.compare(s.size() - suffix.size(), suffix.size(), suffix) == 0; |
| } |
| |
| return RecursiveMatch(s, 0, 0, true); |
| } |
| |
| // We assume the number of ranges is small so recursive is always reasonable. |
| // Could be optimized to only be recursive for *. |
| bool Pattern::RecursiveMatch(const std::string& s, |
| size_t begin_char, |
| size_t subrange_index, |
| bool allow_implicit_path_boundary) const { |
| if (subrange_index >= subranges_.size()) { |
| // Hit the end of our subranges, the text should also be at the end for a |
| // match. |
| return begin_char == s.size(); |
| } |
| |
| const Subrange& sr = subranges_[subrange_index]; |
| switch (sr.type) { |
| case Subrange::LITERAL: { |
| if (s.size() - begin_char < sr.literal.size()) |
| return false; // Not enough room. |
| if (s.compare(begin_char, sr.literal.size(), sr.literal) != 0) |
| return false; // Literal doesn't match. |
| |
| // Recursively check the next one. |
| return RecursiveMatch(s, begin_char + sr.literal.size(), |
| subrange_index + 1, true); |
| } |
| |
| case Subrange::PATH_BOUNDARY: { |
| // When we can accept an implicit path boundary, we have to check both |
| // a match of the literal and the implicit one. |
| if (allow_implicit_path_boundary && |
| (begin_char == 0 || begin_char == s.size())) { |
| // At implicit path boundary, see if the rest of the pattern matches. |
| if (RecursiveMatch(s, begin_char, subrange_index + 1, false)) |
| return true; |
| } |
| |
| // Check for a literal "/". |
| if (begin_char < s.size() && s[begin_char] == '/') { |
| // At explicit boundary, see if the rest of the pattern matches. |
| if (RecursiveMatch(s, begin_char + 1, subrange_index + 1, true)) |
| return true; |
| } |
| return false; |
| } |
| |
| case Subrange::ANYTHING: { |
| if (subrange_index == subranges_.size() - 1) |
| return true; // * at the end, consider it matching. |
| |
| size_t min_next_size = sr.MinSize(); |
| |
| // We don't care about exactly what matched as long as there was a match, |
| // so we can do this front-to-back. If we needed the match, we would |
| // normally want "*" to be greedy so would work backwards. |
| for (size_t i = begin_char; i < s.size() - min_next_size; i++) { |
| // Note: this could probably be faster by detecting the type of the |
| // next match in advance and checking for a match in this loop rather |
| // than doing a full recursive call for each character. |
| if (RecursiveMatch(s, i, subrange_index + 1, true)) |
| return true; |
| } |
| return false; |
| } |
| |
| default: |
| NOTREACHED(); |
| } |
| |
| return false; |
| } |
| |
| PatternList::PatternList() = default; |
| |
| PatternList::PatternList(const PatternList& other) = default; |
| |
| PatternList::~PatternList() = default; |
| |
| void PatternList::Append(const Pattern& pattern) { |
| patterns_.push_back(pattern); |
| } |
| |
| void PatternList::SetFromValue(const Value& v, Err* err) { |
| patterns_.clear(); |
| |
| if (v.type() != Value::LIST) { |
| *err = Err(v.origin(), "This value must be a list."); |
| return; |
| } |
| |
| const std::vector<Value>& list = v.list_value(); |
| for (const auto& elem : list) { |
| if (!elem.VerifyTypeIs(Value::STRING, err)) |
| return; |
| patterns_.push_back(Pattern(elem.string_value())); |
| } |
| } |
| |
| bool PatternList::MatchesString(const std::string& s) const { |
| for (const auto& pattern : patterns_) { |
| if (pattern.MatchesString(s)) |
| return true; |
| } |
| return false; |
| } |
| |
| bool PatternList::MatchesValue(const Value& v) const { |
| if (v.type() == Value::STRING) |
| return MatchesString(v.string_value()); |
| return false; |
| } |