1 // Copyright (c) 2013 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
5 #include "tools/gn/pattern.h"
7 #include "tools/gn/value.h"
11 void ParsePattern(const std::string
& s
, std::vector
<Pattern::Subrange
>* out
) {
12 // Set when the last subrange is a literal so we can just append when we
13 // find another literal.
14 Pattern::Subrange
* last_literal
= nullptr;
16 for (size_t i
= 0; i
< s
.size(); i
++) {
18 // Don't allow two **.
19 if (out
->size() == 0 ||
20 (*out
)[out
->size() - 1].type
!= Pattern::Subrange::ANYTHING
)
21 out
->push_back(Pattern::Subrange(Pattern::Subrange::ANYTHING
));
22 last_literal
= nullptr;
23 } else if (s
[i
] == '\\') {
24 if (i
< s
.size() - 1 && s
[i
+ 1] == 'b') {
25 // "\b" means path boundary.
27 out
->push_back(Pattern::Subrange(Pattern::Subrange::PATH_BOUNDARY
));
28 last_literal
= nullptr;
30 // Backslash + anything else means that literal char.
32 out
->push_back(Pattern::Subrange(Pattern::Subrange::LITERAL
));
33 last_literal
= &(*out
)[out
->size() - 1];
35 if (i
< s
.size() - 1) {
37 last_literal
->literal
.push_back(s
[i
]);
39 // Single backslash at end, use literal backslash.
40 last_literal
->literal
.push_back('\\');
45 out
->push_back(Pattern::Subrange(Pattern::Subrange::LITERAL
));
46 last_literal
= &(*out
)[out
->size() - 1];
48 last_literal
->literal
.push_back(s
[i
]);
55 Pattern::Pattern(const std::string
& s
) {
56 ParsePattern(s
, &subranges_
);
58 (subranges_
.size() == 2 &&
59 subranges_
[0].type
== Subrange::ANYTHING
&&
60 subranges_
[1].type
== Subrange::LITERAL
);
66 bool Pattern::MatchesString(const std::string
& s
) const {
67 // Empty pattern matches only empty string.
68 if (subranges_
.empty())
72 const std::string
& suffix
= subranges_
[1].literal
;
73 if (suffix
.size() > s
.size())
74 return false; // Too short.
75 return s
.compare(s
.size() - suffix
.size(), suffix
.size(), suffix
) == 0;
78 return RecursiveMatch(s
, 0, 0, true);
81 // We assume the number of ranges is small so recursive is always reasonable.
82 // Could be optimized to only be recursive for *.
83 bool Pattern::RecursiveMatch(const std::string
& s
,
85 size_t subrange_index
,
86 bool allow_implicit_path_boundary
) const {
87 if (subrange_index
>= subranges_
.size()) {
88 // Hit the end of our subranges, the text should also be at the end for a
90 return begin_char
== s
.size();
93 const Subrange
& sr
= subranges_
[subrange_index
];
95 case Subrange::LITERAL
: {
96 if (s
.size() - begin_char
< sr
.literal
.size())
97 return false; // Not enough room.
98 if (s
.compare(begin_char
, sr
.literal
.size(), sr
.literal
) != 0)
99 return false; // Literal doesn't match.
101 // Recursively check the next one.
102 return RecursiveMatch(s
, begin_char
+ sr
.literal
.size(),
103 subrange_index
+ 1, true);
106 case Subrange::PATH_BOUNDARY
: {
107 // When we can accept an implicit path boundary, we have to check both
108 // a match of the literal and the implicit one.
109 if (allow_implicit_path_boundary
&&
110 (begin_char
== 0 || begin_char
== s
.size())) {
111 // At implicit path boundary, see if the rest of the pattern matches.
112 if (RecursiveMatch(s
, begin_char
, subrange_index
+ 1, false))
116 // Check for a literal "/".
117 if (begin_char
< s
.size() && s
[begin_char
] == '/') {
118 // At explicit boundary, see if the rest of the pattern matches.
119 if (RecursiveMatch(s
, begin_char
+ 1, subrange_index
+ 1, true))
125 case Subrange::ANYTHING
: {
126 if (subrange_index
== subranges_
.size() - 1)
127 return true; // * at the end, consider it matching.
129 size_t min_next_size
= sr
.MinSize();
131 // We don't care about exactly what matched as long as there was a match,
132 // so we can do this front-to-back. If we needed the match, we would
133 // normally want "*" to be greedy so would work backwards.
134 for (size_t i
= begin_char
; i
< s
.size() - min_next_size
; i
++) {
135 // Note: this could probably be faster by detecting the type of the
136 // next match in advance and checking for a match in this loop rather
137 // than doing a full recursive call for each character.
138 if (RecursiveMatch(s
, i
, subrange_index
+ 1, true))
151 PatternList::PatternList() {
154 PatternList::~PatternList() {
157 void PatternList::Append(const Pattern
& pattern
) {
158 patterns_
.push_back(pattern
);
161 void PatternList::SetFromValue(const Value
& v
, Err
* err
) {
164 if (v
.type() != Value::LIST
) {
165 *err
= Err(v
.origin(), "This value must be a list.");
169 const std::vector
<Value
>& list
= v
.list_value();
170 for (size_t i
= 0; i
< list
.size(); i
++) {
171 if (!list
[i
].VerifyTypeIs(Value::STRING
, err
))
173 patterns_
.push_back(Pattern(list
[i
].string_value()));
177 bool PatternList::MatchesString(const std::string
& s
) const {
178 for (size_t i
= 0; i
< patterns_
.size(); i
++) {
179 if (patterns_
[i
].MatchesString(s
))
185 bool PatternList::MatchesValue(const Value
& v
) const {
186 if (v
.type() == Value::STRING
)
187 return MatchesString(v
.string_value());