xref: /freebsd-src/contrib/llvm-project/clang/lib/Format/MatchFilePath.cpp (revision cb14a3fe5122c879eae1fb480ed7ce82a699ddb6)
//===--- MatchFilePath.cpp - Match file path with pattern -------*- C++ -*-===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
///
/// \file
/// This file implements the functionality of matching a file path name to
/// a pattern, similar to the POSIX fnmatch() function.
///
//===----------------------------------------------------------------------===//
14*cb14a3feSDimitry Andric 
15*cb14a3feSDimitry Andric #include "MatchFilePath.h"
16*cb14a3feSDimitry Andric 
17*cb14a3feSDimitry Andric using namespace llvm;
18*cb14a3feSDimitry Andric 
19*cb14a3feSDimitry Andric namespace clang {
20*cb14a3feSDimitry Andric namespace format {
21*cb14a3feSDimitry Andric 
22*cb14a3feSDimitry Andric // Check whether `FilePath` matches `Pattern` based on POSIX (1003.1-2008)
23*cb14a3feSDimitry Andric // 2.13.1, 2.13.2, and Rule 1 of 2.13.3.
24*cb14a3feSDimitry Andric bool matchFilePath(StringRef Pattern, StringRef FilePath) {
25*cb14a3feSDimitry Andric   assert(!Pattern.empty());
26*cb14a3feSDimitry Andric   assert(!FilePath.empty());
27*cb14a3feSDimitry Andric 
28*cb14a3feSDimitry Andric   // No match if `Pattern` ends with a non-meta character not equal to the last
29*cb14a3feSDimitry Andric   // character of `FilePath`.
30*cb14a3feSDimitry Andric   if (const auto C = Pattern.back(); !strchr("?*]", C) && C != FilePath.back())
31*cb14a3feSDimitry Andric     return false;
32*cb14a3feSDimitry Andric 
33*cb14a3feSDimitry Andric   constexpr auto Separator = '/';
34*cb14a3feSDimitry Andric   const auto EOP = Pattern.size();  // End of `Pattern`.
35*cb14a3feSDimitry Andric   const auto End = FilePath.size(); // End of `FilePath`.
36*cb14a3feSDimitry Andric   unsigned I = 0;                   // Index to `Pattern`.
37*cb14a3feSDimitry Andric 
38*cb14a3feSDimitry Andric   for (unsigned J = 0; J < End; ++J) {
39*cb14a3feSDimitry Andric     if (I == EOP)
40*cb14a3feSDimitry Andric       return false;
41*cb14a3feSDimitry Andric 
42*cb14a3feSDimitry Andric     switch (const auto F = FilePath[J]; Pattern[I]) {
43*cb14a3feSDimitry Andric     case '\\':
44*cb14a3feSDimitry Andric       if (++I == EOP || F != Pattern[I])
45*cb14a3feSDimitry Andric         return false;
46*cb14a3feSDimitry Andric       break;
47*cb14a3feSDimitry Andric     case '?':
48*cb14a3feSDimitry Andric       if (F == Separator)
49*cb14a3feSDimitry Andric         return false;
50*cb14a3feSDimitry Andric       break;
51*cb14a3feSDimitry Andric     case '*': {
52*cb14a3feSDimitry Andric       while (++I < EOP && Pattern[I] == '*') { // Skip consecutive stars.
53*cb14a3feSDimitry Andric       }
54*cb14a3feSDimitry Andric       const auto K = FilePath.find(Separator, J); // Index of next `Separator`.
55*cb14a3feSDimitry Andric       const bool NoMoreSeparatorsInFilePath = K == StringRef::npos;
56*cb14a3feSDimitry Andric       if (I == EOP) // `Pattern` ends with a star.
57*cb14a3feSDimitry Andric         return NoMoreSeparatorsInFilePath;
58*cb14a3feSDimitry Andric       // `Pattern` ends with a lone backslash.
59*cb14a3feSDimitry Andric       if (Pattern[I] == '\\' && ++I == EOP)
60*cb14a3feSDimitry Andric         return false;
61*cb14a3feSDimitry Andric       // The star is followed by a (possibly escaped) `Separator`.
62*cb14a3feSDimitry Andric       if (Pattern[I] == Separator) {
63*cb14a3feSDimitry Andric         if (NoMoreSeparatorsInFilePath)
64*cb14a3feSDimitry Andric           return false;
65*cb14a3feSDimitry Andric         J = K; // Skip to next `Separator` in `FilePath`.
66*cb14a3feSDimitry Andric         break;
67*cb14a3feSDimitry Andric       }
68*cb14a3feSDimitry Andric       // Recurse.
69*cb14a3feSDimitry Andric       for (auto Pat = Pattern.substr(I); J < End && FilePath[J] != Separator;
70*cb14a3feSDimitry Andric            ++J) {
71*cb14a3feSDimitry Andric         if (matchFilePath(Pat, FilePath.substr(J)))
72*cb14a3feSDimitry Andric           return true;
73*cb14a3feSDimitry Andric       }
74*cb14a3feSDimitry Andric       return false;
75*cb14a3feSDimitry Andric     }
76*cb14a3feSDimitry Andric     case '[':
77*cb14a3feSDimitry Andric       // Skip e.g. `[!]`.
78*cb14a3feSDimitry Andric       if (I + 3 < EOP || (I + 3 == EOP && Pattern[I + 1] != '!')) {
79*cb14a3feSDimitry Andric         // Skip unpaired `[`, brackets containing slashes, and `[]`.
80*cb14a3feSDimitry Andric         if (const auto K = Pattern.find_first_of("]/", I + 1);
81*cb14a3feSDimitry Andric             K != StringRef::npos && Pattern[K] == ']' && K > I + 1) {
82*cb14a3feSDimitry Andric           if (F == Separator)
83*cb14a3feSDimitry Andric             return false;
84*cb14a3feSDimitry Andric           ++I; // After the `[`.
85*cb14a3feSDimitry Andric           bool Negated = false;
86*cb14a3feSDimitry Andric           if (Pattern[I] == '!') {
87*cb14a3feSDimitry Andric             Negated = true;
88*cb14a3feSDimitry Andric             ++I; // After the `!`.
89*cb14a3feSDimitry Andric           }
90*cb14a3feSDimitry Andric           bool Match = false;
91*cb14a3feSDimitry Andric           do {
92*cb14a3feSDimitry Andric             if (I + 2 < K && Pattern[I + 1] == '-') {
93*cb14a3feSDimitry Andric               Match = Pattern[I] <= F && F <= Pattern[I + 2];
94*cb14a3feSDimitry Andric               I += 3; // After the range, e.g. `A-Z`.
95*cb14a3feSDimitry Andric             } else {
96*cb14a3feSDimitry Andric               Match = F == Pattern[I++];
97*cb14a3feSDimitry Andric             }
98*cb14a3feSDimitry Andric           } while (!Match && I < K);
99*cb14a3feSDimitry Andric           if (Negated ? Match : !Match)
100*cb14a3feSDimitry Andric             return false;
101*cb14a3feSDimitry Andric           I = K + 1; // After the `]`.
102*cb14a3feSDimitry Andric           continue;
103*cb14a3feSDimitry Andric         }
104*cb14a3feSDimitry Andric       }
105*cb14a3feSDimitry Andric       [[fallthrough]]; // Match `[` literally.
106*cb14a3feSDimitry Andric     default:
107*cb14a3feSDimitry Andric       if (F != Pattern[I])
108*cb14a3feSDimitry Andric         return false;
109*cb14a3feSDimitry Andric     }
110*cb14a3feSDimitry Andric 
111*cb14a3feSDimitry Andric     ++I;
112*cb14a3feSDimitry Andric   }
113*cb14a3feSDimitry Andric 
114*cb14a3feSDimitry Andric   // Match trailing stars with null strings.
115*cb14a3feSDimitry Andric   while (I < EOP && Pattern[I] == '*')
116*cb14a3feSDimitry Andric     ++I;
117*cb14a3feSDimitry Andric 
118*cb14a3feSDimitry Andric   return I == EOP;
119*cb14a3feSDimitry Andric }
120*cb14a3feSDimitry Andric 
121*cb14a3feSDimitry Andric } // namespace format
122*cb14a3feSDimitry Andric } // namespace clang
123