View Javadoc
1   /*
2    * Copyright (C) 2014, Andrey Loskutov <loskutov@gmx.de>
3    * and other copyright owners as documented in the project's IP log.
4    *
5    * This program and the accompanying materials are made available
6    * under the terms of the Eclipse Distribution License v1.0 which
7    * accompanies this distribution, is reproduced below, and is
8    * available at http://www.eclipse.org/org/documents/edl-v10.php
9    *
10   * All rights reserved.
11   *
12   * Redistribution and use in source and binary forms, with or
13   * without modification, are permitted provided that the following
14   * conditions are met:
15   *
16   * - Redistributions of source code must retain the above copyright
17   *   notice, this list of conditions and the following disclaimer.
18   *
19   * - Redistributions in binary form must reproduce the above
20   *   copyright notice, this list of conditions and the following
21   *   disclaimer in the documentation and/or other materials provided
22   *   with the distribution.
23   *
24   * - Neither the name of the Eclipse Foundation, Inc. nor the
25   *   names of its contributors may be used to endorse or promote
26   *   products derived from this software without specific prior
27   *   written permission.
28   *
29   * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND
30   * CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,
31   * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
32   * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
33   * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
34   * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
35   * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
36   * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
37   * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
38   * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
39   * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
40   * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
41   * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
42   */
43  package org.eclipse.jgit.ignore.internal;
44  
45  import static org.eclipse.jgit.ignore.internal.Strings.checkWildCards;
46  import static org.eclipse.jgit.ignore.internal.Strings.count;
47  import static org.eclipse.jgit.ignore.internal.Strings.getPathSeparator;
48  import static org.eclipse.jgit.ignore.internal.Strings.isWildCard;
49  import static org.eclipse.jgit.ignore.internal.Strings.split;
50  
51  import java.util.ArrayList;
52  import java.util.List;
53  
54  import org.eclipse.jgit.errors.InvalidPatternException;
55  import org.eclipse.jgit.ignore.internal.Strings.PatternState;
56  
57  /**
 * Matcher built from patterns consisting of multiple path segments.
59   * <p>
60   * This class is immutable and thread safe.
61   */
62  public class PathMatcher extends AbstractMatcher {
63  
64  	private static final WildMatcher WILD = WildMatcher.INSTANCE;
65  
66  	private final List<IMatcher> matchers;
67  
68  	private final char slash;
69  
70  	private final boolean beginning;
71  
72  	private PathMatcher(String pattern, Character pathSeparator,
73  			boolean dirOnly)
74  			throws InvalidPatternException {
75  		super(pattern, dirOnly);
76  		slash = getPathSeparator(pathSeparator);
77  		beginning = pattern.indexOf(slash) == 0;
78  		if (isSimplePathWithSegments(pattern))
79  			matchers = null;
80  		else
81  			matchers = createMatchers(split(pattern, slash), pathSeparator,
82  					dirOnly);
83  	}
84  
85  	private boolean isSimplePathWithSegments(String path) {
86  		return !isWildCard(path) && path.indexOf('\\') < 0
87  				&& count(path, slash, true) > 0;
88  	}
89  
90  	private static List<IMatcher> createMatchers(List<String> segments,
91  			Character pathSeparator, boolean dirOnly)
92  			throws InvalidPatternException {
93  		List<IMatcher> matchers = new ArrayList<>(segments.size());
94  		for (int i = 0; i < segments.size(); i++) {
95  			String segment = segments.get(i);
96  			IMatcher matcher = createNameMatcher0(segment, pathSeparator,
97  					dirOnly);
98  			if (matcher == WILD && i > 0
99  					&& matchers.get(matchers.size() - 1) == WILD)
100 				// collapse wildmatchers **/** is same as **
101 				continue;
102 			matchers.add(matcher);
103 		}
104 		return matchers;
105 	}
106 
107 	/**
108 	 *
109 	 * @param pattern
110 	 * @param pathSeparator
111 	 *            if this parameter isn't null then this character will not
112 	 *            match at wildcards(* and ? are wildcards).
113 	 * @param dirOnly
114 	 * @return never null
115 	 * @throws InvalidPatternException
116 	 */
117 	public static IMatcher createPathMatcher(String pattern,
118 			Character pathSeparator, boolean dirOnly)
119 			throws InvalidPatternException {
120 		pattern = trim(pattern);
121 		char slash = Strings.getPathSeparator(pathSeparator);
122 		// ignore possible leading and trailing slash
123 		int slashIdx = pattern.indexOf(slash, 1);
124 		if (slashIdx > 0 && slashIdx < pattern.length() - 1)
125 			return new PathMatcher(pattern, pathSeparator, dirOnly);
126 		return createNameMatcher0(pattern, pathSeparator, dirOnly);
127 	}
128 
129 	/**
130 	 * Trim trailing spaces, unless they are escaped with backslash, see
131 	 * https://www.kernel.org/pub/software/scm/git/docs/gitignore.html
132 	 *
133 	 * @param pattern
134 	 *            non null
135 	 * @return trimmed pattern
136 	 */
137 	private static String trim(String pattern) {
138 		while (pattern.length() > 0
139 				&& pattern.charAt(pattern.length() - 1) == ' ') {
140 			if (pattern.length() > 1
141 					&& pattern.charAt(pattern.length() - 2) == '\\') {
142 				// last space was escaped by backslash: remove backslash and
143 				// keep space
144 				pattern = pattern.substring(0, pattern.length() - 2) + " "; //$NON-NLS-1$
145 				return pattern;
146 			}
147 			pattern = pattern.substring(0, pattern.length() - 1);
148 		}
149 		return pattern;
150 	}
151 
152 	private static IMatcher createNameMatcher0(String segment,
153 			Character pathSeparator, boolean dirOnly)
154 			throws InvalidPatternException {
155 		// check if we see /** or ** segments => double star pattern
156 		if (WildMatcher.WILDMATCH.equals(segment)
157 				|| WildMatcher.WILDMATCH2.equals(segment))
158 			return WILD;
159 
160 		PatternState state = checkWildCards(segment);
161 		switch (state) {
162 		case LEADING_ASTERISK_ONLY:
163 			return new LeadingAsteriskMatcher(segment, pathSeparator, dirOnly);
164 		case TRAILING_ASTERISK_ONLY:
165 			return new TrailingAsteriskMatcher(segment, pathSeparator, dirOnly);
166 		case COMPLEX:
167 			return new WildCardMatcher(segment, pathSeparator, dirOnly);
168 		default:
169 			return new NameMatcher(segment, pathSeparator, dirOnly, true);
170 		}
171 	}
172 
173 	@Override
174 	public boolean matches(String path, boolean assumeDirectory,
175 			boolean pathMatch) {
176 		if (matchers == null) {
177 			return simpleMatch(path, assumeDirectory, pathMatch);
178 		}
179 		return iterate(path, 0, path.length(), assumeDirectory, pathMatch);
180 	}
181 
182 	/*
183 	 * Stupid but fast string comparison: the case where we don't have to match
184 	 * wildcards or single segments (mean: this is multi-segment path which must
185 	 * be at the beginning of the another string)
186 	 */
187 	private boolean simpleMatch(String path, boolean assumeDirectory,
188 			boolean pathMatch) {
189 		boolean hasSlash = path.indexOf(slash) == 0;
190 		if (beginning && !hasSlash) {
191 			path = slash + path;
192 		}
193 		if (!beginning && hasSlash) {
194 			path = path.substring(1);
195 		}
196 		if (path.equals(pattern)) {
197 			// Exact match: must meet directory expectations
198 			return !dirOnly || assumeDirectory;
199 		}
200 		/*
201 		 * Add slashes for startsWith check. This avoids matching e.g.
202 		 * "/src/new" to /src/newfile" but allows "/src/new" to match
203 		 * "/src/new/newfile", as is the git standard
204 		 */
205 		String prefix = pattern + slash;
206 		if (pathMatch) {
207 			return path.equals(prefix) && (!dirOnly || assumeDirectory);
208 		}
209 		if (path.startsWith(prefix)) {
210 			return true;
211 		}
212 		return false;
213 	}
214 
215 	@Override
216 	public boolean matches(String segment, int startIncl, int endExcl,
217 			boolean assumeDirectory) {
218 		throw new UnsupportedOperationException(
219 				"Path matcher works only on entire paths"); //$NON-NLS-1$
220 	}
221 
	/**
	 * Matches the path segment by segment against {@link #matchers}.
	 * <p>
	 * The path is cut at each occurrence of {@link #slash}; every non-empty
	 * segment is handed to the matcher at the current index. When a segment
	 * fails to match after a wild matcher has matched, matching resumes with
	 * the matcher following that wild matcher at the recorded backtrack
	 * position.
	 *
	 * @param path
	 *            the path to test
	 * @param startIncl
	 *            index in {@code path} at which scanning starts
	 * @param endExcl
	 *            exclusive end index of the last segment. NOTE(review): the
	 *            separator search itself is not bounded by this value; the
	 *            only caller visible here passes {@code path.length()}
	 * @param assumeDirectory
	 *            forwarded to the segment matchers; also required to be true
	 *            for a directory-only pattern to match on the last segment
	 * @param pathMatch
	 *            if {@code false}, it is enough that all matchers match a
	 *            prefix of the path; if {@code true}, such a prefix match is
	 *            accepted only in the cases handled in the loop below
	 * @return {@code true} if the path matches
	 */
	private boolean iterate(final String path, final int startIncl,
			final int endExcl, boolean assumeDirectory, boolean pathMatch) {
		// index of the matcher that is tried next
		int matcher = 0;
		// scan position; after indexOf below, the index of the separator
		// which ends the current segment
		int right = startIncl;
		// result of the most recent segment match
		boolean match = false;
		// index of the wild matcher that matched most recently, -1 if none
		int lastWildmatch = -1;
		// ** matches may get extended if a later match fails. When that
		// happens, we must extend the ** by exactly one segment.
		// wildmatchBacktrackPos records the end of the segment after a **
		// match, so that we can reset correctly.
		int wildmatchBacktrackPos = -1;
		while (true) {
			// start of the current segment
			int left = right;
			right = path.indexOf(slash, right);
			if (right == -1) {
				// no further separator: [left, endExcl) is the last segment
				if (left < endExcl) {
					match = matches(matcher, path, left, endExcl,
							assumeDirectory);
				} else {
					// a/** should not match a/ or a
					match = match && matchers.get(matcher) != WILD;
				}
				if (match) {
					if (matcher < matchers.size() - 1
							&& matchers.get(matcher) == WILD) {
						// ** can match *nothing*: a/**/b match also a/b
						matcher++;
						match = matches(matcher, path, left, endExcl,
								assumeDirectory);
					} else if (dirOnly && !assumeDirectory) {
						// Directory expectations not met
						return false;
					}
				}
				// success only if the matcher in use is the last one
				return match && matcher + 1 == matchers.size();
			}
			if (wildmatchBacktrackPos < 0) {
				// remember the end of the first segment seen since the
				// position was last reset
				wildmatchBacktrackPos = right;
			}
			if (right - left > 0) {
				match = matches(matcher, path, left, right, assumeDirectory);
			} else {
				// path starts with slash???
				// empty segment: step over the separator without consuming
				// a matcher
				right++;
				continue;
			}
			if (match) {
				boolean wasWild = matchers.get(matcher) == WILD;
				if (wasWild) {
					lastWildmatch = matcher;
					wildmatchBacktrackPos = -1;
					// ** can match *nothing*: a/**/b match also a/b
					// (together with the right++ at the end of the loop this
					// makes the next matcher see the same segment again)
					right = left - 1;
				}
				matcher++;
				if (matcher == matchers.size()) {
					// We had a prefix match here.
					if (!pathMatch) {
						return true;
					} else {
						if (right == endExcl - 1) {
							// Extra slash at the end: actually a full match.
							// Must meet directory expectations
							return !dirOnly || assumeDirectory;
						}
						// Prefix matches only if pattern ended with /**
						if (wasWild) {
							return true;
						}
						if (lastWildmatch >= 0) {
							// Consider pattern **/x and input x/x.
							// We've matched the prefix x/ so far: we
							// must try to extend the **!
							matcher = lastWildmatch + 1;
							right = wildmatchBacktrackPos;
							wildmatchBacktrackPos = -1;
						} else {
							return false;
						}
					}
				}
			} else if (lastWildmatch != -1) {
				// mismatch after a **: retry with the matcher following the
				// ** from the recorded backtrack position
				matcher = lastWildmatch + 1;
				right = wildmatchBacktrackPos;
				wildmatchBacktrackPos = -1;
			} else {
				// mismatch and no ** to fall back to
				return false;
			}
			// step over the separator to the start of the next segment
			right++;
		}
	}
313 
314 	private boolean matches(int matcherIdx, String path, int startIncl,
315 			int endExcl,
316 			boolean assumeDirectory) {
317 		IMatcher matcher = matchers.get(matcherIdx);
318 		return matcher.matches(path, startIncl, endExcl, assumeDirectory);
319 	}
320 }