| 
									
										
										
										
											1995-01-27 02:41:45 +00:00
										 |  |  | """Filename matching with shell patterns.
 | 
					
						
							| 
									
										
										
										
											1992-01-12 23:29:29 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											1995-01-27 02:41:45 +00:00
										 |  |  | fnmatch(FILENAME, PATTERN) matches according to the local convention. | 
					
						
							|  |  |  | fnmatchcase(FILENAME, PATTERN) always takes case into account. | 
					
						
							| 
									
										
										
										
											1992-01-12 23:29:29 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											1995-01-27 02:41:45 +00:00
										 |  |  | The functions operate by translating the pattern into a regular | 
					
						
							|  |  |  | expression.  They cache the compiled regular expressions for speed. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | The function translate(PATTERN) returns a regular expression | 
					
						
							|  |  |  | corresponding to PATTERN.  (It does not compile it.) | 
					
						
							|  |  |  | """
 | 
					
						
							| 
									
										
										
										
											2010-07-23 16:22:25 +00:00
										 |  |  | import os | 
					
						
							|  |  |  | import posixpath | 
					
						
							| 
									
										
										
										
											1997-10-22 21:00:49 +00:00
										 |  |  | import re | 
					
						
							| 
									
										
										
										
											2010-08-13 16:26:40 +00:00
										 |  |  | import functools | 
					
						
							| 
									
										
										
										
											1997-10-22 21:00:49 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-08-13 16:26:40 +00:00
										 |  |  | __all__ = ["filter", "fnmatch", "fnmatchcase", "translate"] | 
					
						
							| 
									
										
										
										
											2010-07-23 16:22:25 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-05-11 21:19:20 -05:00
										 |  |  | # Build a thread-safe incrementing counter to help create unique regexp group | 
					
						
							|  |  |  | # names across calls. | 
					
						
							|  |  |  | from itertools import count | 
					
						
							|  |  |  | _nextgroupnum = count().__next__ | 
					
						
							|  |  |  | del count | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											1991-01-01 18:11:14 +00:00
										 |  |  | def fnmatch(name, pat): | 
					
						
							| 
									
										
										
										
											2001-01-14 23:36:06 +00:00
										 |  |  |     """Test whether FILENAME matches PATTERN.
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     Patterns are Unix shell style: | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     *       matches everything | 
					
						
							|  |  |  |     ?       matches any single character | 
					
						
							|  |  |  |     [seq]   matches any character in seq | 
					
						
							|  |  |  |     [!seq]  matches any char not in seq | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     An initial period in FILENAME is not special. | 
					
						
							|  |  |  |     Both FILENAME and PATTERN are first case-normalized | 
					
						
							|  |  |  |     if the operating system requires it. | 
					
						
							|  |  |  |     If you don't want this, use fnmatchcase(FILENAME, PATTERN). | 
					
						
							|  |  |  |     """
 | 
					
						
							|  |  |  |     name = os.path.normcase(name) | 
					
						
							|  |  |  |     pat = os.path.normcase(pat) | 
					
						
							|  |  |  |     return fnmatchcase(name, pat) | 
					
						
							| 
									
										
										
										
											1995-01-27 02:41:45 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-02-17 01:33:37 -08:00
										 |  |  | @functools.lru_cache(maxsize=256, typed=True) | 
					
						
							| 
									
										
										
										
											2011-10-20 09:22:10 -07:00
										 |  |  | def _compile_pattern(pat): | 
					
						
							|  |  |  |     if isinstance(pat, bytes): | 
					
						
							| 
									
										
										
										
											2010-08-13 16:26:40 +00:00
										 |  |  |         pat_str = str(pat, 'ISO-8859-1') | 
					
						
							|  |  |  |         res_str = translate(pat_str) | 
					
						
							|  |  |  |         res = bytes(res_str, 'ISO-8859-1') | 
					
						
							|  |  |  |     else: | 
					
						
							|  |  |  |         res = translate(pat) | 
					
						
							|  |  |  |     return re.compile(res).match | 
					
						
							| 
									
										
										
										
											2010-07-23 16:22:25 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2001-06-06 06:24:38 +00:00
										 |  |  | def filter(names, pat): | 
					
						
							| 
									
										
										
										
											2020-12-18 16:10:20 -03:00
										 |  |  |     """Construct a list from those elements of the iterable NAMES that match PAT.""" | 
					
						
							| 
									
										
										
										
											2008-10-02 18:55:37 +00:00
										 |  |  |     result = [] | 
					
						
							|  |  |  |     pat = os.path.normcase(pat) | 
					
						
							| 
									
										
										
										
											2011-10-20 09:22:10 -07:00
										 |  |  |     match = _compile_pattern(pat) | 
					
						
							| 
									
										
										
										
											2001-06-06 06:24:38 +00:00
										 |  |  |     if os.path is posixpath: | 
					
						
							|  |  |  |         # normcase on posix is NOP. Optimize it away from the loop. | 
					
						
							|  |  |  |         for name in names: | 
					
						
							|  |  |  |             if match(name): | 
					
						
							|  |  |  |                 result.append(name) | 
					
						
							|  |  |  |     else: | 
					
						
							|  |  |  |         for name in names: | 
					
						
							|  |  |  |             if match(os.path.normcase(name)): | 
					
						
							|  |  |  |                 result.append(name) | 
					
						
							|  |  |  |     return result | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											1995-01-27 02:41:45 +00:00
										 |  |  | def fnmatchcase(name, pat): | 
					
						
							| 
									
										
										
										
											2001-01-14 23:36:06 +00:00
										 |  |  |     """Test whether FILENAME matches PATTERN, including case.
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     This is a version of fnmatch() which doesn't case-normalize | 
					
						
							|  |  |  |     its arguments. | 
					
						
							|  |  |  |     """
 | 
					
						
							| 
									
										
										
										
											2011-10-20 09:22:10 -07:00
										 |  |  |     match = _compile_pattern(pat) | 
					
						
							| 
									
										
										
										
											2008-10-02 18:55:37 +00:00
										 |  |  |     return match(name) is not None | 
					
						
							| 
									
										
										
										
											1991-01-01 18:11:14 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-07-23 16:22:25 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											1992-01-12 23:29:29 +00:00
										 |  |  | def translate(pat): | 
					
						
							| 
									
										
										
										
											2001-01-14 23:36:06 +00:00
										 |  |  |     """Translate a shell PATTERN to a regular expression.
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     There is no way to quote meta-characters. | 
					
						
							|  |  |  |     """
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-05-05 21:28:24 -05:00
										 |  |  |     STAR = object() | 
					
						
							|  |  |  |     res = [] | 
					
						
							|  |  |  |     add = res.append | 
					
						
							| 
									
										
										
										
											2001-01-14 23:36:06 +00:00
										 |  |  |     i, n = 0, len(pat) | 
					
						
							|  |  |  |     while i < n: | 
					
						
							|  |  |  |         c = pat[i] | 
					
						
							|  |  |  |         i = i+1 | 
					
						
							|  |  |  |         if c == '*': | 
					
						
							| 
									
										
										
										
											2020-05-05 21:28:24 -05:00
										 |  |  |             # compress consecutive `*` into one | 
					
						
							|  |  |  |             if (not res) or res[-1] is not STAR: | 
					
						
							|  |  |  |                 add(STAR) | 
					
						
							| 
									
										
										
										
											2001-01-14 23:36:06 +00:00
										 |  |  |         elif c == '?': | 
					
						
							| 
									
										
										
										
											2020-05-05 21:28:24 -05:00
										 |  |  |             add('.') | 
					
						
							| 
									
										
										
										
											2001-01-14 23:36:06 +00:00
										 |  |  |         elif c == '[': | 
					
						
							|  |  |  |             j = i | 
					
						
							|  |  |  |             if j < n and pat[j] == '!': | 
					
						
							|  |  |  |                 j = j+1 | 
					
						
							|  |  |  |             if j < n and pat[j] == ']': | 
					
						
							|  |  |  |                 j = j+1 | 
					
						
							|  |  |  |             while j < n and pat[j] != ']': | 
					
						
							|  |  |  |                 j = j+1 | 
					
						
							|  |  |  |             if j >= n: | 
					
						
							| 
									
										
										
										
											2020-05-05 21:28:24 -05:00
										 |  |  |                 add('\\[') | 
					
						
							| 
									
										
										
										
											2001-01-14 23:36:06 +00:00
										 |  |  |             else: | 
					
						
							| 
									
										
										
										
											2018-02-09 13:30:19 +02:00
										 |  |  |                 stuff = pat[i:j] | 
					
						
							|  |  |  |                 if '--' not in stuff: | 
					
						
							|  |  |  |                     stuff = stuff.replace('\\', r'\\') | 
					
						
							|  |  |  |                 else: | 
					
						
							|  |  |  |                     chunks = [] | 
					
						
							|  |  |  |                     k = i+2 if pat[i] == '!' else i+1 | 
					
						
							|  |  |  |                     while True: | 
					
						
							|  |  |  |                         k = pat.find('-', k, j) | 
					
						
							|  |  |  |                         if k < 0: | 
					
						
							|  |  |  |                             break | 
					
						
							|  |  |  |                         chunks.append(pat[i:k]) | 
					
						
							|  |  |  |                         i = k+1 | 
					
						
							|  |  |  |                         k = k+3 | 
					
						
							|  |  |  |                     chunks.append(pat[i:j]) | 
					
						
							|  |  |  |                     # Escape backslashes and hyphens for set difference (--). | 
					
						
							|  |  |  |                     # Hyphens that create ranges shouldn't be escaped. | 
					
						
							|  |  |  |                     stuff = '-'.join(s.replace('\\', r'\\').replace('-', r'\-') | 
					
						
							|  |  |  |                                      for s in chunks) | 
					
						
							|  |  |  |                 # Escape set operations (&&, ~~ and ||). | 
					
						
							|  |  |  |                 stuff = re.sub(r'([&~|])', r'\\\1', stuff) | 
					
						
							| 
									
										
										
										
											2001-01-14 23:36:06 +00:00
										 |  |  |                 i = j+1 | 
					
						
							|  |  |  |                 if stuff[0] == '!': | 
					
						
							| 
									
										
										
										
											2001-03-21 18:05:48 +00:00
										 |  |  |                     stuff = '^' + stuff[1:] | 
					
						
							| 
									
										
										
										
											2018-02-09 13:30:19 +02:00
										 |  |  |                 elif stuff[0] in ('^', '['): | 
					
						
							| 
									
										
										
										
											2001-03-21 18:05:48 +00:00
										 |  |  |                     stuff = '\\' + stuff | 
					
						
							| 
									
										
										
										
											2020-05-05 21:28:24 -05:00
										 |  |  |                 add(f'[{stuff}]') | 
					
						
							| 
									
										
										
										
											2001-01-14 23:36:06 +00:00
										 |  |  |         else: | 
					
						
							| 
									
										
										
										
											2020-05-05 21:28:24 -05:00
										 |  |  |             add(re.escape(c)) | 
					
						
							|  |  |  |     assert i == n | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     # Deal with STARs. | 
					
						
							|  |  |  |     inp = res | 
					
						
							|  |  |  |     res = [] | 
					
						
							|  |  |  |     add = res.append | 
					
						
							|  |  |  |     i, n = 0, len(inp) | 
					
						
							|  |  |  |     # Fixed pieces at the start? | 
					
						
							|  |  |  |     while i < n and inp[i] is not STAR: | 
					
						
							|  |  |  |         add(inp[i]) | 
					
						
							|  |  |  |         i += 1 | 
					
						
							|  |  |  |     # Now deal with STAR fixed STAR fixed ... | 
					
						
							|  |  |  |     # For an interior `STAR fixed` pairing, we want to do a minimal | 
					
						
							|  |  |  |     # .*? match followed by `fixed`, with no possibility of backtracking. | 
					
						
							|  |  |  |     # We can't spell that directly, but can trick it into working by matching | 
					
						
							|  |  |  |     #    .*?fixed | 
					
						
							|  |  |  |     # in a lookahead assertion, save the matched part in a group, then | 
					
						
							|  |  |  |     # consume that group via a backreference. If the overall match fails, | 
					
						
							|  |  |  |     # the lookahead assertion won't try alternatives. So the translation is: | 
					
						
							| 
									
										
										
										
											2020-05-11 21:19:20 -05:00
										 |  |  |     #     (?=(?P<name>.*?fixed))(?P=name) | 
					
						
							|  |  |  |     # Group names are created as needed: g0, g1, g2, ... | 
					
						
							|  |  |  |     # The numbers are obtained from _nextgroupnum() to ensure they're unique | 
					
						
							|  |  |  |     # across calls and across threads. This is because people rely on the | 
					
						
							|  |  |  |     # undocumented ability to join multiple translate() results together via | 
					
						
							|  |  |  |     # "|" to build large regexps matching "one of many" shell patterns. | 
					
						
							| 
									
										
										
										
											2020-05-05 21:28:24 -05:00
										 |  |  |     while i < n: | 
					
						
							|  |  |  |         assert inp[i] is STAR | 
					
						
							|  |  |  |         i += 1 | 
					
						
							|  |  |  |         if i == n: | 
					
						
							|  |  |  |             add(".*") | 
					
						
							|  |  |  |             break | 
					
						
							|  |  |  |         assert inp[i] is not STAR | 
					
						
							|  |  |  |         fixed = [] | 
					
						
							|  |  |  |         while i < n and inp[i] is not STAR: | 
					
						
							|  |  |  |             fixed.append(inp[i]) | 
					
						
							|  |  |  |             i += 1 | 
					
						
							|  |  |  |         fixed = "".join(fixed) | 
					
						
							|  |  |  |         if i == n: | 
					
						
							|  |  |  |             add(".*") | 
					
						
							|  |  |  |             add(fixed) | 
					
						
							|  |  |  |         else: | 
					
						
							| 
									
										
										
										
											2020-05-11 21:19:20 -05:00
										 |  |  |             groupnum = _nextgroupnum() | 
					
						
							| 
									
										
										
										
											2020-05-05 21:28:24 -05:00
										 |  |  |             add(f"(?=(?P<g{groupnum}>.*?{fixed}))(?P=g{groupnum})") | 
					
						
							|  |  |  |     assert i == n | 
					
						
							|  |  |  |     res = "".join(res) | 
					
						
							|  |  |  |     return fr'(?s:{res})\Z' |