mirror of
https://github.com/python/cpython.git
synced 2025-10-24 02:13:49 +00:00

In translate(), generate unique group names across calls. This restores the undocumented ability to get a valid regexp by joining multiple translate() results via `|`.
175 lines
6.8 KiB
Python
175 lines
6.8 KiB
Python
"""Test cases for the fnmatch module."""
|
|
|
|
import unittest
|
|
import os
|
|
import warnings
|
|
|
|
from fnmatch import fnmatch, fnmatchcase, translate, filter
|
|
|
|
class FnmatchTestCase(unittest.TestCase):
    """Tests for fnmatch() and fnmatchcase()."""

    def check_match(self, filename, pattern, should_match=True, fn=fnmatch):
        """Assert that fn(filename, pattern) agrees with should_match.

        filename     -- the name to test.
        pattern      -- the shell-style pattern to test it against.
        should_match -- truthy if a match is expected, falsy otherwise.
        fn           -- the matcher under test; defaults to fnmatch.
        """
        if should_match:
            self.assertTrue(fn(filename, pattern),
                            "expected %r to match pattern %r"
                            % (filename, pattern))
        else:
            self.assertFalse(fn(filename, pattern),
                             "expected %r not to match pattern %r"
                             % (filename, pattern))

    def test_fnmatch(self):
        check = self.check_match
        check('abc', 'abc')
        check('abc', '?*?')
        check('abc', '???*')
        check('abc', '*???')
        check('abc', '???')
        check('abc', '*')
        check('abc', 'ab[cd]')
        check('abc', 'ab[!de]')
        check('abc', 'ab[de]', False)
        check('a', '??', False)
        check('a', 'b', False)

        # these test that '\' is handled correctly in character sets;
        # see SF bug #409651
        check('\\', r'[\]')
        check('a', r'[!\]')
        check('\\', r'[!\]', False)

        # test that filenames with newlines in them are handled correctly.
        # http://bugs.python.org/issue6665
        check('foo\nbar', 'foo*')
        check('foo\nbar\n', 'foo*')
        check('\nfoo', 'foo*', False)
        check('\n', '*')

    def test_slow_fnmatch(self):
        check = self.check_match
        check('a' * 50, '*a*a*a*a*a*a*a*a*a*a')
        # The next "takes forever" if the regexp translation is
        # straightforward.  See bpo-40480.
        check('a' * 50 + 'b', '*a*a*a*a*a*a*a*a*a*a', False)

    def test_mix_bytes_str(self):
        # Mixing a str name with a bytes pattern (or the reverse) must
        # raise TypeError, for both matchers.
        self.assertRaises(TypeError, fnmatch, 'test', b'*')
        self.assertRaises(TypeError, fnmatch, b'test', '*')
        self.assertRaises(TypeError, fnmatchcase, 'test', b'*')
        self.assertRaises(TypeError, fnmatchcase, b'test', '*')

    def test_fnmatchcase(self):
        # fnmatchcase() is expected to compare exactly: neither letter
        # case nor the kind of path separator is normalized.
        check = self.check_match
        check('abc', 'abc', True, fnmatchcase)
        check('AbC', 'abc', False, fnmatchcase)
        check('abc', 'AbC', False, fnmatchcase)
        check('AbC', 'AbC', True, fnmatchcase)

        check('usr/bin', 'usr/bin', True, fnmatchcase)
        check('usr\\bin', 'usr/bin', False, fnmatchcase)
        check('usr/bin', 'usr\\bin', False, fnmatchcase)
        check('usr\\bin', 'usr\\bin', True, fnmatchcase)

    def test_bytes(self):
        self.check_match(b'test', b'te*')
        self.check_match(b'test\xff', b'te*\xff')
        self.check_match(b'foo\nbar', b'foo*')

    def test_case(self):
        # Mixed-case names are expected to match only when
        # os.path.normcase() folds case on the running platform.
        ignorecase = os.path.normcase('ABC') == os.path.normcase('abc')
        check = self.check_match
        check('abc', 'abc')
        check('AbC', 'abc', ignorecase)
        check('abc', 'AbC', ignorecase)
        check('AbC', 'AbC')

    def test_sep(self):
        # '\\' and '/' are expected to be interchangeable only when
        # os.path.normcase() maps them to the same separator.
        normsep = os.path.normcase('\\') == os.path.normcase('/')
        check = self.check_match
        check('usr/bin', 'usr/bin')
        check('usr\\bin', 'usr/bin', normsep)
        check('usr/bin', 'usr\\bin', normsep)
        check('usr\\bin', 'usr\\bin')

    def test_warnings(self):
        with warnings.catch_warnings():
            # Turn every warning into an exception, so a pattern whose
            # handling emits any warning makes the check fail.
            warnings.simplefilter('error', Warning)
            check = self.check_match
            # NOTE(review): these character sets look like the ones the
            # regex compiler could warn about ('[', '&&', '||', '~~',
            # '--') - confirm against the re module documentation.
            check('[', '[[]')
            check('&', '[a&&b]')
            check('|', '[a||b]')
            check('~', '[a~~b]')
            check(',', '[a-z+--A-Z]')
            check('.', '[a-z--/A-Z]')
|
|
|
|
|
|
class TranslateTestCase(unittest.TestCase):
    """Tests for translate(), which turns a shell pattern into a regex."""

    def test_translate(self):
        import re
        self.assertEqual(translate('*'), r'(?s:.*)\Z')
        self.assertEqual(translate('?'), r'(?s:.)\Z')
        self.assertEqual(translate('a?b*'), r'(?s:a.b.*)\Z')
        self.assertEqual(translate('[abc]'), r'(?s:[abc])\Z')
        self.assertEqual(translate('[]]'), r'(?s:[]])\Z')
        self.assertEqual(translate('[!x]'), r'(?s:[^x])\Z')
        self.assertEqual(translate('[^x]'), r'(?s:[\^x])\Z')
        self.assertEqual(translate('[x'), r'(?s:\[x)\Z')
        # from the docs
        self.assertEqual(translate('*.txt'), r'(?s:.*\.txt)\Z')
        # squash consecutive stars
        self.assertEqual(translate('*********'), r'(?s:.*)\Z')
        self.assertEqual(translate('A*********'), r'(?s:A.*)\Z')
        self.assertEqual(translate('*********A'), r'(?s:.*A)\Z')
        self.assertEqual(translate('A*********?[?]?'), r'(?s:A.*.[?].)\Z')
        # fancy translation to prevent exponential-time match failure
        t = translate('**a*a****a')
        # The group numbers are not predictable, so pull them out of the
        # result: two groups are expected, each named once where it is
        # defined and once where it is referenced.
        digits = re.findall(r'\d+', t)
        self.assertEqual(len(digits), 4)
        self.assertEqual(digits[0], digits[1])
        self.assertEqual(digits[2], digits[3])
        g1 = f"g{digits[0]}"  # e.g., group name "g4"
        g2 = f"g{digits[2]}"  # e.g., group name "g5"
        self.assertEqual(t,
            fr'(?s:(?=(?P<{g1}>.*?a))(?P={g1})(?=(?P<{g2}>.*?a))(?P={g2}).*a)\Z')
        # and try pasting multiple translate results - it's an undocumented
        # feature that this works; all the pain of generating unique group
        # names across calls exists to support this
        r1 = translate('**a**a**a*')
        r2 = translate('**b**b**b*')
        r3 = translate('*c*c*c*')
        fatre = "|".join([r1, r2, r3])
        self.assertTrue(re.match(fatre, 'abaccad'))
        self.assertTrue(re.match(fatre, 'abxbcab'))
        self.assertTrue(re.match(fatre, 'cbabcaxc'))
        self.assertFalse(re.match(fatre, 'dabccbad'))
|
|
|
|
class FilterTestCase(unittest.TestCase):
    """Tests for filter(), which selects the names matching a pattern."""

    def test_filter(self):
        # Both str and bytes inputs are exercised; the expected lists
        # keep the matching names in their input order.
        self.assertEqual(filter(['Python', 'Ruby', 'Perl', 'Tcl'], 'P*'),
                         ['Python', 'Perl'])
        self.assertEqual(filter([b'Python', b'Ruby', b'Perl', b'Tcl'], b'P*'),
                         [b'Python', b'Perl'])

    def test_mix_bytes_str(self):
        # Mixing str names with a bytes pattern (or the reverse) must
        # raise TypeError.
        self.assertRaises(TypeError, filter, ['test'], b'*')
        self.assertRaises(TypeError, filter, [b'test'], '*')

    def test_case(self):
        # The '.PL' / '.py' names are expected to match the other-case
        # pattern only when os.path.normcase() folds case here.
        ignorecase = os.path.normcase('P') == os.path.normcase('p')
        self.assertEqual(filter(['Test.py', 'Test.rb', 'Test.PL'], '*.p*'),
                         ['Test.py', 'Test.PL'] if ignorecase else ['Test.py'])
        self.assertEqual(filter(['Test.py', 'Test.rb', 'Test.PL'], '*.P*'),
                         ['Test.py', 'Test.PL'] if ignorecase else ['Test.PL'])

    def test_sep(self):
        # '\\' and '/' are expected to be interchangeable only when
        # os.path.normcase() maps them to the same separator.
        normsep = os.path.normcase('\\') == os.path.normcase('/')
        self.assertEqual(filter(['usr/bin', 'usr', 'usr\\lib'], 'usr/*'),
                         ['usr/bin', 'usr\\lib'] if normsep else ['usr/bin'])
        self.assertEqual(filter(['usr/bin', 'usr', 'usr\\lib'], 'usr\\*'),
                         ['usr/bin', 'usr\\lib'] if normsep else ['usr\\lib'])
|
|
|
|
|
|
# Run every test case in this module when the file is executed as a script.
if __name__ == "__main__":
    unittest.main()
|