mirror of
https://github.com/python/cpython.git
synced 2024-12-30 12:15:27 +08:00
23cdbfa744
fnmatch.translate() no longer produces patterns which contain set operations. Sets starting with '[' or containing '--', '&&', '~~' or '||' will be interpreted differently in regular expressions in future versions. Currently they emit warnings. fnmatch.translate() now avoids producing patterns containing such sets by accident.
129 lines
4.0 KiB
Python
129 lines
4.0 KiB
Python
"""Filename matching with shell patterns.
|
|
|
|
fnmatch(FILENAME, PATTERN) matches according to the local convention.
|
|
fnmatchcase(FILENAME, PATTERN) always takes case in account.
|
|
|
|
The functions operate by translating the pattern into a regular
|
|
expression. They cache the compiled regular expressions for speed.
|
|
|
|
The function translate(PATTERN) returns a regular expression
|
|
corresponding to PATTERN. (It does not compile it.)
|
|
"""
|
|
import os
|
|
import posixpath
|
|
import re
|
|
import functools
|
|
|
|
__all__ = ["filter", "fnmatch", "fnmatchcase", "translate"]
|
|
|
|
def fnmatch(name, pat):
|
|
"""Test whether FILENAME matches PATTERN.
|
|
|
|
Patterns are Unix shell style:
|
|
|
|
* matches everything
|
|
? matches any single character
|
|
[seq] matches any character in seq
|
|
[!seq] matches any char not in seq
|
|
|
|
An initial period in FILENAME is not special.
|
|
Both FILENAME and PATTERN are first case-normalized
|
|
if the operating system requires it.
|
|
If you don't want this, use fnmatchcase(FILENAME, PATTERN).
|
|
"""
|
|
name = os.path.normcase(name)
|
|
pat = os.path.normcase(pat)
|
|
return fnmatchcase(name, pat)
|
|
|
|
@functools.lru_cache(maxsize=256, typed=True)
|
|
def _compile_pattern(pat):
|
|
if isinstance(pat, bytes):
|
|
pat_str = str(pat, 'ISO-8859-1')
|
|
res_str = translate(pat_str)
|
|
res = bytes(res_str, 'ISO-8859-1')
|
|
else:
|
|
res = translate(pat)
|
|
return re.compile(res).match
|
|
|
|
def filter(names, pat):
|
|
"""Return the subset of the list NAMES that match PAT."""
|
|
result = []
|
|
pat = os.path.normcase(pat)
|
|
match = _compile_pattern(pat)
|
|
if os.path is posixpath:
|
|
# normcase on posix is NOP. Optimize it away from the loop.
|
|
for name in names:
|
|
if match(name):
|
|
result.append(name)
|
|
else:
|
|
for name in names:
|
|
if match(os.path.normcase(name)):
|
|
result.append(name)
|
|
return result
|
|
|
|
def fnmatchcase(name, pat):
|
|
"""Test whether FILENAME matches PATTERN, including case.
|
|
|
|
This is a version of fnmatch() which doesn't case-normalize
|
|
its arguments.
|
|
"""
|
|
match = _compile_pattern(pat)
|
|
return match(name) is not None
|
|
|
|
|
|
def translate(pat):
|
|
"""Translate a shell PATTERN to a regular expression.
|
|
|
|
There is no way to quote meta-characters.
|
|
"""
|
|
|
|
i, n = 0, len(pat)
|
|
res = ''
|
|
while i < n:
|
|
c = pat[i]
|
|
i = i+1
|
|
if c == '*':
|
|
res = res + '.*'
|
|
elif c == '?':
|
|
res = res + '.'
|
|
elif c == '[':
|
|
j = i
|
|
if j < n and pat[j] == '!':
|
|
j = j+1
|
|
if j < n and pat[j] == ']':
|
|
j = j+1
|
|
while j < n and pat[j] != ']':
|
|
j = j+1
|
|
if j >= n:
|
|
res = res + '\\['
|
|
else:
|
|
stuff = pat[i:j]
|
|
if '--' not in stuff:
|
|
stuff = stuff.replace('\\', r'\\')
|
|
else:
|
|
chunks = []
|
|
k = i+2 if pat[i] == '!' else i+1
|
|
while True:
|
|
k = pat.find('-', k, j)
|
|
if k < 0:
|
|
break
|
|
chunks.append(pat[i:k])
|
|
i = k+1
|
|
k = k+3
|
|
chunks.append(pat[i:j])
|
|
# Escape backslashes and hyphens for set difference (--).
|
|
# Hyphens that create ranges shouldn't be escaped.
|
|
stuff = '-'.join(s.replace('\\', r'\\').replace('-', r'\-')
|
|
for s in chunks)
|
|
# Escape set operations (&&, ~~ and ||).
|
|
stuff = re.sub(r'([&~|])', r'\\\1', stuff)
|
|
i = j+1
|
|
if stuff[0] == '!':
|
|
stuff = '^' + stuff[1:]
|
|
elif stuff[0] in ('^', '['):
|
|
stuff = '\\' + stuff
|
|
res = '%s[%s]' % (res, stuff)
|
|
else:
|
|
res = res + re.escape(c)
|
|
return r'(?s:%s)\Z' % res
|