| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175 |
- # Copyright (C) 2017 Jelmer Vernooij <jelmer@jelmer.uk>
- #
- # Dulwich is dual-licensed under the Apache License, Version 2.0 and the GNU
- # General Public License as published by the Free Software Foundation; version 2.0
- # or (at your option) any later version. You can redistribute it and/or
- # modify it under the terms of either of these two licenses.
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- #
- # You should have received a copy of the licenses; if not, see
- # <http://www.gnu.org/licenses/> for a copy of the GNU General Public License
- # and <http://www.apache.org/licenses/LICENSE-2.0> for a copy of the Apache
- # License, Version 2.0.
- #
- """Parsing of gitignore files.
- For details of the matching rules, see https://git-scm.com/docs/gitignore
- """
- import re
def translate(pat):
    """Translate a gitignore-style shell pattern to a regular expression.

    There is no way to quote meta-characters.

    Originally copied from fnmatch in Python 2.7, but modified for Dulwich
    to cope with features in Git ignore patterns.

    :param pat: Pattern to translate, as a bytestring
    :return: Regular expression source, as a bytestring, anchored at the
        end with ``\\Z`` and intended to be used with ``re.match``
    """
    res = b'(?ms)'

    if b'/' not in pat:
        # If there's no slash, this is a filename-based match
        res += b'(.*/)?'

    if pat.startswith(b'**/'):
        # Leading **/ : keep the slash so the check below strips it
        pat = pat[2:]
        res += b'(.*/)?'

    if pat.startswith(b'/'):
        pat = pat[1:]

    i, n = 0, len(pat)
    while i < n:
        if pat[i:i+3] == b'/**':
            res += b'(/.*)?'
            i += 3
            continue
        c = pat[i:i+1]
        i += 1
        if c == b'*':
            star = i - 1
            starts_segment = star == 0 or pat[star-1:star] == b'/'
            ends_segment = i == n or pat[i:i+1] == b'/'
            if starts_segment and ends_segment:
                # A '*' that is a whole path segment must match a
                # non-empty name.
                res += b'[^/]+'
            else:
                # Inside a segment '*' matches zero or more characters,
                # so that e.g. 'foo*' also matches 'foo'.
                res += b'[^/]*'
        elif c == b'?':
            # '?' matches exactly one character, but never a slash.
            res += b'[^/]'
        elif c == b'[':
            # Find the closing bracket; a ']' directly after '[' or '[!'
            # is taken literally as a member of the class.
            j = i
            if j < n and pat[j:j+1] == b'!':
                j += 1
            if j < n and pat[j:j+1] == b']':
                j += 1
            while j < n and pat[j:j+1] != b']':
                j += 1
            if j >= n:
                # No closing bracket: treat '[' as a literal character.
                res += b'\\['
            else:
                stuff = pat[i:j].replace(b'\\', b'\\\\')
                i = j + 1
                if stuff.startswith(b'!'):
                    # Shell negation '!' becomes regex negation '^'.
                    stuff = b'^' + stuff[1:]
                elif stuff.startswith(b'^'):
                    # A literal leading '^' must not negate the class.
                    stuff = b'\\' + stuff
                res += b'[' + stuff + b']'
        else:
            res += re.escape(c)

    return res + b'\\Z'
def read_ignore_patterns(f):
    """Read a git ignore file.

    Blank lines, lines consisting only of spaces and lines starting with
    ``#`` are skipped.  Unquoted trailing spaces are removed and ``\\ `` is
    unescaped to a plain space.

    :param f: File-like object (or any iterable) yielding lines as
        bytestrings
    :return: Iterator over the patterns, as bytestrings
    """
    for line in f:
        # Accept both LF and CRLF line endings.
        line = line.rstrip(b'\r\n')

        # Ignore blank lines (they're used for readability) and comments.
        if not line or line.startswith(b'#'):
            continue

        # Trailing spaces are ignored unless they are quoted with a backslash.
        while line.endswith(b' ') and not line.endswith(b'\\ '):
            line = line[:-1]

        # A line that held nothing but spaces is blank too; yielding an
        # empty pattern would produce a regex that matches every directory.
        if not line:
            continue

        yield line.replace(b'\\ ', b' ')
def match_pattern(path, pattern):
    """Match a gitignore-style pattern against a path.

    The pattern is translated to a regular expression with ``translate``
    and matched from the start of ``path``.

    :param path: Path to match, as a bytestring
    :param pattern: Pattern to match, as a bytestring
    :return: bool indicating whether the pattern matched
    """
    re_pattern = translate(pattern)
    # re.match returns a match object or None; convert it to the documented
    # bool so callers never receive a match object.
    return bool(re.match(re_pattern, path))
class IgnoreFilter(object):
    """Ordered set of gitignore patterns that paths can be checked against."""

    def __init__(self, patterns):
        """Create a filter.

        :param patterns: Iterable of patterns (bytestrings), in file order
        """
        self._patterns = []
        for pattern in patterns:
            self.append_pattern(pattern)

    def append_pattern(self, pattern):
        """Add a pattern to the set."""
        self._patterns.append(pattern)

    def is_ignored(self, path):
        """Check whether a path is ignored.

        For directories, include a trailing slash.

        Patterns are evaluated in order and the last matching pattern
        decides the outcome, as described in the gitignore documentation.

        :param path: Path to check, as a bytestring
        :return: None if file is not mentioned, True if it is included, False
            if it is explicitly excluded.
        """
        status = None
        for pattern in self._patterns:
            if pattern[0:1] == b'!':
                # Negated pattern: a match explicitly excludes the path.
                if match_pattern(path, pattern[1:]):
                    status = False
            else:
                # Drop a leading backslash, so that a pattern can begin
                # with a literal character such as '!' or '#'.
                if pattern[0:1] == b'\\':
                    pattern = pattern[1:]
                if match_pattern(path, pattern):
                    status = True
        return status
class IgnoreFilterStack(object):
    """Check for ignore status in multiple filters."""

    def __init__(self, filters):
        """Create a stack.

        :param filters: Sequence of objects providing ``is_ignored(path)``,
            consulted in order
        """
        self._filters = filters

    def is_ignored(self, path):
        """Check whether a path is explicitly included or excluded in ignores.

        The filters are asked in order and the first one that gives an
        answer other than None decides the result.

        :param path: Path to check
        :return: None if the file is not mentioned, True if it is included,
            False if it is explicitly excluded.
        """
        for ignore_filter in self._filters:
            verdict = ignore_filter.is_ignored(path)
            if verdict is not None:
                return verdict
        # No filter had an opinion (or there were no filters at all).
        return None
|