diff --git a/src/missing.py b/src/missing.py index 1db276c..c141274 100644 --- a/src/missing.py +++ b/src/missing.py @@ -4,104 +4,63 @@ import os import re import subprocess -from functools import lru_cache -from typing import Optional +from typing import Sequence logger = logging.getLogger('missing') class Missing: - RE_TEST_PY = re.compile(r'^.*?\.py$') - def __init__(self, exclude): + def __init__(self, exclude: Sequence[str]): if not (isinstance(exclude, list) or isinstance(exclude, tuple)): raise TypeError('exclude should be list or tuple') + for path in exclude: + if os.path.exists(path) and not os.path.isdir(path): + raise TypeError(f"exclude should only contain directories, found file {path}") - self._tracked_files = self._list_files_obey_gitignore() - logger.debug('Tracked files: %r', self._tracked_files) + files = [os.path.normpath(path) for path in self._list_files()] + logger.debug(f"{files=}") - # append .git to exclude folder - exclude = {'.git', *exclude} + exclude = [os.path.normpath(path) for path in exclude] + logger.debug(f"{exclude=}") - # normalize a pathname by collapsing redundant separators - self._exclude = [os.path.normpath(path) for path in exclude] + files_excluded = set() + for file in files: + if all([not file.startswith(e) for e in exclude]): + files_excluded.add(file) + logger.debug(f"{files_excluded=}") + + self.files = files_excluded def run(self) -> int: - return int(self._find_for_unittest()) - - @lru_cache(maxsize=None) - def _check_init_py_exists(self, path: str) -> bool: - """check the __init__.py exists on the current path and parent path""" - basedir = os.path.dirname(path) - - if basedir in ('', '.'): - return False - - # check the parent folder - fail = self._check_init_py_exists(basedir) - - # check the current __init__ exists or not - init_py = f'{basedir}/__init__.py' - if not os.path.exists(init_py): - fail = True - - # create the __init__.py - with open(init_py, 'w'): - logger.warning('create file: {}'.format(init_py)) - return fail - - def _find_for_unittest(self, basedir: Optional[str] = None) -> bool: - """the unittest find the test*.py only for the regular package""" - fail = False - init_run = False - - if basedir is None: - basedir = '.' - init_run = True - - for filename in os.listdir(basedir): - path = os.path.normpath(f'{basedir}/{filename}') - if path in self._exclude: - # skip the explicitly excluded path - logger.debug('exclude: %r', path) + """Return 1 if there are missing files, otherwise 0""" + is_failed = 0 + + for file in self.files: + basedir = os.path.dirname(file) + + if basedir in ('', '.'): continue - if os.path.isdir(path): - if self._find_for_unittest(path): - fail = True - elif self.RE_TEST_PY.match(filename): - if self._is_tracked(path): - logger.debug('check: %r', path) - if self._check_init_py_exists(path): - fail = True - else: - logger.debug('untracked: %r', path) - else: - logger.debug('no_match: %r', path) - - if init_run and fail: - logger.warning('found missing __init__.py for unittest') - - return fail - - def _is_tracked(self, path): - if self._tracked_files is None: - return True - return path in self._tracked_files - - def _list_files_obey_gitignore(self): - # list committed files - tracked_files = ( - subprocess.check_output( - ['git', 'ls-files', '-z'], - encoding='utf-8', - ) - .rstrip('\0') - .split('\0') - ) + init_py = os.path.join(basedir, '__init__.py') + if not os.path.exists(init_py): + is_failed = True + # create the __init__.py + with open(init_py, 'w'): + logger.warning(f'create file: {init_py}') + + return is_failed - # list untracked files - tracked_files += ( + @staticmethod + def _list_files(): + pattern = re.compile(r'^.*?\.py$') + + files = subprocess.check_output( + ['git', 'ls-files', '-z'], + encoding='utf-8', + ).rstrip('\0').split('\0') + + files += ( subprocess.check_output( ['git', 'ls-files', '-o', '--exclude-standard', '-z'], encoding='utf-8', @@ -109,12 +68,11 @@ def _list_files_obey_gitignore(self): .rstrip('\0') .split('\0') ) + return set( - [ - os.path.normpath(tracked_file) - for tracked_file in tracked_files - if self.RE_TEST_PY.match(os.path.basename(tracked_file)) - ] + os.path.normpath(file) + for file in files + if pattern.match(os.path.basename(file)) )