From 0d90d914bd2f45a15f5ea6209b9cfec7ebcdc3ed Mon Sep 17 00:00:00 2001 From: Ellen Marie Dash Date: Mon, 26 Oct 2020 16:09:52 -0400 Subject: [PATCH] [commands/cache] make `pip cache purge` remove everything from http + wheels caches; make `pip cache remove` prune empty directories. --- src/pip/_internal/commands/cache.py | 17 +++++++++ src/pip/_internal/utils/filesystem.py | 52 +++++++++++++++++++++++++++ 2 files changed, 69 insertions(+) diff --git a/src/pip/_internal/commands/cache.py b/src/pip/_internal/commands/cache.py index f1a489d324f..a99e05e5ae0 100644 --- a/src/pip/_internal/commands/cache.py +++ b/src/pip/_internal/commands/cache.py @@ -184,7 +184,24 @@ def remove_cache_items(self, options: Values, args: List[Any]) -> None: for filename in files: os.unlink(filename) logger.verbose("Removed %s", filename) + + http_dirs = filesystem.subdirs_with_no_files(self._cache_dir(options, "http")) + wheel_dirs = filesystem.subdirs_with_no_files( + self._cache_dir(options, "wheels") + ) + dirs = list(http_dirs) + list(wheel_dirs) + for dirname in dirs: + os.rmdir(dirname) + logger.verbose("Removed %s", dirname) + + # selfcheck.json is no longer used by pip. + selfcheck_json = self._cache_dir(options, "selfcheck.json") + if os.path.isfile(selfcheck_json): + os.remove(selfcheck_json) + logger.verbose("Removed legacy selfcheck.json file") + logger.info("Files removed: %s", len(files)) + logger.info("Empty directories removed: %s", len(dirs)) def purge_cache(self, options: Values, args: List[Any]) -> None: if args: diff --git a/src/pip/_internal/utils/filesystem.py b/src/pip/_internal/utils/filesystem.py index 83c2df75b96..28b27d55e45 100644 --- a/src/pip/_internal/utils/filesystem.py +++ b/src/pip/_internal/utils/filesystem.py @@ -4,11 +4,13 @@ import random import sys from contextlib import contextmanager +from pathlib import Path from tempfile import NamedTemporaryFile from typing import Any, BinaryIO, Generator, List, Union, cast from pip._vendor.tenacity import retry, stop_after_delay, wait_fixed +from pip._internal.exceptions import PipError from pip._internal.utils.compat import get_path_uid from pip._internal.utils.misc import format_size @@ -151,3 +153,53 @@ def directory_size(path: str) -> Union[int, float]: def format_directory_size(path: str) -> str: return format_size(directory_size(path)) + + +def _leaf_subdirs(path: Path): + """Traverses the file tree, finding every empty directory.""" + + path_obj = Path(path) + + if not path_obj.exists(): + return + + for item in path_obj.iterdir(): + if not item.is_dir(): + continue + + subitems = item.iterdir() + + # ASSUMPTION: Nothing in subitems will be None or False. + if not any(subitems): + yield item + + if not any(subitem.is_file() for subitem in subitems): + yield from _leaf_subdirs(item) + + +def _leaf_parents_without_files(path: Path, leaf: Path): + """Yields +leaf+ and each parent directory below +path+, until one of + them includes a file (as opposed to directories or nothing).""" + + if not str(leaf).startswith(str(path)): + # If +leaf+ is not a subdirectory of +path+, bail early to avoid + # an endless loop. + raise PipError("leaf is not a subdirectory of path") + + path = Path(path) + leaf = Path(leaf) + while leaf != path: + if all(item.is_dir() for item in leaf.iterdir()): + yield str(leaf) + else: + break + leaf = leaf.parent + + +def subdirs_with_no_files(path_str: str): + """Yields every subdirectory of +path_str+ that has no files under it.""" + + path = Path(path_str) + + for leaf in _leaf_subdirs(path): + yield from _leaf_parents_without_files(path, leaf)