GH-89727: Partially fix shutil.rmtree() recursion error on deep trees (#119634)

Make `shutil._rmtree_unsafe()` call `os.walk()`, which is implemented
without recursion.

`shutil._rmtree_safe_fd()` is not affected and can still raise a recursion
error.

Co-authored-by: Jelle Zijlstra <jelle.zijlstra@gmail.com>
This commit is contained in:
Barney Gale 2024-05-29 21:11:30 +01:00 committed by GitHub
parent c22323cd1c
commit a150679f90
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
4 changed files with 33 additions and 28 deletions

View file

@ -281,6 +281,10 @@ def renames(old, new):
__all__.extend(["makedirs", "removedirs", "renames"]) __all__.extend(["makedirs", "removedirs", "renames"])
# Private sentinel that makes walk() classify all symlinks and junctions as
# regular files.
_walk_symlinks_as_files = object()
def walk(top, topdown=True, onerror=None, followlinks=False): def walk(top, topdown=True, onerror=None, followlinks=False):
"""Directory tree generator. """Directory tree generator.
@ -382,7 +386,10 @@ def walk(top, topdown=True, onerror=None, followlinks=False):
break break
try: try:
is_dir = entry.is_dir() if followlinks is _walk_symlinks_as_files:
is_dir = entry.is_dir(follow_symlinks=False) and not entry.is_junction()
else:
is_dir = entry.is_dir()
except OSError: except OSError:
# If is_dir() raises an OSError, consider the entry not to # If is_dir() raises an OSError, consider the entry not to
# be a directory, same behaviour as os.path.isdir(). # be a directory, same behaviour as os.path.isdir().

View file

@ -606,37 +606,21 @@ else:
# version vulnerable to race conditions # version vulnerable to race conditions
def _rmtree_unsafe(path, onexc): def _rmtree_unsafe(path, onexc):
try: def onerror(err):
with os.scandir(path) as scandir_it: if not isinstance(err, FileNotFoundError):
entries = list(scandir_it) onexc(os.scandir, err.filename, err)
except FileNotFoundError: results = os.walk(path, topdown=False, onerror=onerror, followlinks=os._walk_symlinks_as_files)
return for dirpath, dirnames, filenames in results:
except OSError as err: for name in dirnames:
onexc(os.scandir, path, err) fullname = os.path.join(dirpath, name)
entries = []
for entry in entries:
fullname = entry.path
try:
is_dir = entry.is_dir(follow_symlinks=False)
except FileNotFoundError:
continue
except OSError:
is_dir = False
if is_dir and not entry.is_junction():
try: try:
if entry.is_symlink(): os.rmdir(fullname)
# This can only happen if someone replaces
# a directory with a symlink after the call to
# os.scandir or entry.is_dir above.
raise OSError("Cannot call rmtree on a symbolic link")
except FileNotFoundError: except FileNotFoundError:
continue continue
except OSError as err: except OSError as err:
onexc(os.path.islink, fullname, err) onexc(os.rmdir, fullname, err)
continue for name in filenames:
_rmtree_unsafe(fullname, onexc) fullname = os.path.join(dirpath, name)
else:
try: try:
os.unlink(fullname) os.unlink(fullname)
except FileNotFoundError: except FileNotFoundError:

View file

@ -741,6 +741,17 @@ class TestRmTree(BaseTest, unittest.TestCase):
shutil.rmtree(TESTFN) shutil.rmtree(TESTFN)
raise raise
@unittest.skipIf(shutil._use_fd_functions, "fd-based functions remain unfixed (GH-89727)")
def test_rmtree_above_recursion_limit(self):
recursion_limit = 40
# directory_depth > recursion_limit
directory_depth = recursion_limit + 10
base = os.path.join(TESTFN, *(['d'] * directory_depth))
os.makedirs(base)
with support.infinite_recursion(recursion_limit):
shutil.rmtree(TESTFN)
class TestCopyTree(BaseTest, unittest.TestCase): class TestCopyTree(BaseTest, unittest.TestCase):

View file

@ -0,0 +1,3 @@
Partially fix issue with :func:`shutil.rmtree` where a :exc:`RecursionError`
is raised on deep directory trees. A recursion error is no longer raised
when :data:`!rmtree.avoids_symlink_attacks` is false.