Skip to content

Commit

Permalink
pythongh-117084: Fix ZIP file extraction for directory entry names wi…
Browse files Browse the repository at this point in the history
…th backslashes on Windows (pythonGH-117129)
  • Loading branch information
serhiy-storchaka authored and adorilson committed Mar 25, 2024
1 parent b087334 commit c175734
Show file tree
Hide file tree
Showing 4 changed files with 27 additions and 1 deletion.
Binary file added Lib/test/archivetestdata/zipdir_backslash.zip
Binary file not shown.
16 changes: 16 additions & 0 deletions Lib/test/test_zipfile/test_core.py
Expand Up @@ -2937,6 +2937,22 @@ def test_bug_6050(self):
os.mkdir(os.path.join(TESTFN2, "a"))
self.test_extract_dir()

def test_extract_dir_backslash(self):
    """Extract an archive whose member names are written with backslashes.

    The fixture's entries are named ``a\\b\\c`` and ``d\\e\\``.  Where
    ``os.name`` is ``'nt'`` they must come out as a nested directory tree;
    on every other platform the backslash is an ordinary filename
    character, so each entry must come out as a single flat file.
    """
    archive = findfile("zipdir_backslash.zip", subdir="archivetestdata")
    with zipfile.ZipFile(archive) as zipf:
        zipf.extractall(TESTFN2)

    def extracted(*parts):
        # Path of an extracted item, relative to the extraction root.
        return os.path.join(TESTFN2, *parts)

    if os.name != 'nt':
        # Backslashes are kept verbatim in the names: two flat files and
        # no "a" or "d" directory.
        for flat_name in ("a\\b\\c", "d\\e\\"):
            self.assertTrue(os.path.isfile(extracted(flat_name)))
        for top_level in ("a", "d"):
            self.assertFalse(os.path.exists(extracted(top_level)))
        return

    # Windows: backslashes act as separators, so a real tree is created.
    self.assertTrue(os.path.isdir(extracted("a")))
    self.assertTrue(os.path.isdir(extracted("a", "b")))
    self.assertTrue(os.path.isfile(extracted("a", "b", "c")))
    self.assertTrue(os.path.isdir(extracted("d")))
    self.assertTrue(os.path.isdir(extracted("d", "e")))

def test_write_dir(self):
dirpath = os.path.join(TESTFN2, "x")
os.mkdir(dirpath)
Expand Down
10 changes: 9 additions & 1 deletion Lib/zipfile/__init__.py
Expand Up @@ -605,7 +605,15 @@ def from_file(cls, filename, arcname=None, *, strict_timestamps=True):

def is_dir(self):
    """Return True if this archive member is a directory.

    A member is a directory when its name ends with a forward slash.
    On platforms that define ``os.path.altsep``, a name ending with
    either ``os.path.sep`` or ``os.path.altsep`` is accepted as well.
    """
    name = self.filename
    if name.endswith('/'):
        return True
    # The ZIP specification mandates forward slashes as the directory
    # separator, yet archives produced on Windows sometimes contain
    # backslashes.  The extraction code already tolerates that, so stay
    # consistent with it wherever an alternative separator exists.
    if not os.path.altsep:
        return False
    return name.endswith((os.path.sep, os.path.altsep))


# ZIP encryption uses the CRC32 one-byte primitive for scrambling some
Expand Down
@@ -0,0 +1,2 @@
Fix :mod:`zipfile` extraction for directory entries whose names contain
backslashes on Windows.

0 comments on commit c175734

Please sign in to comment.