# Unix SMB/CIFS implementation. # Copyright (C) Douglas Bagnall # # This program is free software; you can redistribute it and/or modify # it under the terms of the GNU General Public License as published by # the Free Software Foundation; either version 3 of the License, or # (at your option) any later version. # # This program is distributed in the hope that it will be useful, # but WITHOUT ANY WARRANTY; without even the implied warranty of # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the # GNU General Public License for more details. # # You should have received a copy of the GNU General Public License # along with this program. If not, see . import os import tarfile from pathlib import Path from tarfile import ExtractError, TarInfo, TarFile as UnsafeTarFile class TarFile(UnsafeTarFile): """This TarFile implementation is trying to ameliorate CVE-2007-4559, where tarfile.TarFiles can step outside of the target directory using '../../'. """ try: # New in version 3.11.4 (also has been backported) # https://docs.python.org/3/library/tarfile.html#tarfile.TarFile.extraction_filter # https://peps.python.org/pep-0706/ extraction_filter = staticmethod(tarfile.data_filter) except AttributeError: def extract(self, member, path="", set_attrs=True, *, numeric_owner=False): self._safetarfile_check() super().extract(member, path, set_attrs=set_attrs, numeric_owner=numeric_owner) def extractall(self, path, members=None, *, numeric_owner=False): self._safetarfile_check() super().extractall(path, members, numeric_owner=numeric_owner) def _safetarfile_check(self): for tarinfo in self.__iter__(): if self._is_traversal_attempt(tarinfo=tarinfo): raise ExtractError( "Attempted directory traversal for " f"member: {tarinfo.name}") if self._is_unsafe_symlink(tarinfo=tarinfo): raise ExtractError( "Attempted directory traversal via symlink for " f"member: {tarinfo.linkname}") if self._is_unsafe_link(tarinfo=tarinfo): raise ExtractError( "Attempted directory traversal via link for " f"member: {tarinfo.linkname}") def _resolve_path(self, path): return os.path.realpath(os.path.abspath(path)) def _is_path_in_dir(self, path, basedir): return self._resolve_path(os.path.join(basedir, path)).startswith(basedir) def _is_traversal_attempt(self, tarinfo): if (tarinfo.name.startswith(os.sep) or ".." + os.sep in tarinfo.name): return True return False def _is_unsafe_symlink(self, tarinfo): if tarinfo.issym(): symlink_file = Path( os.path.normpath(os.path.join(os.getcwd(), tarinfo.linkname))) if not self._is_path_in_dir(symlink_file, os.getcwd()): return True return False def _is_unsafe_link(self, tarinfo): if tarinfo.islnk(): link_file = Path( os.path.normpath(os.path.join(os.getcwd(), tarinfo.linkname))) if not self._is_path_in_dir(link_file, os.getcwd()): return True return False open = TarFile.open