""" Ported to Python3. Futz with files like a pro. """ import sys, os, stat, tempfile, time, binascii import six from collections import namedtuple from errno import ENOENT if sys.platform == "win32": from ctypes import WINFUNCTYPE, WinError, windll, POINTER, byref, c_ulonglong, \ create_unicode_buffer, get_last_error from ctypes.wintypes import BOOL, DWORD, LPCWSTR, LPWSTR, LPVOID from twisted.python import log from allmydata.crypto import aes from allmydata.util.assertutil import _assert def rename(src, dst, tries=4, basedelay=0.1): """ Here is a superkludge to workaround the fact that occasionally on Windows some other process (e.g. an anti-virus scanner, a local search engine, etc.) is looking at your file when you want to delete or move it, and hence you can't. The horrible workaround is to sit and spin, trying to delete it, for a short time and then give up. With the default values of tries and basedelay this can block for less than a second. @param tries: number of tries -- each time after the first we wait twice as long as the previous wait @param basedelay: how long to wait before the second try """ for i in range(tries-1): try: return os.rename(src, dst) except EnvironmentError as le: # XXX Tighten this to check if this is a permission denied error (possibly due to another Windows process having the file open and execute the superkludge only in this case. log.msg("XXX KLUDGE Attempting to move file %s => %s; got %s; sleeping %s seconds" % (src, dst, le, basedelay,)) time.sleep(basedelay) basedelay *= 2 return os.rename(src, dst) # The last try. def remove(f, tries=4, basedelay=0.1): """ Here is a superkludge to workaround the fact that occasionally on Windows some other process (e.g. an anti-virus scanner, a local search engine, etc.) is looking at your file when you want to delete or move it, and hence you can't. The horrible workaround is to sit and spin, trying to delete it, for a short time and then give up. With the default values of tries and basedelay this can block for less than a second. @param tries: number of tries -- each time after the first we wait twice as long as the previous wait @param basedelay: how long to wait before the second try """ try: os.chmod(f, stat.S_IWRITE | stat.S_IEXEC | stat.S_IREAD) except: pass for i in range(tries-1): try: return os.remove(f) except EnvironmentError as le: # XXX Tighten this to check if this is a permission denied error (possibly due to another Windows process having the file open and execute the superkludge only in this case. if not os.path.exists(f): return log.msg("XXX KLUDGE Attempting to remove file %s; got %s; sleeping %s seconds" % (f, le, basedelay,)) time.sleep(basedelay) basedelay *= 2 return os.remove(f) # The last try. class ReopenableNamedTemporaryFile(object): """ This uses tempfile.mkstemp() to generate a secure temp file. It then closes the file, leaving a zero-length file as a placeholder. You can get the filename with ReopenableNamedTemporaryFile.name. When the ReopenableNamedTemporaryFile instance is garbage collected or its shutdown() method is called, it deletes the file. """ def __init__(self, *args, **kwargs): fd, self.name = tempfile.mkstemp(*args, **kwargs) os.close(fd) def __repr__(self): return "<%s instance at %x %s>" % (self.__class__.__name__, id(self), self.name) def __str__(self): return self.__repr__() def __del__(self): self.shutdown() def shutdown(self): remove(self.name) class EncryptedTemporaryFile(object): # not implemented: next, readline, readlines, xreadlines, writelines def __init__(self): self.file = tempfile.TemporaryFile() self.key = os.urandom(16) # AES-128 def _crypt(self, offset, data): offset_big = offset // 16 offset_small = offset % 16 iv = binascii.unhexlify("%032x" % offset_big) cipher = aes.create_encryptor(self.key, iv) # this is just to advance the counter aes.encrypt_data(cipher, b"\x00" * offset_small) return aes.encrypt_data(cipher, data) def close(self): self.file.close() def flush(self): self.file.flush() def seek(self, offset, whence=0): # 0 = SEEK_SET self.file.seek(offset, whence) def tell(self): offset = self.file.tell() return offset def read(self, size=-1): """A read must not follow a write, or vice-versa, without an intervening seek.""" index = self.file.tell() ciphertext = self.file.read(size) plaintext = self._crypt(index, ciphertext) return plaintext def write(self, plaintext): """A read must not follow a write, or vice-versa, without an intervening seek. If seeking and then writing causes a 'hole' in the file, the contents of the hole are unspecified.""" index = self.file.tell() ciphertext = self._crypt(index, plaintext) self.file.write(ciphertext) def truncate(self, newsize): """Truncate or extend the file to 'newsize'. If it is extended, the contents after the old end-of-file are unspecified. The file position after this operation is unspecified.""" self.file.truncate(newsize) def make_dirs_with_absolute_mode(parent, dirname, mode): """ Make directory `dirname` and chmod it to `mode` afterwards. We chmod all parent directories of `dirname` until we reach `parent`. """ precondition_abspath(parent) precondition_abspath(dirname) if not is_ancestor_path(parent, dirname): raise AssertionError("dirname must be a descendant of parent") make_dirs(dirname) while dirname != parent: os.chmod(dirname, mode) # FIXME: doesn't seem to work on Windows for long paths old_dirname, dirname = dirname, os.path.dirname(dirname) _assert(len(dirname) < len(old_dirname), dirname=dirname, old_dirname=old_dirname) def is_ancestor_path(parent, dirname): while dirname != parent: # FIXME: doesn't seem to work on Windows for long paths old_dirname, dirname = dirname, os.path.dirname(dirname) if len(dirname) >= len(old_dirname): return False return True def make_dirs(dirname, mode=0o777): """ An idempotent version of os.makedirs(). If the dir already exists, do nothing and return without raising an exception. If this call creates the dir, return without raising an exception. If there is an error that prevents creation or if the directory gets deleted after make_dirs() creates it and before make_dirs() checks that it exists, raise an exception. """ tx = None try: os.makedirs(dirname, mode) except OSError as x: tx = x if not os.path.isdir(dirname): if tx: raise tx raise IOError("unknown error prevented creation of directory, or deleted the directory immediately after creation: %s" % dirname) # careful not to construct an IOError with a 2-tuple, as that has a special meaning... def rm_dir(dirname): """ A threadsafe and idempotent version of shutil.rmtree(). If the dir is already gone, do nothing and return without raising an exception. If this call removes the dir, return without raising an exception. If there is an error that prevents deletion or if the directory gets created again after rm_dir() deletes it and before rm_dir() checks that it is gone, raise an exception. """ excs = [] try: os.chmod(dirname, stat.S_IWRITE | stat.S_IEXEC | stat.S_IREAD) for f in os.listdir(dirname): fullname = os.path.join(dirname, f) if os.path.isdir(fullname): rm_dir(fullname) else: remove(fullname) os.rmdir(dirname) except Exception as le: # Ignore "No such file or directory" if (not isinstance(le, OSError)) or le.args[0] != 2: excs.append(le) # Okay, now we've recursively removed everything, ignoring any "No # such file or directory" errors, and collecting any other errors. if os.path.exists(dirname): if len(excs) == 1: raise excs[0] if len(excs) == 0: raise OSError("Failed to remove dir for unknown reason.") raise OSError(excs) def remove_if_possible(f): try: remove(f) except: pass def du(basedir): size = 0 for root, dirs, files in os.walk(basedir): for f in files: fn = os.path.join(root, f) size += os.path.getsize(fn) return size def move_into_place(source, dest): """Atomically replace a file, or as near to it as the platform allows. The dest file may or may not exist.""" if "win32" in sys.platform.lower() and os.path.exists(source): # we check for source existing since we don't want to nuke the # dest unless we'll succeed at moving the target into place remove_if_possible(dest) os.rename(source, dest) def write_atomically(target, contents, mode="b"): assert ( isinstance(contents, bytes) and "b" in mode or isinstance(contents, str) and "t" in mode or mode == ""), (type(contents), mode) with open(target+".tmp", "w"+mode) as f: f.write(contents) move_into_place(target+".tmp", target) def write(path, data, mode="wb"): if "b" in mode and isinstance(data, str): data = data.encode("utf-8") with open(path, mode) as f: f.write(data) def read(path, mode="rb"): with open(path, mode) as rf: return rf.read() def put_file(path, inf): precondition_abspath(path) # TODO: create temporary file and move into place? with open(path, "wb") as outf: while True: data = inf.read(32768) if not data: break outf.write(data) def precondition_abspath(path): if not isinstance(path, str): raise AssertionError("an abspath must be a Unicode string") if sys.platform == "win32": # This intentionally doesn't view absolute paths starting with a drive specification, or # paths relative to the current drive, as acceptable. if not path.startswith("\\\\"): raise AssertionError("an abspath should be normalized using abspath_expanduser_unicode") else: # This intentionally doesn't view the path '~' or paths starting with '~/' as acceptable. if not os.path.isabs(path): raise AssertionError("an abspath should be normalized using abspath_expanduser_unicode") # Work around . This code is adapted from # # with some simplifications. _getfullpathname = None try: from nt import _getfullpathname # type: ignore except ImportError: pass def abspath_expanduser_unicode(path, base=None, long_path=True): """ Return the absolute version of a path. If 'base' is given and 'path' is relative, the path will be expanded relative to 'base'. 'path' must be a Unicode string. 'base', if given, must be a Unicode string corresponding to an absolute path as returned by a previous call to abspath_expanduser_unicode. On Windows, the result will be a long path unless long_path is given as False. """ if not isinstance(path, str): raise AssertionError("paths must be Unicode strings") if base is not None and long_path: precondition_abspath(base) path = expanduser(path) if _getfullpathname: # On Windows, os.path.isabs will incorrectly return True # for paths without a drive letter (that are not UNC paths), # e.g. "\\". See . try: if base is None: path = _getfullpathname(path or u".") else: path = _getfullpathname(os.path.join(base, path)) except OSError: pass if not os.path.isabs(path): if base is None: cwd = os.getcwd() path = os.path.join(cwd, path) else: path = os.path.join(base, path) # We won't hit because # there is always at least one Unicode path component. path = os.path.normpath(path) if sys.platform == "win32" and long_path: path = to_windows_long_path(path) return path def to_windows_long_path(path): # '/' is normally a perfectly valid path component separator in Windows. # However, when using the "\\?\" syntax it is not recognized, so we # replace it with '\' here. path = path.replace(u"/", u"\\") # Note that other normalizations such as removing '.' and '..' should # be done outside this function. if path.startswith(u"\\\\?\\") or path.startswith(u"\\\\.\\"): return path elif path.startswith(u"\\\\"): return u"\\\\?\\UNC\\" + path[2 :] else: return u"\\\\?\\" + path have_GetDiskFreeSpaceExW = False if sys.platform == "win32": # GetEnvironmentVariableW = WINFUNCTYPE( DWORD, LPCWSTR, LPWSTR, DWORD, use_last_error=True )(("GetEnvironmentVariableW", windll.kernel32)) try: # PULARGE_INTEGER = POINTER(c_ulonglong) # GetDiskFreeSpaceExW = WINFUNCTYPE( BOOL, LPCWSTR, PULARGE_INTEGER, PULARGE_INTEGER, PULARGE_INTEGER, use_last_error=True )(("GetDiskFreeSpaceExW", windll.kernel32)) have_GetDiskFreeSpaceExW = True except Exception: import traceback traceback.print_exc() def expanduser(path): # os.path.expanduser is hopelessly broken for Unicode paths on Windows (ticket #1674). if sys.platform == "win32": return windows_expanduser(path) else: return os.path.expanduser(path) def windows_expanduser(path): if not path.startswith('~'): return path home_dir = windows_getenv(u'USERPROFILE') if home_dir is None: home_drive = windows_getenv(u'HOMEDRIVE') home_path = windows_getenv(u'HOMEPATH') if home_drive is None or home_path is None: raise OSError("Could not find home directory: neither %USERPROFILE% nor (%HOMEDRIVE% and %HOMEPATH%) are set.") home_dir = os.path.join(home_drive, home_path) if path == '~': return home_dir elif path.startswith('~/') or path.startswith('~\\'): return os.path.join(home_dir, path[2 :]) else: return path # ERROR_ENVVAR_NOT_FOUND = 203 def windows_getenv(name): # Based on , # with improved error handling. Returns None if there is no enivronment variable of the given name. if not isinstance(name, str): raise AssertionError("name must be Unicode") n = GetEnvironmentVariableW(name, None, 0) # GetEnvironmentVariableW returns DWORD, so n cannot be negative. if n == 0: err = get_last_error() if err == ERROR_ENVVAR_NOT_FOUND: return None raise OSError("WinError: %s\n attempting to read size of environment variable %r" % (WinError(err), name)) if n == 1: # Avoid an ambiguity between a zero-length string and an error in the return value of the # call to GetEnvironmentVariableW below. return u"" buf = create_unicode_buffer(u'\0'*n) retval = GetEnvironmentVariableW(name, buf, n) if retval == 0: err = get_last_error() if err == ERROR_ENVVAR_NOT_FOUND: return None raise OSError("WinError: %s\n attempting to read environment variable %r" % (WinError(err), name)) if retval >= n: raise OSError("Unexpected result %d (expected less than %d) from GetEnvironmentVariableW attempting to read environment variable %r" % (retval, n, name)) return buf.value def get_disk_stats(whichdir, reserved_space=0): """Return disk statistics for the storage disk, in the form of a dict with the following fields. total: total bytes on disk free_for_root: bytes actually free on disk free_for_nonroot: bytes free for "a non-privileged user" [Unix] or the current user [Windows]; might take into account quotas depending on platform used: bytes used on disk avail: bytes available excluding reserved space An AttributeError can occur if the OS has no API to get disk information. An EnvironmentError can occur if the OS call fails. whichdir is a directory on the filesystem in question -- the answer is about the filesystem, not about the directory, so the directory is used only to specify which filesystem. reserved_space is how many bytes to subtract from the answer, so you can pass how many bytes you would like to leave unused on this filesystem as reserved_space. """ if have_GetDiskFreeSpaceExW: # If this is a Windows system and GetDiskFreeSpaceExW is available, use it. # (This might put up an error dialog unless # SetErrorMode(SEM_FAILCRITICALERRORS | SEM_NOOPENFILEERRORBOX) has been called, # which we do in allmydata.windows.fixups.initialize().) n_free_for_nonroot = c_ulonglong(0) n_total = c_ulonglong(0) n_free_for_root = c_ulonglong(0) retval = GetDiskFreeSpaceExW(whichdir, byref(n_free_for_nonroot), byref(n_total), byref(n_free_for_root)) if retval == 0: raise OSError("WinError: %s\n attempting to get disk statistics for %r" % (WinError(get_last_error()), whichdir)) free_for_nonroot = n_free_for_nonroot.value total = n_total.value free_for_root = n_free_for_root.value else: # For Unix-like systems. # # # s = os.statvfs(whichdir) # on my mac laptop: # statvfs(2) is a wrapper around statfs(2). # statvfs.f_frsize = statfs.f_bsize : # "minimum unit of allocation" (statvfs) # "fundamental file system block size" (statfs) # statvfs.f_bsize = statfs.f_iosize = stat.st_blocks : preferred IO size # on an encrypted home directory ("FileVault"), it gets f_blocks # wrong, and s.f_blocks*s.f_frsize is twice the size of my disk, # but s.f_bavail*s.f_frsize is correct total = s.f_frsize * s.f_blocks free_for_root = s.f_frsize * s.f_bfree free_for_nonroot = s.f_frsize * s.f_bavail # valid for all platforms: used = total - free_for_root avail = max(free_for_nonroot - reserved_space, 0) return { 'total': total, 'free_for_root': free_for_root, 'free_for_nonroot': free_for_nonroot, 'used': used, 'avail': avail, } def get_available_space(whichdir, reserved_space): """Returns available space for share storage in bytes, or None if no API to get this information is available. whichdir is a directory on the filesystem in question -- the answer is about the filesystem, not about the directory, so the directory is used only to specify which filesystem. reserved_space is how many bytes to subtract from the answer, so you can pass how many bytes you would like to leave unused on this filesystem as reserved_space. """ try: return get_disk_stats(whichdir, reserved_space)['avail'] except AttributeError: return None except EnvironmentError: log.msg("OS call to get disk statistics failed") return 0 class ConflictError(Exception): pass class UnableToUnlinkReplacementError(Exception): pass def reraise(wrapper): cls, exc, tb = sys.exc_info() wrapper_exc = wrapper("%s: %s" % (cls.__name__, exc)) six.reraise(wrapper, wrapper_exc, tb) if sys.platform == "win32": # ReplaceFileW = WINFUNCTYPE( BOOL, LPCWSTR, LPCWSTR, LPCWSTR, DWORD, LPVOID, LPVOID, use_last_error=True )(("ReplaceFileW", windll.kernel32)) REPLACEFILE_IGNORE_MERGE_ERRORS = 0x00000002 # ERROR_FILE_NOT_FOUND = 2 def rename_no_overwrite(source_path, dest_path): os.rename(source_path, dest_path) def replace_file(replaced_path, replacement_path): precondition_abspath(replaced_path) precondition_abspath(replacement_path) # no "backup" path (the first None) because we don't want to # create a backup file r = ReplaceFileW(replaced_path, replacement_path, None, REPLACEFILE_IGNORE_MERGE_ERRORS, None, None) if r == 0: # The UnableToUnlinkReplacementError case does not happen on Windows; # all errors should be treated as signalling a conflict. err = get_last_error() if err != ERROR_FILE_NOT_FOUND: raise ConflictError("WinError: %s" % (WinError(err),)) try: move_into_place(replacement_path, replaced_path) except EnvironmentError: reraise(ConflictError) else: def rename_no_overwrite(source_path, dest_path): # link will fail with EEXIST if there is already something at dest_path. os.link(source_path, dest_path) try: os.unlink(source_path) except EnvironmentError: reraise(UnableToUnlinkReplacementError) def replace_file(replaced_path, replacement_path): precondition_abspath(replaced_path) precondition_abspath(replacement_path) if not os.path.exists(replacement_path): raise ConflictError("Replacement file not found: %r" % (replacement_path,)) try: move_into_place(replacement_path, replaced_path) except OSError as e: if e.errno != ENOENT: raise except EnvironmentError: reraise(ConflictError) PathInfo = namedtuple('PathInfo', 'isdir isfile islink exists size mtime_ns ctime_ns') def seconds_to_ns(t): return int(t * 1000000000) def get_pathinfo(path_u, now_ns=None): try: statinfo = os.lstat(path_u) mode = statinfo.st_mode return PathInfo(isdir =stat.S_ISDIR(mode), isfile =stat.S_ISREG(mode), islink =stat.S_ISLNK(mode), exists =True, size =statinfo.st_size, mtime_ns=seconds_to_ns(statinfo.st_mtime), ctime_ns=seconds_to_ns(statinfo.st_ctime), ) except OSError as e: if e.errno == ENOENT: if now_ns is None: now_ns = seconds_to_ns(time.time()) return PathInfo(isdir =False, isfile =False, islink =False, exists =False, size =None, mtime_ns=now_ns, ctime_ns=now_ns, ) raise