Source code for duplicity.tempdir

# -*- Mode:Python; indent-tabs-mode:nil; tab-width:4; encoding:utf-8 -*-
#
# Copyright 2002 Ben Escoto <ben@emerose.org>
# Copyright 2007 Kenneth Loafman <kenneth@loafman.com>
#
# This file is part of duplicity.
#
# Duplicity is free software; you can redistribute it and/or modify it
# under the terms of the GNU General Public License as published by the
# Free Software Foundation; either version 2 of the License, or (at your
# option) any later version.
#
# Duplicity is distributed in the hope that it will be useful, but
# WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
# General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with duplicity; if not, write to the Free Software Foundation,
# Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

u"""
Provides temporary file handling cenetered around a single top-level
securely created temporary directory.

The public interface of this module is thread-safe.
"""

from __future__ import print_function
from future import standard_library
standard_library.install_aliases()
from builtins import object

import os
import platform
import subprocess
import tempfile
import threading

from duplicity import config
from duplicity import log
from duplicity import util

# Set up state related to managing the default temporary directory
# instance
_defaultLock = threading.Lock()
_defaultInstance = None
# backup the initial tmp dir path because we will force tempfile
# later to use our generated _defaultInstance.dir() as temproot
_initialSystemTempRoot = tempfile.gettempdir()


[docs]def default(): u""" Obtain the global default instance of TemporaryDirectory, creating it first if necessary. Failures are propagated to caller. Most callers are expected to use this function rather than instantiating TemporaryDirectory directly, unless they explicitly desdire to have their "own" directory for some reason. This function is thread-safe. """ global _defaultLock global _defaultInstance _defaultLock.acquire() try: if _defaultInstance is None or _defaultInstance.dir() is None: _defaultInstance = TemporaryDirectory(temproot=config.temproot) # set the temp dir to be the default in tempfile module from now on tempfile.tempdir = _defaultInstance.dir() return _defaultInstance finally: _defaultLock.release()
[docs]class TemporaryDirectory(object): u""" A temporary directory. An instance of this class is backed by a directory in the file system created securely by the use of tempfile.mkdtemp(). Said instance can be used to obtain unique filenames inside of this directory for cases where mktemp()-like semantics is desired, or (recommended) an fd,filename pair for mkstemp()-like semantics. See further below for the security implications of using it. Each instance will keep a list of all files ever created by it, to faciliate deletion of such files and rmdir() of the directory itself. It does this in order to be able to clean out the directory without resorting to a recursive delete (ala rm -rf), which would be risky. Calling code can optionally (recommended) notify an instance of the fact that a tempfile was deleted, and thus need not be kept track of anymore. This class serves two primary purposes: Firstly, it provides a convenient single top-level directory in which all the clutter ends up, rather than cluttering up the root of the system temp directory itself with many files. Secondly, it provides a way to get mktemp() style semantics for temporary file creation, with most of the risks gone. Specifically, since the directory itself is created securely, files in this directory can be (mostly) safely created non-atomically without the usual mktemp() security implications. However, in the presence of tmpwatch, tmpreaper, or similar mechanisms that will cause files in the system tempdir to expire, a security risk is still present because the removal of the TemporaryDirectory managed directory removes all protection it offers. For this reason, use of mkstemp() is greatly preferred above use of mktemp(). In addition, since cleanup is in the form of deletion based on a list of filenames, completely independently of whether someone else already deleted the file, there exists a race here as well. The impact should however be limited to the removal of an 'attackers' file. """
[docs] def __init__(self, temproot=None): u""" Create a new TemporaryDirectory backed by a unique and securely created file system directory. tempbase - The temp root directory, or None to use system default (recommended). """ def defaults_to_tmp(path): u'''Determine if path point to a MAcOS system tmp''' sys_temps = [ os.path.realpath(u"/tmp"), os.path.realpath(u"/var/tmp"), ] user_temp = os.path.realpath(path) for sys_temp in sys_temps: if user_temp.startswith(sys_temp): return True return False if temproot is None: if config.temproot: temproot = config.temproot else: global _initialSystemTempRoot temproot = _initialSystemTempRoot if isinstance(temproot, b"".__class__): temproot = util.fsdecode(temproot) if (platform.system().startswith(u'Darwin') and defaults_to_tmp(temproot)): # Use temp space from getconf, never /tmp temproot = subprocess.check_output([u'getconf', u'DARWIN_USER_TEMP_DIR']) temproot = util.fsdecode(temproot).rstrip() self.__dir = tempfile.mkdtemp(u"-tempdir", u"duplicity-", temproot) log.Info(_(u"Using temporary directory %s") % self.__dir) # number of mktemp()/mkstemp() calls served so far self.__tempcount = 0 # dict of paths pending deletion; use dict even though we are # not concearned with association, because it is unclear whether # sets are O(1), while dictionaries are. self.__pending = {} self.__lock = threading.Lock() # protect private resources *AND* mktemp/mkstemp calls
[docs] def dir(self): u""" Returns the absolute pathname of the temp folder. """ return self.__dir
def __del__(self): u""" Perform cleanup. """ global _defaultInstance if _defaultInstance is not None: self.cleanup()
[docs] def mktemp(self): u""" Return a unique filename suitable for use for a temporary file. The file is not created. Subsequent calls to this method are guaranteed to never return the same filename again. As a result, it is safe to use under concurrent conditions. NOTE: mkstemp() is greatly preferred. """ filename = None self.__lock.acquire() try: self.__tempcount = self.__tempcount + 1 suffix = u"-%d" % (self.__tempcount,) filename = util.fsencode(tempfile.mktemp(suffix, u"mktemp-", self.__dir)) log.Debug(_(u"Registering (mktemp) temporary file %s") % util.fsdecode(filename)) self.__pending[filename] = None finally: self.__lock.release() return filename
[docs] def mkstemp(self): u""" Returns a filedescriptor and a filename, as per os.mkstemp(), but located in the temporary directory and subject to tracking and automatic cleanup. """ fd = None filename = None self.__lock.acquire() try: self.__tempcount = self.__tempcount + 1 suffix = u"-%d" % (self.__tempcount,) fd, filename = tempfile.mkstemp(suffix, u"mkstemp-", self.__dir,) log.Debug(_(u"Registering (mkstemp) temporary file %s") % filename) self.__pending[filename] = None finally: self.__lock.release() return fd, filename
[docs] def mkstemp_file(self): u""" Convenience wrapper around mkstemp(), with the file descriptor converted into a file object. """ fd, filename = self.mkstemp() return os.fdopen(fd, u"r+"), filename
[docs] def forget(self, fname): u""" Forget about the given filename previously obtained through mktemp() or mkstemp(). This should be called *after* the file has been deleted, to stop a future cleanup() from trying to delete it. Forgetting is only needed for scaling purposes; that is, to avoid n timefile creations from implying that n filenames are kept in memory. Typically this whould never matter in duplicity, but for niceness sake callers are recommended to use this method whenever possible. """ self.__lock.acquire() try: if fname in self.__pending: log.Debug(_(u"Forgetting temporary file %s") % util.fsdecode(fname)) del self.__pending[fname] else: log.Warn(_(u"Attempt to forget unknown tempfile %s - this is probably a bug.") % util.fsdecode(fname)) pass finally: self.__lock.release()
[docs] def cleanup(self): u""" Cleanup any files created in the temporary directory (that have not been forgotten), and clean up the temporary directory itself. On failure they are logged, but this method will not raise an exception. """ self.__lock.acquire() try: if self.__dir is not None: for file in list(self.__pending.keys()): try: log.Debug(_(u"Removing still remembered temporary file %s") % util.fsdecode(file)) util.ignore_missing(os.unlink, file) except Exception: log.Info(_(u"Cleanup of temporary file %s failed") % util.fsdecode(file)) pass try: os.rmdir(self.__dir) except Exception: log.Warn(_(u"Cleanup of temporary directory %s failed - " u"this is probably a bug.") % util.fsdecode(self.__dir)) pass self.__pending = None self.__dir = None finally: self.__lock.release()