From e557fe9989cc2a91a34ddab04402157297a4ae4d Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Marek=20Marczykowski-G=C3=B3recki?= Date: Sun, 13 Mar 2016 13:49:42 +0100 Subject: [PATCH] backup: restructude the code into classes Introduce two main classes Backup and BackupRestore for storing the state of the desired operation. Then a simple interface to adjust parameters. (Almost) no functional change. QubesOS/qubes-issues#1213 QubesOS/qubes-issues#1214 --- qubes/backup.py | 3114 +++++++++++++++++++------------------ qubes/tests/__init__.py | 36 +- qubes/tests/int/backup.py | 46 +- 3 files changed, 1598 insertions(+), 1598 deletions(-) diff --git a/qubes/backup.py b/qubes/backup.py index 09ccb11f..b201b7fb 100644 --- a/qubes/backup.py +++ b/qubes/backup.py @@ -23,6 +23,7 @@ # # from __future__ import unicode_literals +import itertools from qubes.utils import size_to_human import sys import os @@ -45,6 +46,7 @@ HEADER_FILENAME = 'backup-header' DEFAULT_CRYPTO_ALGORITHM = 'aes-256-cbc' DEFAULT_HMAC_ALGORITHM = 'SHA512' DEFAULT_COMPRESSION_FILTER = 'gzip' +# TODO: increase version after finishing implementation CURRENT_BACKUP_FORMAT_VERSION = '3' # Maximum size of error message get from process stderr (including VM process) MAX_STDERR_BYTES = 1024 @@ -53,9 +55,6 @@ HEADER_QUBES_XML_MAX_SIZE = 1024 * 1024 BLKSIZE = 512 -# global state for backup_cancel() -running_backup_operation = None - def print_stdout(text): print (text) @@ -83,322 +82,99 @@ def get_disk_usage(path): return ret -class BackupOperationInfo: - def __init__(self): - self.canceled = False - self.processes_to_kill_on_cancel = [] - self.tmpdir_to_remove = None - - class BackupCanceledError(qubes.exc.QubesException): def __init__(self, msg, tmpdir=None): super(BackupCanceledError, self).__init__(msg) self.tmpdir = tmpdir -class BackupHeader: - version = 'version' - encrypted = 'encrypted' - compressed = 'compressed' - compression_filter = 'compression-filter' - crypto_algorithm = 'crypto-algorithm' - hmac_algorithm = 'hmac-algorithm' +class BackupHeader(object): + header_keys = { + 'version': 'version', + 'encrypted': 'encrypted', + 'compressed': 'compressed', + 'compression-filter': 'compression_filter', + 'crypto-algorithm': 'crypto_algorithm', + 'hmac-algorithm': 'hmac_algorithm', + } bool_options = ['encrypted', 'compressed'] int_options = ['version'] + def __init__(self, header_data = None): + # repeat the list to help code completion... + self.version = None + self.encrypted = None + self.compressed = None + # Options introduced in backup format 3+, which always have a header, + # so no need for fallback in function parameter + self.compression_filter = None + self.hmac_algorithm = None + self.crypto_algorithm = None -def file_to_backup(file_path, subdir=None): - sz = get_disk_usage(file_path) + if header_data is not None: + self.load(header_data) - if subdir is None: - abs_file_path = os.path.abspath(file_path) - abs_base_dir = os.path.abspath(qubes.config.system_path["qubes_base_dir"]) + '/' - abs_file_dir = os.path.dirname(abs_file_path) + '/' - (nothing, directory, subdir) = abs_file_dir.partition(abs_base_dir) - assert nothing == "" - assert directory == abs_base_dir - else: - if len(subdir) > 0 and not subdir.endswith('/'): - subdir += '/' - return [{"path": file_path, "size": sz, "subdir": subdir}] + def load(self, untrusted_header_text): + """Parse backup header file. - -def backup_cancel(): - """ - Cancel currently running backup/restore operation - - @return: True if any operation was signaled - """ - if running_backup_operation is None: - return False - - running_backup_operation.canceled = True - for proc in running_backup_operation.processes_to_kill_on_cancel: + :param untrusted_header_text: header content + :type untrusted_header_text: basestring + .. warning:: + This function may be exposed to not yet verified header, + so is security critical. + """ try: - proc.terminate() - except: + untrusted_header_text = untrusted_header_text.decode('ascii') + except UnicodeDecodeError: + raise qubes.exc.QubesException( + "Non-ASCII characters in backup header") + for untrusted_line in untrusted_header_text.splitlines(): + if untrusted_line.count('=') != 1: + raise qubes.exc.QubesException("Invalid backup header") + (key, value) = untrusted_line.strip().split('=') + if key not in self.header_keys.keys(): + # Ignoring unknown option + continue + if getattr(self, self.header_keys[key]) is not None: + raise qubes.exc.QubesException( + "Duplicated header line: {}".format(key)) + if key in self.bool_options: + value = value.lower() in ["1", "true", "yes"] + elif key in self.int_options: + value = int(value) + setattr(self, self.header_keys[key], value) + + self.validate() + + def validate(self): + if self.version == 1: + # header not really present pass - return True - - -def backup_prepare(app, vms_list=None, exclude_list=None, - print_callback=print_stdout, hide_vm_names=True): - """ - If vms = None, include all (sensible) VMs; - exclude_list is always applied - """ - # XXX hack for tests, where store filename is qubes-test.xml - qubes_xml = app._store - if os.path.basename(qubes_xml) != 'qubes.xml': - dir = tempfile.mkdtemp() - shutil.copy(qubes_xml, os.path.join(dir, 'qubes.xml')) - qubes_xml = os.path.join(dir, 'qubes.xml') - # FIXME cleanup tempdir later - - files_to_backup = file_to_backup(qubes_xml, '') - - if exclude_list is None: - exclude_list = [] - - if vms_list is None: - all_vms = [vm for vm in app.domains] - selected_vms = [vm for vm in all_vms if vm.include_in_backups] - appvms_to_backup = [vm for vm in selected_vms if - vm.is_appvm() and not vm.internal] - template_vms_worth_backingup = [vm for vm in selected_vms if ( - vm.is_template() and vm.include_in_backups)] - dom0 = [app.domains[0]] - - vms_list = appvms_to_backup + \ - template_vms_worth_backingup + dom0 - - vms_for_backup = vms_list - # Apply exclude list - if exclude_list: - vms_for_backup = [vm for vm in vms_list if vm.name not in exclude_list] - - there_are_running_vms = False - - fields_to_display = [ - {"name": "VM", "width": 16}, - {"name": "type", "width": 12}, - {"name": "size", "width": 12} - ] - - # Display the header - s = "" - for f in fields_to_display: - fmt = "{{0:-^{0}}}-+".format(f["width"] + 1) - s += fmt.format('-') - print_callback(s) - s = "" - for f in fields_to_display: - fmt = "{{0:>{0}}} |".format(f["width"] + 1) - s += fmt.format(f["name"]) - print_callback(s) - s = "" - for f in fields_to_display: - fmt = "{{0:-^{0}}}-+".format(f["width"] + 1) - s += fmt.format('-') - print_callback(s) - - files_to_backup_index = 0 - for vm in vms_for_backup: - if vm.is_template(): - # handle templates later - continue - if vm.qid == 0: - # handle dom0 later - continue - - if hide_vm_names: - subdir = 'vm%d/' % vm.qid + elif self.version in [2, 3]: + expected_attrs = ['version', 'encrypted', 'compressed', + 'hmac_algorithm'] + if self.encrypted: + expected_attrs += ['crypto_algorithm'] + if self.version >= 3 and self.compressed: + expected_attrs += ['compression_filter'] + for key in expected_attrs: + if getattr(self, key) is None: + raise qubes.exc.QubesException( + "Backup header lack '{}' info".format(key)) else: - subdir = None - - if vm.private_img is not None: - files_to_backup += file_to_backup(vm.private_img, subdir) - - if vm.is_appvm(): - files_to_backup += file_to_backup(vm.icon_path, subdir) - if vm.updateable: - if os.path.exists(vm.dir_path + "/apps.templates"): - # template - files_to_backup += file_to_backup( - vm.dir_path + "/apps.templates", subdir) - else: - # standaloneVM - files_to_backup += file_to_backup(vm.dir_path + "/apps", subdir) - - if os.path.exists(vm.dir_path + "/kernels"): - files_to_backup += file_to_backup(vm.dir_path + "/kernels", - subdir) - if os.path.exists(vm.firewall_conf): - files_to_backup += file_to_backup(vm.firewall_conf, subdir) - if 'appmenus_whitelist' in qubes.config.vm_files and \ - os.path.exists(os.path.join(vm.dir_path, - qubes.config.vm_files[ - 'appmenus_whitelist'])): - files_to_backup += file_to_backup( - os.path.join(vm.dir_path, qubes.config.vm_files[ - 'appmenus_whitelist']), - subdir) - - if vm.updateable: - files_to_backup += file_to_backup(vm.root_img, subdir) - - s = "" - fmt = "{{0:>{0}}} |".format(fields_to_display[0]["width"] + 1) - s += fmt.format(vm.name) - - fmt = "{{0:>{0}}} |".format(fields_to_display[1]["width"] + 1) - if vm.is_netvm(): - s += fmt.format("NetVM" + (" + Sys" if vm.updateable else "")) - else: - s += fmt.format("AppVM" + (" + Sys" if vm.updateable else "")) - - vm_size = reduce(lambda x, y: x + y["size"], - files_to_backup[files_to_backup_index:], - 0) - files_to_backup_index = len(files_to_backup) - - fmt = "{{0:>{0}}} |".format(fields_to_display[2]["width"] + 1) - s += fmt.format(size_to_human(vm_size)) - - if vm.is_running(): - s += " <-- The VM is running, please shut it down before proceeding " \ - "with the backup!" - there_are_running_vms = True - - print_callback(s) - - for vm in vms_for_backup: - if not vm.is_template(): - # already handled - continue - if vm.qid == 0: - # handle dom0 later - continue - vm_sz = vm.get_disk_utilization() - if hide_vm_names: - template_subdir = 'vm%d/' % vm.qid - else: - template_subdir = os.path.relpath( - vm.dir_path, - qubes.config.system_path["qubes_base_dir"]) + '/' - template_to_backup = [{"path": vm.dir_path + '/.', - "size": vm_sz, - "subdir": template_subdir}] - files_to_backup += template_to_backup - - s = "" - fmt = "{{0:>{0}}} |".format(fields_to_display[0]["width"] + 1) - s += fmt.format(vm.name) - - fmt = "{{0:>{0}}} |".format(fields_to_display[1]["width"] + 1) - s += fmt.format("Template VM") - - fmt = "{{0:>{0}}} |".format(fields_to_display[2]["width"] + 1) - s += fmt.format(size_to_human(vm_sz)) - - if vm.is_running(): - s += " <-- The VM is running, please shut it down before proceeding " \ - "with the backup!" - there_are_running_vms = True - - print_callback(s) - - # Initialize backup flag on all VMs - vms_for_backup_qid = [vm.qid for vm in vms_for_backup] - for vm in app.domains: - vm.backup_content = False - if vm.qid == 0: - # handle dom0 later - continue - - if vm.qid in vms_for_backup_qid: - vm.backup_content = True - vm.backup_size = vm.get_disk_utilization() - if hide_vm_names: - vm.backup_path = 'vm%d' % vm.qid - else: - vm.backup_path = os.path.relpath( - vm.dir_path, - qubes.config.system_path["qubes_base_dir"]) - - # Dom0 user home - if 0 in vms_for_backup_qid: - local_user = grp.getgrnam('qubes').gr_mem[0] - home_dir = pwd.getpwnam(local_user).pw_dir - # Home dir should have only user-owned files, so fix it now to prevent - # permissions problems - some root-owned files can left after - # 'sudo bash' and similar commands - subprocess.check_call(['sudo', 'chown', '-R', local_user, home_dir]) - - home_sz = get_disk_usage(home_dir) - home_to_backup = [ - {"path": home_dir, "size": home_sz, "subdir": 'dom0-home/'}] - files_to_backup += home_to_backup - - vm = app.domains[0] - vm.backup_content = True - vm.backup_size = home_sz - vm.backup_path = os.path.join('dom0-home', os.path.basename(home_dir)) - - s = "" - fmt = "{{0:>{0}}} |".format(fields_to_display[0]["width"] + 1) - s += fmt.format('Dom0') - - fmt = "{{0:>{0}}} |".format(fields_to_display[1]["width"] + 1) - s += fmt.format("User home") - - fmt = "{{0:>{0}}} |".format(fields_to_display[2]["width"] + 1) - s += fmt.format(size_to_human(home_sz)) - - print_callback(s) - - app.save() - # FIXME: should be after backup completed - - total_backup_sz = 0 - for f in files_to_backup: - total_backup_sz += f["size"] - - s = "" - for f in fields_to_display: - fmt = "{{0:-^{0}}}-+".format(f["width"] + 1) - s += fmt.format('-') - print_callback(s) - - s = "" - fmt = "{{0:>{0}}} |".format(fields_to_display[0]["width"] + 1) - s += fmt.format("Total size:") - fmt = "{{0:>{0}}} |".format( - fields_to_display[1]["width"] + 1 + 2 + fields_to_display[2][ - "width"] + 1) - s += fmt.format(size_to_human(total_backup_sz)) - print_callback(s) - - s = "" - for f in fields_to_display: - fmt = "{{0:-^{0}}}-+".format(f["width"] + 1) - s += fmt.format('-') - print_callback(s) - - vms_not_for_backup = [vm.name for vm in app.domains - if not vm.backup_content] - print_callback("VMs not selected for backup: %s" % " ".join( - vms_not_for_backup)) - - if there_are_running_vms: - raise qubes.exc.QubesException("Please shutdown all VMs before proceeding.") - - for fileinfo in files_to_backup: - assert len(fileinfo["subdir"]) == 0 or fileinfo["subdir"][-1] == '/', \ - "'subdir' must ends with a '/': %s" % unicode(fileinfo) - - return files_to_backup + raise qubes.exc.QubesException( + "Unsupported backup version {}".format(self.version)) + def save(self, filename): + with open(filename, "w") as f: + # make sure 'version' is the first key + f.write('version={}\n'.format(self.version)) + for key, attr in self.header_keys.iteritems(): + if key == 'version': + continue + if getattr(self, attr) is None: + continue + f.write("{!s}={!s}\n".format(key, getattr(self, attr))) class SendWorker(Process): def __init__(self, queue, base_dir, backup_stdout): @@ -449,40 +225,332 @@ class SendWorker(Process): print "Finished sending thread" -def prepare_backup_header(target_directory, passphrase, compressed=False, - encrypted=False, - hmac_algorithm=DEFAULT_HMAC_ALGORITHM, - crypto_algorithm=DEFAULT_CRYPTO_ALGORITHM, - compression_filter=None): - header_file_path = os.path.join(target_directory, HEADER_FILENAME) - with open(header_file_path, "w") as f: - f.write(str("%s=%s\n" % (BackupHeader.version, - CURRENT_BACKUP_FORMAT_VERSION))) - f.write(str("%s=%s\n" % (BackupHeader.hmac_algorithm, hmac_algorithm))) - f.write(str("%s=%s\n" % (BackupHeader.crypto_algorithm, - crypto_algorithm))) - f.write(str("%s=%s\n" % (BackupHeader.encrypted, str(encrypted)))) - f.write(str("%s=%s\n" % (BackupHeader.compressed, str(compressed)))) - if compressed: - f.write(str("%s=%s\n" % (BackupHeader.compression_filter, - str(compression_filter)))) +class Backup(object): + def __init__(self, app, vms_list=None, exclude_list=None, **kwargs): + """ + If vms = None, include all (sensible) VMs; + exclude_list is always applied + """ + super(Backup, self).__init__() - hmac = subprocess.Popen(["openssl", "dgst", - "-" + hmac_algorithm, "-hmac", passphrase], - stdin=open(header_file_path, "r"), - stdout=open(header_file_path + ".hmac", "w")) - if hmac.wait() != 0: - raise qubes.exc.QubesException("Failed to compute hmac of header file") - return HEADER_FILENAME, HEADER_FILENAME + ".hmac" + #: progress of the backup - bytes handled of the current VM + self.chunk_size = 100 * 1024 * 1024 + self._current_vm_bytes = 0 + #: progress of the backup - bytes handled of finished VMs + self._done_vms_bytes = 0 + #: total backup size (set by :py:meth:`get_files_to_backup`) + self.total_backup_bytes = 0 + #: list of PIDs to kill on backup cancel + self.processes_to_kill_on_cancel = [] + self.app = app + #: directory for temporary files - set after creating the directory + self.tmpdir = None + + # Backup settings - defaults + #: should the backup be encrypted? + self.encrypted = True + #: should the backup be compressed? + self.compressed = True + #: what passphrase should be used to intergrity protect (and encrypt) + # the backup; required + self.passphrase = None + #: custom hmac algorithm + self.hmac_algorithm = DEFAULT_HMAC_ALGORITHM + #: custom encryption algorithm + self.crypto_algorithm = DEFAULT_CRYPTO_ALGORITHM + #: custom compression filter; a program which process stdin to stdout + self.compression_filter = DEFAULT_COMPRESSION_FILTER + #: VM to which backup should be sent (if any) + self.target_vm = None + #: directory to save backup in (either in dom0 or target VM, + # depending on :py:attr:`target_vm` + self.target_dir = None + #: callback for progress reporting. Will be called with one argument + # - progress in percents + self.progress_callback = None + + for key, value in kwargs.iteritems(): + if hasattr(self, key): + setattr(self, key, value) + else: + raise AttributeError(key) + + #: whether backup was canceled + self.canceled = False + + # FIXME: drop this legacy feature? + if isinstance(self.compressed, basestring): + self.compression_filter = self.compressed + self.compressed = True + else: + self.compression_filter = DEFAULT_COMPRESSION_FILTER + + if exclude_list is None: + exclude_list = [] + + if vms_list is None: + all_vms = [vm for vm in app.domains] + selected_vms = [vm for vm in all_vms if vm.include_in_backups] + appvms_to_backup = [vm for vm in selected_vms if + vm.is_appvm() and not vm.internal] + template_vms_worth_backingup = [vm for vm in selected_vms if ( + vm.is_template() and vm.include_in_backups)] + dom0 = [app.domains[0]] + + vms_list = appvms_to_backup + \ + template_vms_worth_backingup + dom0 + + self.vms_for_backup = vms_list + # Apply exclude list + if exclude_list: + self.vms_for_backup = [vm for vm in vms_list if vm.name not in + exclude_list] + + def __del__(self): + if self.tmpdir and os.path.exists(self.tmpdir): + shutil.rmtree(self.tmpdir) + + def cancel(self): + """Cancel running backup operation. Can be called from another thread. + """ + self.canceled = True + for proc in self.processes_to_kill_on_cancel: + try: + proc.terminate() + except: + pass + + @staticmethod + def _file_to_backup(file_path, subdir=None): + sz = get_disk_usage(file_path) + + if subdir is None: + abs_file_path = os.path.abspath(file_path) + abs_base_dir = os.path.abspath(qubes.config.system_path["qubes_base_dir"]) + '/' + abs_file_dir = os.path.dirname(abs_file_path) + '/' + (nothing, directory, subdir) = abs_file_dir.partition(abs_base_dir) + assert nothing == "" + assert directory == abs_base_dir + else: + if len(subdir) > 0 and not subdir.endswith('/'): + subdir += '/' + return [{"path": file_path, "size": sz, "subdir": subdir}] -def backup_do(app, base_backup_dir, files_to_backup, passphrase, - progress_callback=None, encrypted=False, appvm=None, - compressed=False, hmac_algorithm=DEFAULT_HMAC_ALGORITHM, - crypto_algorithm=DEFAULT_CRYPTO_ALGORITHM): - global running_backup_operation + def get_files_to_backup(self): + files_to_backup = {} + total_backup_sz = 0 + for vm in self.vms_for_backup: + if vm.is_template(): + # handle templates later + continue + if vm.qid == 0: + # handle dom0 later + continue - def queue_put_with_check(proc, vmproc, queue, element): + if self.encrypted: + subdir = 'vm%d/' % vm.qid + else: + subdir = None + + vm_files = [] + if vm.private_img is not None: + vm_files += self._file_to_backup(vm.private_img, subdir) + + # TODO: don't backup the icon + if vm.is_appvm(): + vm_files += self._file_to_backup( + vm.icon_path, subdir) + if vm.updateable: + if os.path.exists(vm.dir_path + "/apps.templates"): + # template + vm_files += self._file_to_backup( + vm.dir_path + "/apps.templates", subdir) + else: + # standaloneVM + vm_files += self._file_to_backup( + vm.dir_path + "/apps", subdir) + + if os.path.exists(vm.dir_path + "/kernels"): + vm_files += self._file_to_backup( + vm.dir_path + "/kernels", subdir) + # TODO: drop after merging firewall.xml into qubes.xml + firewall_conf = os.path.join(vm.dir_path, vm.firewall_conf) + if os.path.exists(firewall_conf): + vm_files += self._file_to_backup( + firewall_conf, subdir) + if 'appmenus_whitelist' in qubes.config.vm_files and \ + os.path.exists(os.path.join(vm.dir_path, + qubes.config.vm_files[ + 'appmenus_whitelist'])): + vm_files += self._file_to_backup( + os.path.join(vm.dir_path, qubes.config.vm_files[ + 'appmenus_whitelist']), + subdir) + + if vm.updateable: + vm_files += self._file_to_backup(vm.root_img, subdir) + vm_size = reduce(lambda x, y: x + y['size'], vm_files, 0) + files_to_backup[vm.qid] = { + 'vm': vm, + 'files': vm_files, + 'subdir': subdir, + 'size': vm_size, + } + total_backup_sz += vm_size + + for vm in self.vms_for_backup: + if not vm.is_template(): + # already handled + continue + if vm.qid == 0: + # handle dom0 later + continue + vm_sz = vm.get_disk_utilization() + if self.encrypted: + template_subdir = 'vm%d/' % vm.qid + else: + template_subdir = os.path.relpath( + vm.dir_path, + qubes.config.system_path["qubes_base_dir"]) + '/' + template_to_backup = [{"path": vm.dir_path + '/.', + "size": vm_sz, + "subdir": template_subdir}] + vm_files = template_to_backup + vm_size = reduce(lambda x, y: x + y['size'], vm_files, 0) + files_to_backup[vm.qid] = { + 'vm': vm, + 'files': vm_files, + 'subdir': template_subdir, + 'size': vm_size, + } + total_backup_sz += vm_size + + # Dom0 user home + if 0 in [vm.qid for vm in self.vms_for_backup]: + local_user = grp.getgrnam('qubes').gr_mem[0] + home_dir = pwd.getpwnam(local_user).pw_dir + # Home dir should have only user-owned files, so fix it now to prevent + # permissions problems - some root-owned files can left after + # 'sudo bash' and similar commands + subprocess.check_call(['sudo', 'chown', '-R', local_user, home_dir]) + + home_sz = get_disk_usage(home_dir) + home_to_backup = [ + {"path": home_dir, "size": home_sz, "subdir": 'dom0-home/'}] + vm_files = home_to_backup + + files_to_backup[0] = { + 'vm': self.app.domains[0], + 'files': vm_files, + 'subdir': os.path.join('dom0-home', os.path.basename(home_dir)), + 'size': home_sz, + } + total_backup_sz += home_sz + + self.total_backup_bytes = total_backup_sz + return files_to_backup + + + def get_backup_summary(self): + summary = "" + + fields_to_display = [ + {"name": "VM", "width": 16}, + {"name": "type", "width": 12}, + {"name": "size", "width": 12} + ] + + # Display the header + for f in fields_to_display: + fmt = "{{0:-^{0}}}-+".format(f["width"] + 1) + summary += fmt.format('-') + summary += "\n" + for f in fields_to_display: + fmt = "{{0:>{0}}} |".format(f["width"] + 1) + summary += fmt.format(f["name"]) + summary += "\n" + for f in fields_to_display: + fmt = "{{0:-^{0}}}-+".format(f["width"] + 1) + summary += fmt.format('-') + summary += "\n" + + files_to_backup = self.get_files_to_backup() + + for qid, vm_info in files_to_backup.iteritems(): + s = "" + fmt = "{{0:>{0}}} |".format(fields_to_display[0]["width"] + 1) + s += fmt.format(vm_info['vm'].name) + + fmt = "{{0:>{0}}} |".format(fields_to_display[1]["width"] + 1) + if qid == 0: + s += fmt.format("User home") + elif vm_info['vm'].is_template(): + s += fmt.format("Template VM") + else: + s += fmt.format("VM" + (" + Sys" if vm_info['vm'].updateable else "")) + + vm_size = vm_info['size'] + + fmt = "{{0:>{0}}} |".format(fields_to_display[2]["width"] + 1) + s += fmt.format(size_to_human(vm_size)) + + if qid != 0 and vm_info['vm'].is_running(): + s += " <-- The VM is running, please shut it down before proceeding " \ + "with the backup!" + + summary += s + "\n" + + for f in fields_to_display: + fmt = "{{0:-^{0}}}-+".format(f["width"] + 1) + summary += fmt.format('-') + summary += "\n" + + fmt = "{{0:>{0}}} |".format(fields_to_display[0]["width"] + 1) + summary += fmt.format("Total size:") + fmt = "{{0:>{0}}} |".format( + fields_to_display[1]["width"] + 1 + 2 + fields_to_display[2][ + "width"] + 1) + summary += fmt.format(size_to_human(self.total_backup_bytes)) + summary += "\n" + + for f in fields_to_display: + fmt = "{{0:-^{0}}}-+".format(f["width"] + 1) + summary += fmt.format('-') + summary += "\n" + + vms_not_for_backup = [vm.name for vm in self.app.domains + if vm not in self.vms_for_backup] + summary += "VMs not selected for backup:\n - " + "\n - ".join( + vms_not_for_backup) + + return summary + + def prepare_backup_header(self): + header_file_path = os.path.join(self.tmpdir, HEADER_FILENAME) + backup_header = BackupHeader() + backup_header.version = CURRENT_BACKUP_FORMAT_VERSION + backup_header.hmac_algorithm = self.hmac_algorithm + backup_header.crypto_algorithm = self.crypto_algorithm + backup_header.encrypted = self.encrypted + backup_header.compressed = self.compressed + if self.compressed: + backup_header.compression_filter = self.compression_filter + backup_header.save(header_file_path) + + hmac = subprocess.Popen( + ["openssl", "dgst", "-" + self.hmac_algorithm, + "-hmac", self.passphrase], + stdin=open(header_file_path, "r"), + stdout=open(header_file_path + ".hmac", "w")) + if hmac.wait() != 0: + raise qubes.exc.QubesException( + "Failed to compute hmac of header file") + return HEADER_FILENAME, HEADER_FILENAME + ".hmac" + + + @staticmethod + def _queue_put_with_check(proc, vmproc, queue, element): if queue.full(): if not proc.is_alive(): if vmproc: @@ -493,270 +561,286 @@ def backup_do(app, base_backup_dir, files_to_backup, passphrase, raise qubes.exc.QubesException(message) queue.put(element) - total_backup_sz = 0 - passphrase = passphrase.encode('utf-8') - for f in files_to_backup: - total_backup_sz += f["size"] + def _send_progress_update(self): + if callable(self.progress_callback): + progress = ( + 100 * (self._done_vms_bytes + self._current_vm_bytes) / + self.total_backup_bytes) + self.progress_callback(progress) - if isinstance(compressed, str): - compression_filter = compressed - else: - compression_filter = DEFAULT_COMPRESSION_FILTER + def _add_vm_progress(self, bytes_done): + self._current_vm_bytes += bytes_done + self._send_progress_update() - running_backup_operation = BackupOperationInfo() - vmproc = None - tar_sparse = None - if appvm is not None: - # Prepare the backup target (Qubes service call) - backup_target = "QUBESRPC qubes.Backup dom0" + def backup_do(self): + if self.passphrase is None: + raise qubes.exc.QubesException("No passphrase set") + qubes_xml = self.app._store + self.tmpdir = tempfile.mkdtemp() + shutil.copy(qubes_xml, os.path.join(self.tmpdir, 'qubes.xml')) + qubes_xml = os.path.join(self.tmpdir, 'qubes.xml') + backup_app = qubes.Qubes(qubes_xml) - # If APPVM, STDOUT is a PIPE - vmproc = appvm.run(command=backup_target, passio_popen=True, - passio_stderr=True) - vmproc.stdin.write(base_backup_dir. - replace("\r", "").replace("\n", "") + "\n") - backup_stdout = vmproc.stdin - running_backup_operation.processes_to_kill_on_cancel.append(vmproc) - else: - # Prepare the backup target (local file) - if os.path.isdir(base_backup_dir): - backup_target = base_backup_dir + "/qubes-{0}". \ - format(time.strftime("%Y-%m-%dT%H%M%S")) + # FIXME: cache it earlier? + files_to_backup = self.get_files_to_backup() + # make sure backup_content isn't set initially + for vm in backup_app.domains: + vm.backup_content = qubes.property.DEFAULT + + for qid, vm_info in files_to_backup.iteritems(): + if qid != 0 and vm_info['vm'].is_running(): + raise qubes.exc.QubesVMNotHaltedError(vm_info['vm']) + # VM is included in the backup + backup_app.domains[qid].backup_content = True + backup_app.domains[qid].backup_path = vm_info['subdir'] + backup_app.domains[qid].backup_size = vm_info['size'] + backup_app.save() + + passphrase = self.passphrase.encode('utf-8') + + vmproc = None + tar_sparse = None + if self.target_vm is not None: + # Prepare the backup target (Qubes service call) + backup_target = "QUBESRPC qubes.Backup dom0" + + # If APPVM, STDOUT is a PIPE + vmproc = self.target_vm.run( + command=backup_target, passio_popen=True, passio_stderr=True) + vmproc.stdin.write(self.target_dir. + replace("\r", "").replace("\n", "") + "\n") + backup_stdout = vmproc.stdin + self.processes_to_kill_on_cancel.append(vmproc) else: - backup_target = base_backup_dir - - # Create the target directory - if not os.path.exists(os.path.dirname(base_backup_dir)): - raise qubes.exc.QubesException( - "ERROR: the backup directory for {0} does not exists". - format(base_backup_dir)) - - # If not APPVM, STDOUT is a local file - backup_stdout = open(backup_target, 'wb') - - global blocks_backedup - blocks_backedup = 0 - if callable(progress_callback): - progress = blocks_backedup * 11 / total_backup_sz - progress_callback(progress) - - backup_tmpdir = tempfile.mkdtemp(prefix="/var/tmp/backup_") - running_backup_operation.tmpdir_to_remove = backup_tmpdir - - # Tar with tape length does not deals well with stdout (close stdout between - # two tapes) - # For this reason, we will use named pipes instead - if BACKUP_DEBUG: - print "Working in", backup_tmpdir - - backup_pipe = os.path.join(backup_tmpdir, "backup_pipe") - if BACKUP_DEBUG: - print "Creating pipe in:", backup_pipe - os.mkfifo(backup_pipe) - - if BACKUP_DEBUG: - print "Will backup:", files_to_backup - - header_files = prepare_backup_header(backup_tmpdir, passphrase, - compressed=bool(compressed), - encrypted=encrypted, - hmac_algorithm=hmac_algorithm, - crypto_algorithm=crypto_algorithm, - compression_filter=compression_filter) - - # Setup worker to send encrypted data chunks to the backup_target - def compute_progress(new_size, total_backup_size): - global blocks_backedup - blocks_backedup += new_size - if callable(progress_callback): - this_progress = blocks_backedup / float(total_backup_size) - progress_callback(int(round(this_progress * 100, 2))) - - to_send = Queue(10) - send_proc = SendWorker(to_send, backup_tmpdir, backup_stdout) - send_proc.start() - - for f in header_files: - to_send.put(f) - - for filename in files_to_backup: - if BACKUP_DEBUG: - print "Backing up", filename - - backup_tempfile = os.path.join(backup_tmpdir, - filename["subdir"], - os.path.basename(filename["path"])) - if BACKUP_DEBUG: - print "Using temporary location:", backup_tempfile - - # Ensure the temporary directory exists - if not os.path.isdir(os.path.dirname(backup_tempfile)): - os.makedirs(os.path.dirname(backup_tempfile)) - - # The first tar cmd can use any complex feature as we want. Files will - # be verified before untaring this. - # Prefix the path in archive with filename["subdir"] to have it - # verified during untar - tar_cmdline = (["tar", "-Pc", '--sparse', - "-f", backup_pipe, - '-C', os.path.dirname(filename["path"])] + - (['--dereference'] if filename["subdir"] != "dom0-home/" - else []) + - ['--xform', 's:^%s:%s\\0:' % ( - os.path.basename(filename["path"]), - filename["subdir"]), - os.path.basename(filename["path"]) - ]) - if compressed: - tar_cmdline.insert(-1, - "--use-compress-program=%s" % compression_filter) - - if BACKUP_DEBUG: - print " ".join(tar_cmdline) - - # Tips: Popen(bufsize=0) - # Pipe: tar-sparse | encryptor [| hmac] | tar | backup_target - # Pipe: tar-sparse [| hmac] | tar | backup_target - tar_sparse = subprocess.Popen(tar_cmdline, stdin=subprocess.PIPE, - stderr=(open(os.devnull, 'w') - if not BACKUP_DEBUG - else None)) - running_backup_operation.processes_to_kill_on_cancel.append(tar_sparse) - - # Wait for compressor (tar) process to finish or for any error of other - # subprocesses - i = 0 - run_error = "paused" - encryptor = None - if encrypted: - # Start encrypt - # If no cipher is provided, the data is forwarded unencrypted !!! - encryptor = subprocess.Popen(["openssl", "enc", - "-e", "-" + crypto_algorithm, - "-pass", "pass:" + passphrase], - stdin=open(backup_pipe, 'rb'), - stdout=subprocess.PIPE) - pipe = encryptor.stdout - else: - pipe = open(backup_pipe, 'rb') - while run_error == "paused": - - # Start HMAC - hmac = subprocess.Popen(["openssl", "dgst", - "-" + hmac_algorithm, "-hmac", passphrase], - stdin=subprocess.PIPE, - stdout=subprocess.PIPE) - - # Prepare a first chunk - chunkfile = backup_tempfile + "." + "%03d" % i - i += 1 - chunkfile_p = open(chunkfile, 'wb') - - common_args = { - 'backup_target': chunkfile_p, - 'total_backup_sz': total_backup_sz, - 'hmac': hmac, - 'vmproc': vmproc, - 'addproc': tar_sparse, - 'progress_callback': compute_progress, - 'size_limit': 100 * 1024 * 1024, - } - run_error = wait_backup_feedback( - in_stream=pipe, streamproc=encryptor, - **common_args) - chunkfile_p.close() - - if BACKUP_DEBUG: - print "Wait_backup_feedback returned:", run_error - - if running_backup_operation.canceled: - try: - tar_sparse.terminate() - except: - pass - try: - hmac.terminate() - except: - pass - tar_sparse.wait() - hmac.wait() - to_send.put("ERROR") - send_proc.join() - shutil.rmtree(backup_tmpdir) - running_backup_operation = None - raise BackupCanceledError("Backup canceled") - if run_error and run_error != "size_limit": - send_proc.terminate() - if run_error == "VM" and vmproc: - raise qubes.exc.QubesException( - "Failed to write the backup, VM output:\n" + - vmproc.stderr.read(MAX_STDERR_BYTES)) - else: - raise qubes.exc.QubesException("Failed to perform backup: error in " + - run_error) - - # Send the chunk to the backup target - queue_put_with_check( - send_proc, vmproc, to_send, - os.path.relpath(chunkfile, backup_tmpdir)) - - # Close HMAC - hmac.stdin.close() - hmac.wait() - if BACKUP_DEBUG: - print "HMAC proc return code:", hmac.poll() - - # Write HMAC data next to the chunk file - hmac_data = hmac.stdout.read() - if BACKUP_DEBUG: - print "Writing hmac to", chunkfile + ".hmac" - hmac_file = open(chunkfile + ".hmac", 'w') - hmac_file.write(hmac_data) - hmac_file.flush() - hmac_file.close() - - # Send the HMAC to the backup target - queue_put_with_check( - send_proc, vmproc, to_send, - os.path.relpath(chunkfile, backup_tmpdir) + ".hmac") - - if tar_sparse.poll() is None or run_error == "size_limit": - run_error = "paused" + # Prepare the backup target (local file) + if os.path.isdir(self.target_dir): + backup_target = self.target_dir + "/qubes-{0}". \ + format(time.strftime("%Y-%m-%dT%H%M%S")) else: - running_backup_operation.processes_to_kill_on_cancel.remove( - tar_sparse) - if BACKUP_DEBUG: - print "Finished tar sparse with exit code", tar_sparse \ - .poll() - pipe.close() + backup_target = self.target_dir - queue_put_with_check(send_proc, vmproc, to_send, "FINISHED") - send_proc.join() - shutil.rmtree(backup_tmpdir) + # Create the target directory + if not os.path.exists(os.path.dirname(self.target_dir)): + raise qubes.exc.QubesException( + "ERROR: the backup directory for {0} does not exists". + format(self.target_dir)) - if running_backup_operation.canceled: - running_backup_operation = None - raise BackupCanceledError("Backup canceled") + # If not APPVM, STDOUT is a local file + backup_stdout = open(backup_target, 'wb') - running_backup_operation = None - - if send_proc.exitcode != 0: - raise qubes.exc.QubesException( - "Failed to send backup: error in the sending process") - - if vmproc: + # Tar with tape length does not deals well with stdout (close stdout between + # two tapes) + # For this reason, we will use named pipes instead if BACKUP_DEBUG: - print "VMProc1 proc return code:", vmproc.poll() - if tar_sparse is not None: - print "Sparse1 proc return code:", tar_sparse.poll() - vmproc.stdin.close() + print "Working in", self.tmpdir - # Save date of last backup - for vm in app.domains: - if vm.backup_content: - vm.backup_timestamp = datetime.datetime.now() + backup_pipe = os.path.join(self.tmpdir, "backup_pipe") + if BACKUP_DEBUG: + print "Creating pipe in:", backup_pipe + os.mkfifo(backup_pipe) - app.save() + if BACKUP_DEBUG: + print "Will backup:", files_to_backup + + header_files = self.prepare_backup_header() + + # Setup worker to send encrypted data chunks to the backup_target + to_send = Queue(10) + send_proc = SendWorker(to_send, self.tmpdir, backup_stdout) + send_proc.start() + + for f in header_files: + to_send.put(f) + + vm_files_to_backup = self.get_files_to_backup() + qubes_xml_info = { + 'files': self._file_to_backup(qubes_xml, ''), + 'vm': None, + 'size': 0, + 'subdir': '', + } + for vm_info in itertools.chain([qubes_xml_info], + vm_files_to_backup.itervalues()): + for file_info in vm_info['files']: + + if BACKUP_DEBUG: + print "Backing up", file_info + + backup_tempfile = os.path.join(self.tmpdir, + file_info["subdir"], + os.path.basename(file_info["path"])) + if BACKUP_DEBUG: + print "Using temporary location:", backup_tempfile + + # Ensure the temporary directory exists + if not os.path.isdir(os.path.dirname(backup_tempfile)): + os.makedirs(os.path.dirname(backup_tempfile)) + + # The first tar cmd can use any complex feature as we want. Files will + # be verified before untaring this. + # Prefix the path in archive with filename["subdir"] to have it + # verified during untar + tar_cmdline = (["tar", "-Pc", '--sparse', + "-f", backup_pipe, + '-C', os.path.dirname(file_info["path"])] + + (['--dereference'] if file_info["subdir"] != "dom0-home/" + else []) + + ['--xform', 's:^%s:%s\\0:' % ( + os.path.basename(file_info["path"]), + file_info["subdir"]), + os.path.basename(file_info["path"]) + ]) + if self.compressed: + tar_cmdline.insert(-1, + "--use-compress-program=%s" % self.compression_filter) + + if BACKUP_DEBUG: + print " ".join(tar_cmdline) + + # Tips: Popen(bufsize=0) + # Pipe: tar-sparse | encryptor [| hmac] | tar | backup_target + # Pipe: tar-sparse [| hmac] | tar | backup_target + tar_sparse = subprocess.Popen(tar_cmdline, stdin=subprocess.PIPE, + stderr=(open(os.devnull, 'w') + if not BACKUP_DEBUG + else None)) + self.processes_to_kill_on_cancel.append(tar_sparse) + + # Wait for compressor (tar) process to finish or for any error of other + # subprocesses + i = 0 + run_error = "paused" + encryptor = None + if self.encrypted: + # Start encrypt + # If no cipher is provided, the data is forwarded unencrypted !!! + encryptor = subprocess.Popen([ + "openssl", "enc", + "-e", "-" + self.crypto_algorithm, + "-pass", "pass:" + passphrase], + stdin=open(backup_pipe, 'rb'), + stdout=subprocess.PIPE) + pipe = encryptor.stdout + else: + pipe = open(backup_pipe, 'rb') + while run_error == "paused": + + # Start HMAC + hmac = subprocess.Popen([ + "openssl", "dgst", "-" + self.hmac_algorithm, + "-hmac", passphrase], + stdin=subprocess.PIPE, + stdout=subprocess.PIPE) + + # Prepare a first chunk + chunkfile = backup_tempfile + "." + "%03d" % i + i += 1 + chunkfile_p = open(chunkfile, 'wb') + + common_args = { + 'backup_target': chunkfile_p, + 'hmac': hmac, + 'vmproc': vmproc, + 'addproc': tar_sparse, + 'progress_callback': self._add_vm_progress, + 'size_limit': self.chunk_size, + } + run_error = wait_backup_feedback( + in_stream=pipe, streamproc=encryptor, + **common_args) + chunkfile_p.close() + + if BACKUP_DEBUG: + print "Wait_backup_feedback returned:", run_error + + if self.canceled: + try: + tar_sparse.terminate() + except: + pass + try: + hmac.terminate() + except: + pass + tar_sparse.wait() + hmac.wait() + to_send.put("ERROR") + send_proc.join() + shutil.rmtree(self.tmpdir) + raise BackupCanceledError("Backup canceled") + if run_error and run_error != "size_limit": + send_proc.terminate() + if run_error == "VM" and vmproc: + raise qubes.exc.QubesException( + "Failed to write the backup, VM output:\n" + + vmproc.stderr.read(MAX_STDERR_BYTES)) + else: + raise qubes.exc.QubesException("Failed to perform backup: error in " + + run_error) + + # Send the chunk to the backup target + self._queue_put_with_check( + send_proc, vmproc, to_send, + os.path.relpath(chunkfile, self.tmpdir)) + + # Close HMAC + hmac.stdin.close() + hmac.wait() + if BACKUP_DEBUG: + print "HMAC proc return code:", hmac.poll() + + # Write HMAC data next to the chunk file + hmac_data = hmac.stdout.read() + if BACKUP_DEBUG: + print "Writing hmac to", chunkfile + ".hmac" + hmac_file = open(chunkfile + ".hmac", 'w') + hmac_file.write(hmac_data) + hmac_file.flush() + hmac_file.close() + + # Send the HMAC to the backup target + self._queue_put_with_check( + send_proc, vmproc, to_send, + os.path.relpath(chunkfile, self.tmpdir) + ".hmac") + + if tar_sparse.poll() is None or run_error == "size_limit": + run_error = "paused" + else: + self.processes_to_kill_on_cancel.remove(tar_sparse) + if BACKUP_DEBUG: + print "Finished tar sparse with exit code", tar_sparse \ + .poll() + pipe.close() + + # This VM done, update progress + self._done_vms_bytes += vm_info['size'] + self._current_vm_bytes = 0 + self._send_progress_update() + + self._queue_put_with_check(send_proc, vmproc, to_send, "FINISHED") + send_proc.join() + shutil.rmtree(self.tmpdir) + + if self.canceled: + raise BackupCanceledError("Backup canceled") + + if send_proc.exitcode != 0: + raise qubes.exc.QubesException( + "Failed to send backup: error in the sending process") + + if vmproc: + if BACKUP_DEBUG: + print "VMProc1 proc return code:", vmproc.poll() + if tar_sparse is not None: + print "Sparse1 proc return code:", tar_sparse.poll() + vmproc.stdin.close() + + # Save date of last backup + for vm in self.app.domains: + if vm.backup_content: + vm.backup_timestamp = datetime.datetime.now() + + self.app.save() ''' @@ -777,7 +861,7 @@ def backup_do(app, base_backup_dir, files_to_backup, passphrase, def wait_backup_feedback(progress_callback, in_stream, streamproc, - backup_target, total_backup_sz, hmac=None, vmproc=None, + backup_target, hmac=None, vmproc=None, addproc=None, size_limit=None): buffer_size = 409600 @@ -790,7 +874,8 @@ def wait_backup_feedback(progress_callback, in_stream, streamproc, if size_limit and bytes_copied + buffer_size > size_limit: return "size_limit" buf = in_stream.read(buffer_size) - progress_callback(len(buf), total_backup_sz) + if callable(progress_callback): + progress_callback(len(buf)) bytes_copied += len(buf) run_count = 0 @@ -848,46 +933,8 @@ def wait_backup_feedback(progress_callback, in_stream, streamproc, return run_error - -def verify_hmac(filename, hmacfile, passphrase, algorithm): - if BACKUP_DEBUG: - print "Verifying file " + filename - - if hmacfile != filename + ".hmac": - raise qubes.exc.QubesException( - "ERROR: expected hmac for {}, but got {}". - format(filename, hmacfile)) - - hmac_proc = subprocess.Popen(["openssl", "dgst", "-" + algorithm, - "-hmac", passphrase], - stdin=open(filename, 'rb'), - stdout=subprocess.PIPE, stderr=subprocess.PIPE) - hmac_stdout, hmac_stderr = hmac_proc.communicate() - - if len(hmac_stderr) > 0: - raise qubes.exc.QubesException( - "ERROR: verify file {0}: {1}".format(filename, hmac_stderr)) - else: - if BACKUP_DEBUG: - print "Loading hmac for file " + filename - hmac = load_hmac(open(hmacfile, 'r').read()) - - if len(hmac) > 0 and load_hmac(hmac_stdout) == hmac: - os.unlink(hmacfile) - if BACKUP_DEBUG: - print "File verification OK -> Sending file " + filename - return True - else: - raise qubes.exc.QubesException( - "ERROR: invalid hmac for file {0}: {1}. " - "Is the passphrase correct?". - format(filename, load_hmac(hmac_stdout))) - # Not reachable - return False - - class ExtractWorker2(Process): - def __init__(self, queue, base_dir, passphrase, encrypted, total_size, + def __init__(self, queue, base_dir, passphrase, encrypted, print_callback, error_callback, progress_callback, vmproc=None, compressed=False, crypto_algorithm=DEFAULT_CRYPTO_ALGORITHM, verify_only=False): @@ -899,7 +946,6 @@ class ExtractWorker2(Process): self.compressed = compressed self.crypto_algorithm = crypto_algorithm self.verify_only = verify_only - self.total_size = total_size self.blocks_backedup = 0 self.tar2_process = None self.tar2_current_file = None @@ -919,13 +965,6 @@ class ExtractWorker2(Process): self.stderr_encoding = sys.stderr.encoding or 'utf-8' - def compute_progress(self, new_size, _): - if self.progress_callback: - self.blocks_backedup += new_size - progress = self.blocks_backedup / float(self.total_size) - progress = int(round(progress * 100, 2)) - self.progress_callback(progress) - def collect_tar_output(self): if not self.tar2_process.stderr: return @@ -1031,7 +1070,6 @@ class ExtractWorker2(Process): pipe = open(self.restore_pipe, 'wb') common_args = { 'backup_target': pipe, - 'total_backup_sz': self.total_size, 'hmac': None, 'vmproc': self.vmproc, 'addproc': self.tar2_process @@ -1049,7 +1087,7 @@ class ExtractWorker2(Process): stdout=subprocess.PIPE) run_error = wait_backup_feedback( - progress_callback=self.compute_progress, + progress_callback=self.progress_callback, in_stream=self.decryptor_process.stdout, streamproc=self.decryptor_process, **common_args) @@ -1060,13 +1098,13 @@ class ExtractWorker2(Process): stdout=subprocess.PIPE) run_error = wait_backup_feedback( - progress_callback=self.compute_progress, + progress_callback=self.progress_callback, in_stream=self.decompressor_process.stdout, streamproc=self.decompressor_process, **common_args) else: run_error = wait_backup_feedback( - progress_callback=self.compute_progress, + progress_callback=self.progress_callback, in_stream=open(filename, "rb"), streamproc=None, **common_args) @@ -1122,12 +1160,12 @@ class ExtractWorker2(Process): class ExtractWorker3(ExtractWorker2): - def __init__(self, queue, base_dir, passphrase, encrypted, total_size, + def __init__(self, queue, base_dir, passphrase, encrypted, print_callback, error_callback, progress_callback, vmproc=None, compressed=False, crypto_algorithm=DEFAULT_CRYPTO_ALGORITHM, compression_filter=None, verify_only=False): super(ExtractWorker3, self).__init__(queue, base_dir, passphrase, - encrypted, total_size, + encrypted, print_callback, error_callback, progress_callback, vmproc, compressed, crypto_algorithm, @@ -1223,14 +1261,13 @@ class ExtractWorker3(ExtractWorker2): common_args = { 'backup_target': input_pipe, - 'total_backup_sz': self.total_size, 'hmac': None, 'vmproc': self.vmproc, 'addproc': self.tar2_process } run_error = wait_backup_feedback( - progress_callback=self.compute_progress, + progress_callback=self.progress_callback, in_stream=open(filename, "rb"), streamproc=None, **common_args) @@ -1281,7 +1318,7 @@ class ExtractWorker3(ExtractWorker2): self.print_callback("Finished extracting thread") -def get_supported_hmac_algo(hmac_algorithm): +def get_supported_hmac_algo(hmac_algorithm=None): # Start with provided default if hmac_algorithm: yield hmac_algorithm @@ -1293,141 +1330,258 @@ def get_supported_hmac_algo(hmac_algorithm): yield algo.strip() proc.wait() - -def parse_backup_header(filename): - header_data = {} - with open(filename, 'r') as f: - for line in f.readlines(): - if line.count('=') != 1: - raise qubes.exc.QubesException("Invalid backup header (line %s)" % line) - (key, value) = line.strip().split('=') - if not any([key == getattr(BackupHeader, attr) for attr in dir( - BackupHeader)]): - # Ignoring unknown option - continue - if key in BackupHeader.bool_options: - value = value.lower() in ["1", "true", "yes"] - elif key in BackupHeader.int_options: - value = int(value) - header_data[key] = value - return header_data +class BackupRestoreOptions(object): + def __init__(self): + #: use default NetVM if the one referenced in backup do not exists on + # the host + self.use_default_netvm = True + #: set NetVM to "none" if the one referenced in backup do not exists + # on the host + self.use_none_netvm = False + #: set template to default if the one referenced in backup do not + # exists on the host + self.use_default_template = True + #: restore dom0 home + self.dom0_home = True + #: dictionary how what templates should be used instead of those + # referenced in backup + self.replace_template = {} + #: restore dom0 home even if username is different + self.ignore_username_mismatch = False + #: do not restore data, only verify backup integrity + self.verify_only = False + #: automatically rename VM during restore, when it would conflict + # with existing one + self.rename_conflicting = True + #: list of VM names to exclude + self.exclude = [] -def restore_vm_dirs(backup_source, restore_tmpdir, passphrase, vms_dirs, vms, - vms_size, print_callback=None, error_callback=None, - progress_callback=None, encrypted=False, appvm=None, - compressed=False, hmac_algorithm=DEFAULT_HMAC_ALGORITHM, - crypto_algorithm=DEFAULT_CRYPTO_ALGORITHM, - verify_only=False, - format_version=CURRENT_BACKUP_FORMAT_VERSION, - compression_filter=None): - global running_backup_operation +class BackupRestore(object): + """Usage: + >>> restore_op = BackupRestore(...) + >>> # adjust restore_op.options here + >>> restore_info = restore_op.get_restore_info() + >>> # manipulate restore_info to select VMs to restore here + >>> restore_op.restore_do(restore_info) + """ - if callable(print_callback): + def __init__(self, app, backup_location, backup_vm, passphrase): + super(BackupRestore, self).__init__() + + #: qubes.Qubes instance + self.app = app + + #: options how the backup should be restored + self.options = BackupRestoreOptions() + + #: VM from which backup should be retrieved + self.backup_vm = backup_vm + if backup_vm and backup_vm.qid == 0: + self.backup_vm = None + + #: backup path, inside VM pointed by :py:attr:`backup_vm` + self.backup_location = backup_location + + #: passphrase protecting backup integrity and optionally decryption + self.passphrase = passphrase + + #: temporary directory used to extract the data before moving to the + # final location; should be on the same filesystem as /var/lib/qubes + self.tmpdir = tempfile.mkdtemp(prefix="restore", dir="/var/tmp") + + #: list of processes (Popen objects) to kill on cancel + self.processes_to_kill_on_cancel = [] + + #: is the backup operation canceled + self.canceled = False + + # TODO: convert to python logging API + self.print_callback = print_stdout + self.error_callback = print_stderr + + #: report restore progress, called with one argument - percents of + # data restored + # FIXME: convert to float [0,1] + self.progress_callback = None + + #: basic information about the backup + self.header_data = self._retrieve_backup_header() + + #: VMs included in the backup + self.backup_app = self._process_qubes_xml() + + def cancel(self): + """Cancel running backup operation. Can be called from another thread. + """ + self.canceled = True + for proc in self.processes_to_kill_on_cancel: + try: + proc.terminate() + except: + pass + + def _start_retrieval_process(self, filelist, limit_count, limit_bytes): + """Retrieve backup stream and extract it to :py:attr:`tmpdir` + + :param filelist: list of files to extract; listing directory name + will extract the whole directory; use empty list to extract the whole + archive + :param limit_count: maximum number of files to extract + :param limit_bytes: maximum size of extracted data + :return: a touple of (Popen object of started process, file-like + object for reading extracted files list, file-like object for reading + errors) + """ + + vmproc = None + if self.backup_vm is not None: + # Prepare the backup target (Qubes service call) + backup_target = "QUBESRPC qubes.Restore dom0" + + # If APPVM, STDOUT is a PIPE + vmproc = self.backup_vm.run( + command=backup_target, passio_popen=True, passio_stderr=True) + vmproc.stdin.write( + self.backup_location.replace("\r", "").replace("\n", "") + "\n") + + # Send to tar2qfile the VMs that should be extracted + vmproc.stdin.write(" ".join(filelist) + "\n") + self.processes_to_kill_on_cancel.append(vmproc) + + backup_stdin = vmproc.stdout + tar1_command = ['/usr/libexec/qubes/qfile-dom0-unpacker', + str(os.getuid()), self.tmpdir, '-v'] + else: + backup_stdin = open(self.backup_location, 'rb') + + tar1_command = ['tar', + '-ixv', + '-C', self.tmpdir] + filelist + + tar1_env = os.environ.copy() + tar1_env['UPDATES_MAX_BYTES'] = str(limit_bytes) + tar1_env['UPDATES_MAX_FILES'] = str(limit_count) + if BACKUP_DEBUG and callable(self.print_callback): + self.print_callback("Run command" + unicode(tar1_command)) + command = subprocess.Popen( + tar1_command, + stdin=backup_stdin, + stdout=vmproc.stdin if vmproc else subprocess.PIPE, + stderr=subprocess.PIPE, + env=tar1_env) + self.processes_to_kill_on_cancel.append(command) + + # qfile-dom0-unpacker output filelist on stderr (and have stdout connected + # to the VM), while tar output filelist on stdout + if self.backup_vm: + filelist_pipe = command.stderr + # let qfile-dom0-unpacker hold the only open FD to the write end of + # pipe, otherwise qrexec-client will not receive EOF when + # qfile-dom0-unpacker terminates + vmproc.stdin.close() + else: + filelist_pipe = command.stdout + + if self.backup_vm: + error_pipe = vmproc.stderr + else: + error_pipe = command.stderr + return command, filelist_pipe, error_pipe + + def _verify_hmac(self, filename, hmacfile, algorithm=None): + def load_hmac(hmac): + hmac = hmac.strip().split("=") + if len(hmac) > 1: + hmac = hmac[1].strip() + else: + raise qubes.exc.QubesException("ERROR: invalid hmac file content") + + return hmac + if algorithm is None: + algorithm = self.header_data.hmac_algorithm + passphrase = self.passphrase.encode('utf-8') if BACKUP_DEBUG: - print_callback("Working in temporary dir:" + restore_tmpdir) - print_callback( - "Extracting data: " + size_to_human(vms_size) + " to restore") + print "Verifying file " + filename - passphrase = passphrase.encode('utf-8') - header_data = None - vmproc = None - if appvm is not None: - # Prepare the backup target (Qubes service call) - backup_target = "QUBESRPC qubes.Restore dom0" + if hmacfile != filename + ".hmac": + raise qubes.exc.QubesException( + "ERROR: expected hmac for {}, but got {}". + format(filename, hmacfile)) - # If APPVM, STDOUT is a PIPE - vmproc = appvm.run(command=backup_target, passio_popen=True, - passio_stderr=True) - vmproc.stdin.write( - backup_source.replace("\r", "").replace("\n", "") + "\n") + hmac_proc = subprocess.Popen( + ["openssl", "dgst", "-" + algorithm, "-hmac", passphrase], + stdin=open(os.path.join(self.tmpdir, filename), 'rb'), + stdout=subprocess.PIPE, stderr=subprocess.PIPE) + hmac_stdout, hmac_stderr = hmac_proc.communicate() - # Send to tar2qfile the VMs that should be extracted - vmproc.stdin.write(" ".join(vms_dirs) + "\n") - if running_backup_operation: - running_backup_operation.processes_to_kill_on_cancel.append(vmproc) + if len(hmac_stderr) > 0: + raise qubes.exc.QubesException( + "ERROR: verify file {0}: {1}".format(filename, hmac_stderr)) + else: + if BACKUP_DEBUG: + print "Loading hmac for file " + filename + hmac = load_hmac(open(os.path.join(self.tmpdir, hmacfile), + 'r').read()) - backup_stdin = vmproc.stdout - tar1_command = ['/usr/libexec/qubes/qfile-dom0-unpacker', - str(os.getuid()), restore_tmpdir, '-v'] - else: - backup_stdin = open(backup_source, 'rb') + if len(hmac) > 0 and load_hmac(hmac_stdout) == hmac: + os.unlink(os.path.join(self.tmpdir, hmacfile)) + if BACKUP_DEBUG: + print "File verification OK -> Sending file " + filename + return True + else: + raise qubes.exc.QubesException( + "ERROR: invalid hmac for file {0}: {1}. " + "Is the passphrase correct?". + format(filename, load_hmac(hmac_stdout))) - tar1_command = ['tar', - '-ixvf', backup_source, - '-C', restore_tmpdir] + vms_dirs + def _retrieve_backup_header(self): + """Retrieve backup header and qubes.xml. Only backup header is + analyzed, qubes.xml is left as-is + (not even verified/decrypted/uncompressed) - tar1_env = os.environ.copy() - # TODO: add some safety margin? - tar1_env['UPDATES_MAX_BYTES'] = str(vms_size) - # Restoring only header - if vms_dirs and vms_dirs[0] == HEADER_FILENAME: - # backup-header, backup-header.hmac, qubes-xml.000, qubes-xml.000.hmac - tar1_env['UPDATES_MAX_FILES'] = '4' - else: - # Currently each VM consists of at most 7 archives (count - # file_to_backup calls in backup_prepare()), but add some safety - # margin for further extensions. Each archive is divided into 100MB - # chunks. Additionally each file have own hmac file. So assume upper - # limit as 2*(10*COUNT_OF_VMS+TOTAL_SIZE/100MB) - tar1_env['UPDATES_MAX_FILES'] = str(2 * (10 * len(vms_dirs) + - int(vms_size / - (100 * 1024 * 1024)))) - if BACKUP_DEBUG and callable(print_callback): - print_callback("Run command" + unicode(tar1_command)) - command = subprocess.Popen( - tar1_command, - stdin=backup_stdin, - stdout=vmproc.stdin if vmproc else subprocess.PIPE, - stderr=subprocess.PIPE, - env=tar1_env) - if running_backup_operation: - running_backup_operation.processes_to_kill_on_cancel.append(command) + :return header_data + :rtype :py:class:`BackupHeader` + """ - # qfile-dom0-unpacker output filelist on stderr (and have stdout connected - # to the VM), while tar output filelist on stdout - if appvm: - filelist_pipe = command.stderr - # let qfile-dom0-unpacker hold the only open FD to the write end of - # pipe, otherwise qrexec-client will not receive EOF when - # qfile-dom0-unpacker terminates - vmproc.stdin.close() - else: - filelist_pipe = command.stdout + if not self.backup_vm and os.path.exists( + os.path.join(self.backup_location, 'qubes.xml')): + # backup format version 1 doesn't have header + header_data = BackupHeader() + header_data.version = 1 + return header_data - expect_tar_error = False + (retrieve_proc, filelist_pipe, error_pipe) = \ + self._start_retrieval_process( + ['backup-header', 'backup-header.hmac', + 'qubes.xml.000', 'qubes.xml.000.hmac'], 4, 1024 * 1024) - to_extract = Queue() - nextfile = None + nextfile = None + expect_tar_error = False - # If want to analyze backup header, do it now - if vms_dirs and vms_dirs[0] == HEADER_FILENAME: filename = filelist_pipe.readline().strip() hmacfile = filelist_pipe.readline().strip() - if not appvm: + # tar output filename before actually extracting it, so wait for the + # next one before trying to access it + if not self.backup_vm: nextfile = filelist_pipe.readline().strip() - if BACKUP_DEBUG and callable(print_callback): - print_callback("Got backup header and hmac: %s, %s" % (filename, - hmacfile)) + if BACKUP_DEBUG and callable(self.print_callback): + self.print_callback("Got backup header and hmac: %s, %s" % ( + filename, hmacfile)) if not filename or filename == "EOF" or \ not hmacfile or hmacfile == "EOF": - if appvm: - vmproc.wait() - proc_error_msg = vmproc.stderr.read(MAX_STDERR_BYTES) - else: - command.wait() - proc_error_msg = command.stderr.read(MAX_STDERR_BYTES) - raise qubes.exc.QubesException("Premature end of archive while receiving " - "backup header. Process output:\n" + - proc_error_msg) - filename = os.path.join(restore_tmpdir, filename) - hmacfile = os.path.join(restore_tmpdir, hmacfile) + retrieve_proc.wait() + proc_error_msg = error_pipe.read(MAX_STDERR_BYTES) + raise qubes.exc.QubesException( + "Premature end of archive while receiving " + "backup header. Process output:\n" + proc_error_msg) file_ok = False + hmac_algorithm = DEFAULT_HMAC_ALGORITHM for hmac_algo in get_supported_hmac_algo(hmac_algorithm): try: - if verify_hmac(filename, hmacfile, passphrase, hmac_algo): + if self._verify_hmac(filename, hmacfile, hmac_algo): file_ok = True hmac_algorithm = hmac_algo break @@ -1435,896 +1589,762 @@ def restore_vm_dirs(backup_source, restore_tmpdir, passphrase, vms_dirs, vms, # Ignore exception here, try the next algo pass if not file_ok: - raise qubes.exc.QubesException("Corrupted backup header (hmac verification " - "failed). Is the password correct?") + raise qubes.exc.QubesException( + "Corrupted backup header (hmac verification " + "failed). Is the password correct?") if os.path.basename(filename) == HEADER_FILENAME: - header_data = parse_backup_header(filename) - if BackupHeader.version in header_data: - format_version = header_data[BackupHeader.version] - if BackupHeader.crypto_algorithm in header_data: - crypto_algorithm = header_data[BackupHeader.crypto_algorithm] - if BackupHeader.hmac_algorithm in header_data: - hmac_algorithm = header_data[BackupHeader.hmac_algorithm] - if BackupHeader.compressed in header_data: - compressed = header_data[BackupHeader.compressed] - if BackupHeader.encrypted in header_data: - encrypted = header_data[BackupHeader.encrypted] - if BackupHeader.compression_filter in header_data: - compression_filter = header_data[ - BackupHeader.compression_filter] + filename = os.path.join(self.tmpdir, filename) + header_data = BackupHeader(open(filename, 'r').read()) os.unlink(filename) else: # if no header found, create one with guessed HMAC algo - header_data = {BackupHeader.hmac_algorithm: hmac_algorithm} - # If this isn't backup header, pass it to ExtractWorker - to_extract.put(filename) + header_data = BackupHeader() + header_data.version = 2 + header_data.hmac_algorithm = hmac_algorithm + # place explicitly this value, because it is what format_version + # 2 have + header_data.crypto_algorithm = 'aes-256-cbc' + # TODO: set header_data.encrypted to something... # when tar do not find expected file in archive, it exit with # code 2. This will happen because we've requested backup-header # file, but the archive do not contain it. Ignore this particular # error. - if not appvm: + if not self.backup_vm: expect_tar_error = True - # Setup worker to extract encrypted data chunks to the restore dirs - # Create the process here to pass it options extracted from backup header - extractor_params = { - 'queue': to_extract, - 'base_dir': restore_tmpdir, - 'passphrase': passphrase, - 'encrypted': encrypted, - 'compressed': compressed, - 'crypto_algorithm': crypto_algorithm, - 'verify_only': verify_only, - 'total_size': vms_size, - 'print_callback': print_callback, - 'error_callback': error_callback, - 'progress_callback': progress_callback, - } - if format_version == 2: - extract_proc = ExtractWorker2(**extractor_params) - elif format_version == 3: - extractor_params['compression_filter'] = compression_filter - extract_proc = ExtractWorker3(**extractor_params) - else: - raise NotImplemented( - "Backup format version %d not supported" % format_version) - extract_proc.start() + if retrieve_proc.wait() != 0 and not expect_tar_error: + raise qubes.exc.QubesException( + "unable to read the qubes backup file {0} ({1}): {2}".format( + self.backup_location, + retrieve_proc.wait(), + error_pipe.read(MAX_STDERR_BYTES) + )) + if retrieve_proc in self.processes_to_kill_on_cancel: + self.processes_to_kill_on_cancel.remove(retrieve_proc) + # wait for other processes (if any) + for proc in self.processes_to_kill_on_cancel: + if proc.wait() != 0: + raise qubes.exc.QubesException( + "Backup header retrieval failed (exit code {})".format( + proc.wait()) + ) + return header_data - try: - filename = None - while True: - if running_backup_operation and running_backup_operation.canceled: - break - if not extract_proc.is_alive(): - command.terminate() - command.wait() - expect_tar_error = True - if vmproc: - vmproc.terminate() - vmproc.wait() - vmproc = None - break - if nextfile is not None: - filename = nextfile - else: - filename = filelist_pipe.readline().strip() + def _start_inner_extraction_worker(self, queue): + """Start a worker process, extracting inner layer of bacup archive, + extract them to :py:attr:`tmpdir`. + End the data by pushing "FINISHED" or "ERROR" to the queue. - if BACKUP_DEBUG and callable(print_callback): - print_callback("Getting new file:" + filename) + :param queue :py:class:`Queue` object to handle files from + """ - if not filename or filename == "EOF": - break + # Setup worker to extract encrypted data chunks to the restore dirs + # Create the process here to pass it options extracted from backup header + extractor_params = { + 'queue': queue, + 'base_dir': self.tmpdir, + 'passphrase': self.passphrase, + 'encrypted': self.header_data.encrypted, + 'compressed': self.header_data.compressed, + 'crypto_algorithm': self.header_data.crypto_algorithm, + 'verify_only': self.options.verify_only, + 'print_callback': self.print_callback, + 'error_callback': print_stderr, + 'progress_callback': self.progress_callback, + } + format_version = self.header_data.version + if format_version == 2: + extract_proc = ExtractWorker2(**extractor_params) + elif format_version == 3: + extractor_params['compression_filter'] = \ + self.header_data.compression_filter + extract_proc = ExtractWorker3(**extractor_params) + else: + raise NotImplementedError( + "Backup format version %d not supported" % format_version) + extract_proc.start() + return extract_proc - hmacfile = filelist_pipe.readline().strip() + def _process_qubes_xml(self): + """Verify, unpack and load qubes.xml. Possibly convert its format if + necessary. It expect that :py:attr:`header_data` is already populated, + and :py:meth:`retrieve_backup_header` was called. + """ + if self.header_data.version == 1: + raise NotImplementedError("TODO: conversion core[12] qubes.xml") + else: + self._verify_hmac("qubes.xml.000", "qubes.xml.000.hmac") + queue = Queue() + queue.put("qubes.xml.000") + queue.put("FINISHED") - if running_backup_operation and running_backup_operation.canceled: - break - # if reading archive directly with tar, wait for next filename - - # tar prints filename before processing it, so wait for - # the next one to be sure that whole file was extracted - if not appvm: - nextfile = filelist_pipe.readline().strip() + extract_proc = self._start_inner_extraction_worker(queue) + extract_proc.join() + if extract_proc.exitcode != 0: + raise qubes.exc.QubesException( + "unable to extract the qubes backup. " + "Check extracting process errors.") - if BACKUP_DEBUG and callable(print_callback): - print_callback("Getting hmac:" + hmacfile) - if not hmacfile or hmacfile == "EOF": - # Premature end of archive, either of tar1_command or - # vmproc exited with error - break + if self.header_data.version in [2]: # TODO add 3 + raise NotImplementedError("TODO: conversion core[12] qubes.xml") + else: + backup_app = qubes.Qubes(os.path.join(self.tmpdir, 'qubes.xml')) + # Not needed anymore - all the data stored in backup_app + os.unlink(os.path.join(self.tmpdir, 'qubes.xml')) + return backup_app - if not any(map(lambda x: filename.startswith(x), vms_dirs)): - if BACKUP_DEBUG and callable(print_callback): - print_callback("Ignoring VM not selected for restore") - os.unlink(os.path.join(restore_tmpdir, filename)) - os.unlink(os.path.join(restore_tmpdir, hmacfile)) + def _restore_vm_dirs(self, vms_dirs, vms_size): + # Currently each VM consists of at most 7 archives (count + # file_to_backup calls in backup_prepare()), but add some safety + # margin for further extensions. Each archive is divided into 100MB + # chunks. Additionally each file have own hmac file. So assume upper + # limit as 2*(10*COUNT_OF_VMS+TOTAL_SIZE/100MB) + limit_count = str(2 * (10 * len(vms_dirs) + + int(vms_size / (100 * 1024 * 1024)))) + + if callable(self.print_callback): + if BACKUP_DEBUG: + self.print_callback("Working in temporary dir:" + + self.tmpdir) + self.print_callback( + "Extracting data: " + size_to_human(vms_size) + " to restore") + + # retrieve backup from the backup stream (either VM, or dom0 file) + # TODO: add some safety margin in vms_size? + (retrieve_proc, filelist_pipe, error_pipe) = \ + self._start_retrieval_process(vms_dirs, limit_count, vms_size) + + to_extract = Queue() + + # extract data retrieved by retrieve_proc + extract_proc = self._start_inner_extraction_worker(to_extract) + + try: + filename = None + nextfile = None + while True: + if self.canceled: + break + if not extract_proc.is_alive(): + retrieve_proc.terminate() + retrieve_proc.wait() + expect_tar_error = True + if retrieve_proc in self.processes_to_kill_on_cancel: + self.processes_to_kill_on_cancel.remove(retrieve_proc) + # wait for other processes (if any) + for proc in self.processes_to_kill_on_cancel: + proc.wait() + break + if nextfile is not None: + filename = nextfile + else: + filename = filelist_pipe.readline().strip() + + if BACKUP_DEBUG and callable(self.print_callback): + self.print_callback("Getting new file:" + filename) + + if not filename or filename == "EOF": + break + + hmacfile = filelist_pipe.readline().strip() + + if self.canceled: + break + # if reading archive directly with tar, wait for next filename - + # tar prints filename before processing it, so wait for + # the next one to be sure that whole file was extracted + if not self.backup_vm: + nextfile = filelist_pipe.readline().strip() + + if BACKUP_DEBUG and callable(self.print_callback): + self.print_callback("Getting hmac:" + hmacfile) + if not hmacfile or hmacfile == "EOF": + # Premature end of archive, either of tar1_command or + # vmproc exited with error + break + + if not any(map(lambda x: filename.startswith(x), vms_dirs)): + if BACKUP_DEBUG and callable(self.print_callback): + self.print_callback("Ignoring VM not selected for " + "restore") + os.unlink(os.path.join(self.tmpdir, filename)) + os.unlink(os.path.join(self.tmpdir, hmacfile)) + continue + + if self._verify_hmac(filename, hmacfile): + to_extract.put(os.path.join(self.tmpdir, filename)) + + if self.canceled: + raise BackupCanceledError("Restore canceled", + tmpdir=self.tmpdir) + + if retrieve_proc.wait() != 0: + raise qubes.exc.QubesException( + "unable to read the qubes backup file {0} ({1}): {2}" + .format(self.backup_location, error_pipe.read( + MAX_STDERR_BYTES))) + # wait for other processes (if any) + for proc in self.processes_to_kill_on_cancel: + # FIXME check 'vmproc' exit code? + proc.wait() + + if filename and filename != "EOF": + raise qubes.exc.QubesException( + "Premature end of archive, the last file was %s" % filename) + except: + to_extract.put("ERROR") + extract_proc.join() + raise + else: + to_extract.put("FINISHED") + + if BACKUP_DEBUG and callable(self.print_callback): + self.print_callback("Waiting for the extraction process to " + "finish...") + extract_proc.join() + if BACKUP_DEBUG and callable(self.print_callback): + self.print_callback("Extraction process finished with code:" + + str(extract_proc.exitcode)) + if extract_proc.exitcode != 0: + raise qubes.exc.QubesException( + "unable to extract the qubes backup. " + "Check extracting process errors.") + + def generate_new_name_for_conflicting_vm(self, orig_name, restore_info): + number = 1 + if len(orig_name) > 29: + orig_name = orig_name[0:29] + new_name = orig_name + while (new_name in restore_info.keys() or + new_name in map(lambda x: x.get('rename_to', None), + restore_info.values()) or + new_name in self.app.domains): + new_name = str('{}{}'.format(orig_name, number)) + number += 1 + if number == 100: + # give up + return None + return new_name + + def restore_info_verify(self, restore_info): + for vm in restore_info.keys(): + if vm in ['dom0']: continue - if verify_hmac(os.path.join(restore_tmpdir, filename), - os.path.join(restore_tmpdir, hmacfile), - passphrase, hmac_algorithm): - to_extract.put(os.path.join(restore_tmpdir, filename)) + vm_info = restore_info[vm] - if running_backup_operation and running_backup_operation.canceled: - raise BackupCanceledError("Restore canceled", - tmpdir=restore_tmpdir) - - if command.wait() != 0 and not expect_tar_error: - raise qubes.exc.QubesException( - "unable to read the qubes backup file {0} ({1}). " - "Is it really a backup?".format(backup_source, command.wait())) - if vmproc: - if vmproc.wait() != 0: - raise qubes.exc.QubesException( - "unable to read the qubes backup {0} " - "because of a VM error: {1}".format( - backup_source, vmproc.stderr.read(MAX_STDERR_BYTES))) - - if filename and filename != "EOF": - raise qubes.exc.QubesException( - "Premature end of archive, the last file was %s" % filename) - except: - to_extract.put("ERROR") - extract_proc.join() - raise - else: - to_extract.put("FINISHED") - - if BACKUP_DEBUG and callable(print_callback): - print_callback("Waiting for the extraction process to finish...") - extract_proc.join() - if BACKUP_DEBUG and callable(print_callback): - print_callback("Extraction process finished with code:" + - str(extract_proc.exitcode)) - if extract_proc.exitcode != 0: - raise qubes.exc.QubesException( - "unable to extract the qubes backup. " - "Check extracting process errors.") - - return header_data - - -def backup_restore_set_defaults(options): - if 'use-default-netvm' not in options: - options['use-default-netvm'] = False - if 'use-none-netvm' not in options: - options['use-none-netvm'] = False - if 'use-default-template' not in options: - options['use-default-template'] = False - if 'dom0-home' not in options: - options['dom0-home'] = True - if 'replace-template' not in options: - options['replace-template'] = [] - if 'ignore-username-mismatch' not in options: - options['ignore-username-mismatch'] = False - if 'verify-only' not in options: - options['verify-only'] = False - if 'rename-conflicting' not in options: - options['rename-conflicting'] = False - - return options - - -def load_hmac(hmac): - hmac = hmac.strip().split("=") - if len(hmac) > 1: - hmac = hmac[1].strip() - else: - raise qubes.exc.QubesException("ERROR: invalid hmac file content") - - return hmac - - -def backup_detect_format_version(backup_location): - if os.path.exists(os.path.join(backup_location, 'qubes.xml')): - return 1 - else: - # this could mean also 3, but not distinguishable until backup header - # is read - return 2 - - -def backup_restore_header(source, passphrase, - print_callback=print_stdout, - error_callback=print_stderr, - encrypted=False, appvm=None, compressed=False, - format_version=None, - hmac_algorithm=DEFAULT_HMAC_ALGORITHM, - crypto_algorithm=DEFAULT_CRYPTO_ALGORITHM): - global running_backup_operation - running_backup_operation = None - - restore_tmpdir = tempfile.mkdtemp(prefix="/var/tmp/restore_") - - if format_version is None: - format_version = backup_detect_format_version(source) - - if format_version == 1: - return restore_tmpdir, os.path.join(source, 'qubes.xml'), None - - # tar2qfile matches only beginnings, while tar full path - if appvm: - extract_filter = [HEADER_FILENAME, 'qubes.xml.000'] - else: - extract_filter = [HEADER_FILENAME, HEADER_FILENAME + '.hmac', - 'qubes.xml.000', 'qubes.xml.000.hmac'] - - header_data = restore_vm_dirs(source, - restore_tmpdir, - passphrase=passphrase, - vms_dirs=extract_filter, - vms=None, - vms_size=HEADER_QUBES_XML_MAX_SIZE, - format_version=format_version, - hmac_algorithm=hmac_algorithm, - crypto_algorithm=crypto_algorithm, - print_callback=print_callback, - error_callback=error_callback, - progress_callback=None, - encrypted=encrypted, - compressed=compressed, - appvm=appvm) - - return (restore_tmpdir, os.path.join(restore_tmpdir, "qubes.xml"), - header_data) - - -def generate_new_name_for_conflicting_vm(orig_name, host_collection, - restore_info): - number = 1 - if len(orig_name) > 29: - orig_name = orig_name[0:29] - new_name = orig_name - while (new_name in restore_info.keys() or - new_name in map(lambda x: x.get('rename_to', None), - restore_info.values()) or - new_name in host_collection.domains): - new_name = str('{}{}'.format(orig_name, number)) - number += 1 - if number == 100: - # give up - return None - return new_name - -def restore_info_verify(restore_info, host_collection): - assert isinstance(host_collection, qubes.Qubes) - options = restore_info['$OPTIONS$'] - for vm in restore_info.keys(): - if vm in ['$OPTIONS$', 'dom0']: - continue - - vm_info = restore_info[vm] - - vm_info.pop('excluded', None) - if 'exclude' in options.keys(): - if vm in options['exclude']: + vm_info.pop('excluded', None) + if vm in self.options.exclude: vm_info['excluded'] = True - vm_info.pop('already-exists', None) - if not options['verify-only'] and \ - vm in host_collection.domains: - if options['rename-conflicting']: - new_name = generate_new_name_for_conflicting_vm( - vm, host_collection, restore_info - ) - if new_name is not None: - vm_info['rename-to'] = new_name + vm_info.pop('already-exists', None) + if not self.options.verify_only and \ + vm in self.app.domains: + if self.options.rename_conflicting: + new_name = self.generate_new_name_for_conflicting_vm( + vm, restore_info + ) + if new_name is not None: + vm_info['rename-to'] = new_name + else: + vm_info['already-exists'] = True else: vm_info['already-exists'] = True - else: - vm_info['already-exists'] = True - # check template - vm_info.pop('missing-template', None) - if vm_info['template']: + # check template + vm_info.pop('missing-template', None) + if vm_info['template']: + template_name = vm_info['template'] + try: + host_template = self.app.domains[template_name] + except KeyError: + host_template = None + if not host_template or not host_template.is_template(): + # Maybe the (custom) template is in the backup? + if not (template_name in restore_info.keys() and + restore_info[template_name]['vm'].is_template()): + if self.options.use_default_template: + if 'orig-template' not in vm_info.keys(): + vm_info['orig-template'] = template_name + vm_info['template'] = self.app.default_template.name + else: + vm_info['missing-template'] = True + + # check netvm + vm_info.pop('missing-netvm', None) + if vm_info['netvm']: + netvm_name = vm_info['netvm'] + + try: + netvm_on_host = self.app.domains[netvm_name] + except KeyError: + netvm_on_host = None + # No netvm on the host? + if not ((netvm_on_host is not None) and netvm_on_host.is_netvm()): + + # Maybe the (custom) netvm is in the backup? + if not (netvm_name in restore_info.keys() and + restore_info[netvm_name]['vm'].is_netvm()): + if self.options.use_default_netvm: + vm_info['netvm'] = self.app.default_netvm.name + vm_info['vm'].uses_default_netvm = True + elif self.options.use_none_netvm: + vm_info['netvm'] = None + else: + vm_info['missing-netvm'] = True + + vm_info['good-to-go'] = not any([(prop in vm_info.keys()) for + prop in ['missing-netvm', + 'missing-template', + 'already-exists', + 'excluded']]) + + # update references to renamed VMs: + for vm in restore_info.keys(): + if vm in ['dom0']: + continue + vm_info = restore_info[vm] template_name = vm_info['template'] - host_template = host_collection.domains.get(template_name, None) - if not host_template or not host_template.is_template(): - # Maybe the (custom) template is in the backup? - if not (template_name in restore_info.keys() and - restore_info[template_name]['vm'].is_template()): - if options['use-default-template']: - if 'orig-template' not in vm_info.keys(): - vm_info['orig-template'] = template_name - vm_info['template'] = host_collection \ - .default_template.name - else: - vm_info['missing-template'] = True - - # check netvm - vm_info.pop('missing-netvm', None) - if vm_info['netvm']: + if (template_name in restore_info and + restore_info[template_name]['good-to-go'] and + 'rename-to' in restore_info[template_name]): + vm_info['template'] = restore_info[template_name]['rename-to'] netvm_name = vm_info['netvm'] + if (netvm_name in restore_info and + restore_info[netvm_name]['good-to-go'] and + 'rename-to' in restore_info[netvm_name]): + vm_info['netvm'] = restore_info[netvm_name]['rename-to'] - netvm_on_host = host_collection.domains.get(netvm_name, None) + return restore_info - # No netvm on the host? - if not ((netvm_on_host is not None) and netvm_on_host.is_netvm()): - - # Maybe the (custom) netvm is in the backup? - if not (netvm_name in restore_info.keys() and - restore_info[netvm_name]['vm'].is_netvm()): - if options['use-default-netvm']: - vm_info['netvm'] = host_collection \ - .default_netvm.name - vm_info['vm'].uses_default_netvm = True - elif options['use-none-netvm']: - vm_info['netvm'] = None - else: - vm_info['missing-netvm'] = True - - vm_info['good-to-go'] = not any([(prop in vm_info.keys()) for - prop in ['missing-netvm', - 'missing-template', - 'already-exists', - 'excluded']]) - - # update references to renamed VMs: - for vm in restore_info.keys(): - if vm in ['$OPTIONS$', 'dom0']: - continue - vm_info = restore_info[vm] - template_name = vm_info['template'] - if (template_name in restore_info and - restore_info[template_name]['good-to-go'] and - 'rename-to' in restore_info[template_name]): - vm_info['template'] = restore_info[template_name]['rename-to'] - netvm_name = vm_info['netvm'] - if (netvm_name in restore_info and - restore_info[netvm_name]['good-to-go'] and - 'rename-to' in restore_info[netvm_name]): - vm_info['netvm'] = restore_info[netvm_name]['rename-to'] - - return restore_info - - -def backup_restore_prepare(backup_location, passphrase, options=None, - host_collection=None, encrypted=False, appvm=None, - compressed=False, print_callback=print_stdout, - error_callback=print_stderr, - format_version=None, - hmac_algorithm=DEFAULT_HMAC_ALGORITHM, - crypto_algorithm=DEFAULT_CRYPTO_ALGORITHM): - if options is None: - options = {} - # Defaults - backup_restore_set_defaults(options) - # Options introduced in backup format 3+, which always have a header, - # so no need for fallback in function parameter - compression_filter = DEFAULT_COMPRESSION_FILTER - - # Private functions begin - def is_vm_included_in_backup_v1(backup_dir, check_vm): + def _is_vm_included_in_backup_v1(self, check_vm): if check_vm.qid == 0: - return os.path.exists(os.path.join(backup_dir, 'dom0-home')) + return os.path.exists( + os.path.join(self.backup_location, 'dom0-home')) # DisposableVM if check_vm.dir_path is None: return False backup_vm_dir_path = check_vm.dir_path.replace( - qubes.config.system_path["qubes_base_dir"], backup_dir) + qubes.config.system_path["qubes_base_dir"], self.backup_location) if os.path.exists(backup_vm_dir_path): return True else: return False - def is_vm_included_in_backup_v2(_, check_vm): + def _is_vm_included_in_backup_v2(self, check_vm): if check_vm.backup_content: return True else: return False - def find_template_name(template, replaces): - rx_replace = re.compile("(.*):(.*)") - for r in replaces: - m = rx_replace.match(r) - if m.group(1) == template: - return m.group(2) - + def _find_template_name(self, template): + if template in self.options.replace_template: + return self.options.replace_template[template] return template - # Private functions end - - # Format versions: - # 1 - Qubes R1, Qubes R2 beta1, beta2 - # 2 - Qubes R2 beta3+ - - if format_version is None: - format_version = backup_detect_format_version(backup_location) - - if format_version == 1: - is_vm_included_in_backup = is_vm_included_in_backup_v1 - elif format_version in [2, 3]: - is_vm_included_in_backup = is_vm_included_in_backup_v2 - if not appvm: - if not os.path.isfile(backup_location): - raise qubes.exc.QubesException("Invalid backup location (not a file or " - "directory with qubes.xml)" - ": %s" % unicode(backup_location)) - else: - raise qubes.exc.QubesException( - "Unknown backup format version: %s" % str(format_version)) - - (restore_tmpdir, qubes_xml, header_data) = backup_restore_header( - backup_location, - passphrase, - encrypted=encrypted, - appvm=appvm, - compressed=compressed, - hmac_algorithm=hmac_algorithm, - crypto_algorithm=crypto_algorithm, - print_callback=print_callback, - error_callback=error_callback, - format_version=format_version) - - if header_data: - if BackupHeader.version in header_data: - format_version = header_data[BackupHeader.version] - if BackupHeader.crypto_algorithm in header_data: - crypto_algorithm = header_data[BackupHeader.crypto_algorithm] - if BackupHeader.hmac_algorithm in header_data: - hmac_algorithm = header_data[BackupHeader.hmac_algorithm] - if BackupHeader.compressed in header_data: - compressed = header_data[BackupHeader.compressed] - if BackupHeader.encrypted in header_data: - encrypted = header_data[BackupHeader.encrypted] - if BackupHeader.compression_filter in header_data: - compression_filter = header_data[BackupHeader.compression_filter] - - if BACKUP_DEBUG: - print "Loading file", qubes_xml - backup_collection = qubes.Qubes(qubes_xml) - - if host_collection is None: - host_collection = qubes.Qubes() - - backup_vms_list = [vm for vm in backup_collection.domains] - vms_to_restore = {} - - # ... and the actual data - for vm in backup_vms_list: - if vm.qid == 0: - # Handle dom0 as special case later - continue - if is_vm_included_in_backup(backup_location, vm): - if BACKUP_DEBUG: - print vm.name, "is included in backup" - - vms_to_restore[vm.name] = {} - vms_to_restore[vm.name]['vm'] = vm - - if vm.template is None: - vms_to_restore[vm.name]['template'] = None - else: - templatevm_name = find_template_name(vm.template.name, options[ - 'replace-template']) - vms_to_restore[vm.name]['template'] = templatevm_name - - if vm.netvm is None: - vms_to_restore[vm.name]['netvm'] = None - else: - netvm_name = vm.netvm.name - vms_to_restore[vm.name]['netvm'] = netvm_name - # Set to None to not confuse QubesVm object from backup - # collection with host collection (further in clone_attrs). Set - # directly _netvm to suppress setter action, especially - # modifying firewall - vm._netvm = None - - # Store restore parameters - options['location'] = backup_location - options['restore_tmpdir'] = restore_tmpdir - options['passphrase'] = passphrase - options['encrypted'] = encrypted - options['compressed'] = compressed - options['compression_filter'] = compression_filter - options['hmac_algorithm'] = hmac_algorithm - options['crypto_algorithm'] = crypto_algorithm - options['appvm'] = appvm - options['format_version'] = format_version - vms_to_restore['$OPTIONS$'] = options - - vms_to_restore = restore_info_verify(vms_to_restore, host_collection) - - # ...and dom0 home - if options['dom0-home'] and \ - is_vm_included_in_backup(backup_location, - backup_collection.domains[0]): - vm = backup_collection.domains[0] - vms_to_restore['dom0'] = {} - if format_version == 1: - vms_to_restore['dom0']['subdir'] = \ - os.listdir(os.path.join(backup_location, 'dom0-home'))[0] - vms_to_restore['dom0']['size'] = 0 # unknown + def _is_vm_included_in_backup(self, vm): + if self.header_data.version == 1: + return self._is_vm_included_in_backup_v1(vm) + elif self.header_data.version in [2, 3]: + return self._is_vm_included_in_backup_v2(vm) else: - vms_to_restore['dom0']['subdir'] = vm.backup_path - vms_to_restore['dom0']['size'] = vm.backup_size - local_user = grp.getgrnam('qubes').gr_mem[0] + raise qubes.exc.QubesException( + "Unknown backup format version: {}".format( + self.header_data.version)) - dom0_home = vms_to_restore['dom0']['subdir'] + def get_restore_info(self): + # Format versions: + # 1 - Qubes R1, Qubes R2 beta1, beta2 + # 2 - Qubes R2 beta3+ - vms_to_restore['dom0']['username'] = os.path.basename(dom0_home) - if vms_to_restore['dom0']['username'] != local_user: - vms_to_restore['dom0']['username-mismatch'] = True - if options['ignore-username-mismatch']: - vms_to_restore['dom0']['ignore-username-mismatch'] = True + vms_to_restore = {} + + for vm in self.backup_app.domains: + if vm.qid == 0: + # Handle dom0 as special case later + continue + if self._is_vm_included_in_backup(vm): + if BACKUP_DEBUG: + print vm.name, "is included in backup" + + vms_to_restore[vm.name] = {} + vms_to_restore[vm.name]['vm'] = vm + + if not hasattr(vm, 'template'): + vms_to_restore[vm.name]['template'] = None + else: + templatevm_name = self._find_template_name( + vm.template.name) + vms_to_restore[vm.name]['template'] = templatevm_name + + if vm.netvm is None: + vms_to_restore[vm.name]['netvm'] = None + else: + netvm_name = vm.netvm.name + vms_to_restore[vm.name]['netvm'] = netvm_name + # Set to None to not confuse QubesVm object from backup + # collection with host collection (further in clone_attrs). + vm.netvm = None + + vms_to_restore = self.restore_info_verify(vms_to_restore) + + # ...and dom0 home + if self.options.dom0_home and \ + self._is_vm_included_in_backup(self.backup_app.domains[0]): + vm = self.backup_app.domains[0] + vms_to_restore['dom0'] = {} + if self.header_data.version == 1: + vms_to_restore['dom0']['subdir'] = \ + os.listdir(os.path.join( + self.backup_location, 'dom0-home'))[0] + vms_to_restore['dom0']['size'] = 0 # unknown else: - vms_to_restore['dom0']['good-to-go'] = False + vms_to_restore['dom0']['subdir'] = vm.backup_path + vms_to_restore['dom0']['size'] = vm.backup_size + local_user = grp.getgrnam('qubes').gr_mem[0] - if 'good-to-go' not in vms_to_restore['dom0']: - vms_to_restore['dom0']['good-to-go'] = True + dom0_home = vms_to_restore['dom0']['subdir'] - # Not needed - all the data stored in vms_to_restore - if format_version >= 2: - os.unlink(qubes_xml) - return vms_to_restore + vms_to_restore['dom0']['username'] = os.path.basename(dom0_home) + if vms_to_restore['dom0']['username'] != local_user: + vms_to_restore['dom0']['username-mismatch'] = True + if self.options.ignore_username_mismatch: + vms_to_restore['dom0']['ignore-username-mismatch'] = True + else: + vms_to_restore['dom0']['good-to-go'] = False + if 'good-to-go' not in vms_to_restore['dom0']: + vms_to_restore['dom0']['good-to-go'] = True -def backup_restore_print_summary(restore_info, print_callback=print_stdout): - fields = { - "qid": {"func": "vm.qid"}, + return vms_to_restore - "name": {"func": "('[' if vm.is_template() else '')\ - + ('{' if vm.is_netvm() else '')\ - + vm.name \ - + (']' if vm.is_template() else '')\ - + ('}' if vm.is_netvm() else '')"}, + def get_restore_summary(self, restore_info): + fields = { + "qid": {"func": "vm.qid"}, - "type": {"func": "'Tpl' if vm.is_template() else \ - 'HVM' if vm.type == 'HVM' else \ - vm.type.replace('VM','')"}, + "name": {"func": "('[' if vm.is_template() else '')\ + + ('{' if vm.is_netvm() else '')\ + + vm.name \ + + (']' if vm.is_template() else '')\ + + ('}' if vm.is_netvm() else '')"}, - "updbl": {"func": "'Yes' if vm.updateable else ''"}, + "type": {"func": "'Tpl' if vm.is_template() else \ + 'App' if isinstance(vm, qubes.vm.appvm.AppVM) else \ + vm.__class__.__name__.replace('VM','')"}, - "template": {"func": "'n/a' if vm.is_template() or vm.template is None else\ - vm_info['template']"}, + "updbl": {"func": "'Yes' if vm.updateable else ''"}, - "netvm": {"func": "'n/a' if vm.is_netvm() and not vm.is_proxyvm() else\ - ('*' if vm.uses_default_netvm else '') +\ - vm_info['netvm'] if vm_info['netvm'] is not None else '-'"}, + "template": {"func": "'n/a' if vm.is_template() or vm.template is None else\ + vm_info['template']"}, - "label": {"func": "vm.label.name"}, - } + "netvm": {"func": "'n/a' if vm.is_netvm() and not vm.is_proxyvm() else\ + ('*' if vm.property_is_default('netvm') else '') +\ + vm_info['netvm'] if vm_info['netvm'] is not None else '-'"}, - fields_to_display = ["name", "type", "template", "updbl", "netvm", "label"] + "label": {"func": "vm.label.name"}, + } + + fields_to_display = ["name", "type", "template", "updbl", "netvm", "label"] + + # First calculate the maximum width of each field we want to display + total_width = 0 + for f in fields_to_display: + fields[f]["max_width"] = len(f) + for vm_info in restore_info.values(): + if 'vm' in vm_info.keys(): + # noinspection PyUnusedLocal + vm = vm_info['vm'] + l = len(unicode(eval(fields[f]["func"]))) + if l > fields[f]["max_width"]: + fields[f]["max_width"] = l + total_width += fields[f]["max_width"] + + summary = "" + summary += "The following VMs are included in the backup:\n" + summary += "\n" + + # Display the header + for f in fields_to_display: + fmt = "{{0:-^{0}}}-+".format(fields[f]["max_width"] + 1) + summary += fmt.format('-') + summary += "\n" + for f in fields_to_display: + fmt = "{{0:>{0}}} |".format(fields[f]["max_width"] + 1) + summary += fmt.format(f) + summary += "\n" + for f in fields_to_display: + fmt = "{{0:-^{0}}}-+".format(fields[f]["max_width"] + 1) + summary += fmt.format('-') + summary += "\n" - # First calculate the maximum width of each field we want to display - total_width = 0 - for f in fields_to_display: - fields[f]["max_width"] = len(f) for vm_info in restore_info.values(): - if 'vm' in vm_info.keys(): - # noinspection PyUnusedLocal - vm = vm_info['vm'] - l = len(unicode(eval(fields[f]["func"]))) - if l > fields[f]["max_width"]: - fields[f]["max_width"] = l - total_width += fields[f]["max_width"] + # Skip non-VM here + if 'vm' not in vm_info: + continue + # noinspection PyUnusedLocal + vm = vm_info['vm'] + s = "" + for f in fields_to_display: + fmt = "{{0:>{0}}} |".format(fields[f]["max_width"] + 1) + s += fmt.format(eval(fields[f]["func"])) - print_callback("") - print_callback("The following VMs are included in the backup:") - print_callback("") - - # Display the header - s = "" - for f in fields_to_display: - fmt = "{{0:-^{0}}}-+".format(fields[f]["max_width"] + 1) - s += fmt.format('-') - print_callback(s) - s = "" - for f in fields_to_display: - fmt = "{{0:>{0}}} |".format(fields[f]["max_width"] + 1) - s += fmt.format(f) - print_callback(s) - s = "" - for f in fields_to_display: - fmt = "{{0:-^{0}}}-+".format(fields[f]["max_width"] + 1) - s += fmt.format('-') - print_callback(s) - - for vm_info in restore_info.values(): - # Skip non-VM here - if 'vm' not in vm_info: - continue - # noinspection PyUnusedLocal - vm = vm_info['vm'] - s = "" - for f in fields_to_display: - fmt = "{{0:>{0}}} |".format(fields[f]["max_width"] + 1) - s += fmt.format(eval(fields[f]["func"])) - - if 'excluded' in vm_info and vm_info['excluded']: - s += " <-- Excluded from restore" - elif 'already-exists' in vm_info: - s += " <-- A VM with the same name already exists on the host!" - elif 'missing-template' in vm_info: - s += " <-- No matching template on the host or in the backup found!" - elif 'missing-netvm' in vm_info: - s += " <-- No matching netvm on the host or in the backup found!" - else: - if 'orig-template' in vm_info: - s += " <-- Original template was '%s'" % (vm_info['orig-template']) - if 'rename-to' in vm_info: - s += " <-- Will be renamed to '%s'" % vm_info['rename-to'] - - print_callback(s) - - if 'dom0' in restore_info.keys(): - s = "" - for f in fields_to_display: - fmt = "{{0:>{0}}} |".format(fields[f]["max_width"] + 1) - if f == "name": - s += fmt.format("Dom0") - elif f == "type": - s += fmt.format("Home") + if 'excluded' in vm_info and vm_info['excluded']: + s += " <-- Excluded from restore" + elif 'already-exists' in vm_info: + s += " <-- A VM with the same name already exists on the host!" + elif 'missing-template' in vm_info: + s += " <-- No matching template on the host or in the backup found!" + elif 'missing-netvm' in vm_info: + s += " <-- No matching netvm on the host or in the backup found!" else: - s += fmt.format("") - if 'username-mismatch' in restore_info['dom0']: - s += " <-- username in backup and dom0 mismatch" - if 'ignore-username-mismatch' in restore_info['dom0']: - s += " (ignored)" + if 'orig-template' in vm_info: + s += " <-- Original template was '%s'" % (vm_info['orig-template']) + if 'rename-to' in vm_info: + s += " <-- Will be renamed to '%s'" % vm_info['rename-to'] - print_callback(s) + summary += s + "\n" + if 'dom0' in restore_info.keys(): + s = "" + for f in fields_to_display: + fmt = "{{0:>{0}}} |".format(fields[f]["max_width"] + 1) + if f == "name": + s += fmt.format("Dom0") + elif f == "type": + s += fmt.format("Home") + else: + s += fmt.format("") + if 'username-mismatch' in restore_info['dom0']: + s += " <-- username in backup and dom0 mismatch" + if 'ignore-username-mismatch' in restore_info['dom0']: + s += " (ignored)" -def backup_restore_do(restore_info, - host_collection=None, print_callback=print_stdout, - error_callback=print_stderr, progress_callback=None, - ): - global running_backup_operation + summary += s + "\n" - # Private functions begin - def restore_vm_dir_v1(backup_dir, src_dir, dst_dir): + return summary + + def _restore_vm_dir_v1(self, src_dir, dst_dir): backup_src_dir = src_dir.replace( - qubes.config.system_path["qubes_base_dir"], backup_dir) + qubes.config.system_path["qubes_base_dir"], self.backup_location) # We prefer to use Linux's cp, because it nicely handles sparse files - cp_retcode = subprocess.call(["cp", "-rp", "--reflink=auto", backup_src_dir, dst_dir]) + cp_retcode = subprocess.call( + ["cp", "-rp", "--reflink=auto", backup_src_dir, dst_dir]) if cp_retcode != 0: raise qubes.exc.QubesException( "*** Error while copying file {0} to {1}".format(backup_src_dir, dst_dir)) - # Private functions end + def restore_do(self, restore_info): + # FIXME handle locking - options = restore_info['$OPTIONS$'] - backup_location = options['location'] - restore_tmpdir = options['restore_tmpdir'] - passphrase = options['passphrase'] - encrypted = options['encrypted'] - compressed = options['compressed'] - compression_filter = options['compression_filter'] - hmac_algorithm = options['hmac_algorithm'] - crypto_algorithm = options['crypto_algorithm'] - verify_only = options['verify-only'] - appvm = options['appvm'] - format_version = options['format_version'] - - if format_version is None: - format_version = backup_detect_format_version(backup_location) - - lock_obtained = False - if host_collection is None: - host_collection = qubes.Qubes() - # FIXME - lock_obtained = True - - # Perform VM restoration in backup order - vms_dirs = [] - vms_size = 0 - vms = {} - for vm_info in restore_info.values(): - if 'vm' not in vm_info: - continue - if not vm_info['good-to-go']: - continue - vm = vm_info['vm'] - if format_version >= 2: - vms_size += vm.backup_size - vms_dirs.append(vm.backup_path) - vms[vm.name] = vm - - running_backup_operation = BackupOperationInfo() - - if format_version >= 2: - if 'dom0' in restore_info.keys() and restore_info['dom0']['good-to-go']: - vms_dirs.append(os.path.dirname(restore_info['dom0']['subdir'])) - vms_size += restore_info['dom0']['size'] - - try: - restore_vm_dirs(backup_location, - restore_tmpdir, - passphrase=passphrase, - vms_dirs=vms_dirs, - vms=vms, - vms_size=vms_size, - format_version=format_version, - hmac_algorithm=hmac_algorithm, - crypto_algorithm=crypto_algorithm, - verify_only=verify_only, - print_callback=print_callback, - error_callback=error_callback, - progress_callback=progress_callback, - encrypted=encrypted, - compressed=compressed, - compression_filter=compression_filter, - appvm=appvm) - except qubes.exc.QubesException: - if verify_only: - raise - else: - if callable(print_callback): - print_callback( - "Some errors occurred during data extraction, " - "continuing anyway to restore at least some " - "VMs") - else: - if verify_only: - if callable(print_callback): - print_callback("WARNING: Backup verification not supported for " - "this backup format.") - - if verify_only: - shutil.rmtree(restore_tmpdir) - return - - # First load templates, then other VMs - for do_templates in (True, False): - if running_backup_operation.canceled: - break - for vm in vms.values(): - if running_backup_operation.canceled: - # only break the loop to save qubes.xml with already restored - # VMs - break - if vm.is_template != do_templates: + # Perform VM restoration in backup order + vms_dirs = [] + vms_size = 0 + vms = {} + for vm_info in restore_info.values(): + if 'vm' not in vm_info: continue - if callable(print_callback): - print_callback("-> Restoring {0}...".format(vm.name)) - retcode = subprocess.call( - ["mkdir", "-p", os.path.dirname(vm.dir_path)]) - if retcode != 0: - error_callback("*** Cannot create directory: {0}?!".format( - vm.dir_path)) - error_callback("Skipping...") + if not vm_info['good-to-go']: continue + vm = vm_info['vm'] + if self.header_data.version >= 2: + vms_size += vm.backup_size + vms_dirs.append(vm.backup_path) + vms[vm.name] = vm - kwargs = {} - if hasattr(vm, 'template'): - if vm.template is not None: - kwargs['template'] = restore_info[vm.name]['template'] + if self.header_data.version >= 2: + if 'dom0' in restore_info.keys() and \ + restore_info['dom0']['good-to-go']: + vms_dirs.append(os.path.dirname(restore_info['dom0']['subdir'])) + vms_size += restore_info['dom0']['size'] + + try: + self._restore_vm_dirs(vms_dirs=vms_dirs, vms_size=vms_size) + except qubes.exc.QubesException: + if self.options.verify_only: + raise else: - kwargs['template'] = None + if callable(self.print_callback): + self.print_callback( + "Some errors occurred during data extraction, " + "continuing anyway to restore at least some " + "VMs") + else: + if self.options.verify_only: + if callable(self.print_callback): + self.print_callback("WARNING: Backup verification not " + "supported for " + "this backup format.") - new_vm = None + if self.options.verify_only: + shutil.rmtree(self.tmpdir) + return + + # First load templates, then other VMs + for do_templates in (True, False): + if self.canceled: + break + for vm in vms.values(): + if self.canceled: + # only break the loop to save qubes.xml with already restored + # VMs + break + if vm.is_template() != do_templates: + continue + if callable(self.print_callback): + self.print_callback("-> Restoring {0}...".format(vm.name)) + retcode = subprocess.call( + ["mkdir", "-p", os.path.dirname(vm.dir_path)]) + if retcode != 0: + self.error_callback("*** Cannot create directory: {" + "0}?!".format( + vm.dir_path)) + self.error_callback("Skipping...") + continue + + kwargs = {} + if hasattr(vm, 'template'): + if vm.template is not None: + kwargs['template'] = restore_info[vm.name]['template'] + else: + kwargs['template'] = None + + new_vm = None + vm_name = vm.name + if 'rename-to' in restore_info[vm.name]: + vm_name = restore_info[vm.name]['rename-to'] + + try: + # first only minimal set, later clone_properties will be called + new_vm = self.app.add_new_vm( + vm.__class__, + name=vm_name, + label=vm.label, + installed_by_rpm=False, + **kwargs) + if os.path.exists(new_vm.dir_path): + move_to_path = tempfile.mkdtemp('', os.path.basename( + new_vm.dir_path), os.path.dirname(new_vm.dir_path)) + try: + os.rename(new_vm.dir_path, move_to_path) + self.error_callback( + "*** Directory {} already exists! It has " + "been moved to {}".format(new_vm.dir_path, + move_to_path)) + except OSError: + self.error_callback( + "*** Directory {} already exists and " + "cannot be moved!".format(new_vm.dir_path)) + self.error_callback("Skipping...") + continue + + if self.header_data.version == 1: + self._restore_vm_dir_v1(vm.dir_path, + os.path.dirname(new_vm.dir_path)) + else: + shutil.move(os.path.join(self.tmpdir, vm.backup_path), + new_vm.dir_path) + + new_vm.verify_files() + except Exception as err: + self.error_callback("ERROR: {0}".format(err)) + self.error_callback("*** Skipping VM: {0}".format(vm.name)) + if new_vm: + del self.app.domains[new_vm.qid] + continue + + if hasattr(vm, 'kernel'): + # TODO: add a setting for this? + if not vm.property_is_default('kernel') and \ + vm.kernel not in \ + os.listdir(qubes.config.system_path[ + 'qubes_kernels_base_dir']): + if callable(self.print_callback): + self.print_callback("WARNING: Kernel %s not " + "installed, " + "using default one" % vm.kernel) + vm.kernel = qubes.property.DEFAULT + try: + new_vm.clone_properties(vm) + except Exception as err: + self.error_callback("ERROR: {0}".format(err)) + self.error_callback("*** Some VM property will not be " + "restored") + + try: + new_vm.fire_event('domain-restore') + except Exception as err: + self.error_callback("ERROR during appmenu restore: {" + "0}".format(err)) + self.error_callback( + "*** VM '{0}' will not have appmenus".format(vm.name)) + + # Set network dependencies - only non-default netvm setting + for vm in vms.values(): vm_name = vm.name if 'rename-to' in restore_info[vm.name]: vm_name = restore_info[vm.name]['rename-to'] - try: - # first only minimal set, later clone_properties will be called - new_vm = host_collection.add_new_vm( - vm.__class__, - name=vm_name, - label=vm.label, - installed_by_rpm=False, - **kwargs) - if os.path.exists(new_vm.dir_path): - move_to_path = tempfile.mkdtemp('', os.path.basename( - new_vm.dir_path), os.path.dirname(new_vm.dir_path)) - try: - os.rename(new_vm.dir_path, move_to_path) - error_callback( - "*** Directory {} already exists! It has " - "been moved to {}".format(new_vm.dir_path, - move_to_path)) - except OSError: - error_callback( - "*** Directory {} already exists and " - "cannot be moved!".format(new_vm.dir_path)) - error_callback("Skipping...") - continue - - if format_version == 1: - restore_vm_dir_v1(backup_location, - vm.dir_path, - os.path.dirname(new_vm.dir_path)) - elif format_version >= 2: - shutil.move(os.path.join(restore_tmpdir, vm.backup_path), - new_vm.dir_path) - - new_vm.verify_files() - except Exception as err: - error_callback("ERROR: {0}".format(err)) - error_callback("*** Skipping VM: {0}".format(vm.name)) - if new_vm: - del host_collection.domains[new_vm.qid] + host_vm = self.app.domains[vm_name] + except KeyError: + # Failed/skipped VM continue - if hasattr(vm, 'kernel'): - # TODO: add a setting for this? - if not vm.is_property_default('kernel') and \ - vm.kernel not in \ - os.listdir(qubes.config.system_path[ - 'qubes_kernels_base_dir']): - if callable(print_callback): - print_callback("WARNING: Kernel %s not installed, " - "using default one" % vm.kernel) - vm.kernel = qubes.property.DEFAULT - try: - new_vm.clone_attrs(vm) - except Exception as err: - error_callback("ERROR: {0}".format(err)) - error_callback("*** Some VM property will not be restored") + if not vm.property_is_default('netvm'): + if restore_info[vm.name]['netvm'] is not None: + host_vm.netvm = restore_info[vm.name]['netvm'] + else: + host_vm.netvm = None - try: - new_vm.appmenus_create() - except Exception as err: - error_callback("ERROR during appmenu restore: {0}".format(err)) - error_callback( - "*** VM '{0}' will not have appmenus".format(vm.name)) + self.app.save() - # Set network dependencies - only non-default netvm setting - for vm in vms.values(): - vm_name = vm.name - if 'rename-to' in restore_info[vm.name]: - vm_name = restore_info[vm.name]['rename-to'] - try: - host_vm = host_collection.domains[vm_name] - except KeyError: - # Failed/skipped VM - continue - - if not vm.is_property_default('netvm'): - if restore_info[vm.name]['netvm'] is not None: - host_vm.netvm = restore_info[vm.name]['netvm'] + if self.canceled: + if self.header_data.version >= 2: + raise BackupCanceledError("Restore canceled", + tmpdir=self.tmpdir) else: - host_vm.netvm = None + raise BackupCanceledError("Restore canceled") - host_collection.save() + # ... and dom0 home as last step + if 'dom0' in restore_info.keys() and restore_info['dom0']['good-to-go']: + backup_path = restore_info['dom0']['subdir'] + local_user = grp.getgrnam('qubes').gr_mem[0] + home_dir = pwd.getpwnam(local_user).pw_dir + if self.header_data.version == 1: + backup_dom0_home_dir = os.path.join(self.backup_location, + backup_path) + else: + backup_dom0_home_dir = os.path.join(self.tmpdir, backup_path) + restore_home_backupdir = "home-pre-restore-{0}".format( + time.strftime("%Y-%m-%d-%H%M%S")) - if running_backup_operation.canceled: - if format_version >= 2: - raise BackupCanceledError("Restore canceled", - tmpdir=restore_tmpdir) - else: - raise BackupCanceledError("Restore canceled") + if callable(self.print_callback): + self.print_callback( + "-> Restoring home of user '{0}'...".format(local_user)) + self.print_callback( + "--> Existing files/dirs backed up in '{0}' dir".format( + restore_home_backupdir)) + os.mkdir(home_dir + '/' + restore_home_backupdir) + for f in os.listdir(backup_dom0_home_dir): + home_file = home_dir + '/' + f + if os.path.exists(home_file): + os.rename(home_file, + home_dir + '/' + restore_home_backupdir + '/' + f) + if self.header_data.version == 1: + subprocess.call( + ["cp", "-nrp", "--reflink=auto", backup_dom0_home_dir + '/' + f, home_file]) + elif self.header_data.version >= 2: + shutil.move(backup_dom0_home_dir + '/' + f, home_file) + retcode = subprocess.call(['sudo', 'chown', '-R', local_user, home_dir]) + if retcode != 0: + self.error_callback("*** Error while setting home directory " + "owner") - # ... and dom0 home as last step - if 'dom0' in restore_info.keys() and restore_info['dom0']['good-to-go']: - backup_path = restore_info['dom0']['subdir'] - local_user = grp.getgrnam('qubes').gr_mem[0] - home_dir = pwd.getpwnam(local_user).pw_dir - if format_version == 1: - backup_dom0_home_dir = os.path.join(backup_location, backup_path) - else: - backup_dom0_home_dir = os.path.join(restore_tmpdir, backup_path) - restore_home_backupdir = "home-pre-restore-{0}".format( - time.strftime("%Y-%m-%d-%H%M%S")) - - if callable(print_callback): - print_callback( - "-> Restoring home of user '{0}'...".format(local_user)) - print_callback( - "--> Existing files/dirs backed up in '{0}' dir".format( - restore_home_backupdir)) - os.mkdir(home_dir + '/' + restore_home_backupdir) - for f in os.listdir(backup_dom0_home_dir): - home_file = home_dir + '/' + f - if os.path.exists(home_file): - os.rename(home_file, - home_dir + '/' + restore_home_backupdir + '/' + f) - if format_version == 1: - subprocess.call( - ["cp", "-nrp", "--reflink=auto", backup_dom0_home_dir + '/' + f, home_file]) - elif format_version >= 2: - shutil.move(backup_dom0_home_dir + '/' + f, home_file) - retcode = subprocess.call(['sudo', 'chown', '-R', local_user, home_dir]) - if retcode != 0: - error_callback("*** Error while setting home directory owner") - - shutil.rmtree(restore_tmpdir) + shutil.rmtree(self.tmpdir) # vim:sw=4:et: diff --git a/qubes/tests/__init__.py b/qubes/tests/__init__.py index 3c13f701..53b5500e 100644 --- a/qubes/tests/__init__.py +++ b/qubes/tests/__init__.py @@ -717,25 +717,22 @@ class BackupTestsMixin(SystemTestsMixin): return vms - def make_backup(self, vms, prepare_kwargs=dict(), do_kwargs=dict(), - target=None, expect_failure=False): + def make_backup(self, vms, target=None, expect_failure=False, **kwargs): if target is None: target = self.backupdir try: - files_to_backup = \ - qubes.backup.backup_prepare(self.app, vms, - print_callback=self.print_callback, - **prepare_kwargs) + backup = qubes.backup.Backup(self.app, vms, **kwargs) except qubes.exc.QubesException as e: if not expect_failure: self.fail("QubesException during backup_prepare: %s" % str(e)) else: raise + backup.passphrase = 'qubes' + backup.target_dir = target + try: - qubes.backup.backup_do(self.app, target, files_to_backup, "qubes", - progress_callback=self.print_progress, - **do_kwargs) + backup.backup_do() except qubes.exc.QubesException as e: if not expect_failure: self.fail("QubesException during backup_do: %s" % str(e)) @@ -754,22 +751,17 @@ class BackupTestsMixin(SystemTestsMixin): backupfile = source with self.assertNotRaises(qubes.exc.QubesException): - backup_info = qubes.backup.backup_restore_prepare( - backupfile, "qubes", - host_collection=self.app, - print_callback=self.print_callback, - appvm=appvm, - options=options or {}) - + restore_op = qubes.backup.BackupRestore( + self.app, backupfile, appvm, "qubes") + if options: + for key, value in options.iteritems(): + setattr(restore_op.options, key, value) + restore_info = restore_op.get_restore_info() if self.verbose: - qubes.backup.backup_restore_print_summary(backup_info) + print restore_op.get_restore_summary(restore_info) with self.assertNotRaises(qubes.exc.QubesException): - qubes.backup.backup_restore_do( - backup_info, - host_collection=self.app, - print_callback=self.print_callback if self.verbose else None, - error_callback=self.error_callback) + restore_op.restore_do(restore_info) # maybe someone forgot to call .save() self.reload_db() diff --git a/qubes/tests/int/backup.py b/qubes/tests/int/backup.py index d47492b4..2acb2754 100644 --- a/qubes/tests/int/backup.py +++ b/qubes/tests/int/backup.py @@ -45,7 +45,7 @@ class TC_00_Backup(qubes.tests.BackupTestsMixin, qubes.tests.QubesTestCase): def test_001_compressed_backup(self): vms = self.create_backup_vms() - self.make_backup(vms, do_kwargs={'compressed': True}) + self.make_backup(vms, compressed=True) self.remove_vms(vms) self.restore_backup() for vm in vms: @@ -53,7 +53,7 @@ class TC_00_Backup(qubes.tests.BackupTestsMixin, qubes.tests.QubesTestCase): def test_002_encrypted_backup(self): vms = self.create_backup_vms() - self.make_backup(vms, do_kwargs={'encrypted': True}) + self.make_backup(vms, encrypted=True) self.remove_vms(vms) self.restore_backup() for vm in vms: @@ -61,10 +61,7 @@ class TC_00_Backup(qubes.tests.BackupTestsMixin, qubes.tests.QubesTestCase): def test_003_compressed_encrypted_backup(self): vms = self.create_backup_vms() - self.make_backup(vms, - do_kwargs={ - 'compressed': True, - 'encrypted': True}) + self.make_backup(vms, compressed=True, encrypted=True) self.remove_vms(vms) self.restore_backup() for vm in vms: @@ -96,7 +93,7 @@ class TC_00_Backup(qubes.tests.BackupTestsMixin, qubes.tests.QubesTestCase): def test_005_compressed_custom(self): vms = self.create_backup_vms() - self.make_backup(vms, do_kwargs={'compressed': "bzip2"}) + self.make_backup(vms, compressed="bzip2") self.remove_vms(vms) self.restore_backup() for vm in vms: @@ -135,16 +132,16 @@ class TC_00_Backup(qubes.tests.BackupTestsMixin, qubes.tests.QubesTestCase): vms = self.create_backup_vms() self.make_backup(vms) self.restore_backup(options={ - 'rename-conflicting': True + 'rename_conflicting': True }) for vm in vms: - with self.assertNotRaises(qubes.exc.QubesVMNotFoundError): + with self.assertNotRaises( + (qubes.exc.QubesVMNotFoundError, KeyError)): restored_vm = self.app.domains[vm.name + '1'] if vm.netvm and not vm.property_is_default('netvm'): self.assertEqual(restored_vm.netvm.name, vm.netvm.name + '1') - class TC_10_BackupVMMixin(qubes.tests.BackupTestsMixin): def setUp(self): super(TC_10_BackupVMMixin, self).setUp() @@ -160,12 +157,9 @@ class TC_10_BackupVMMixin(qubes.tests.BackupTestsMixin): vms = self.create_backup_vms() self.backupvm.start() self.backupvm.run("mkdir '/var/tmp/backup directory'", wait=True) - self.make_backup(vms, - do_kwargs={ - 'appvm': self.backupvm, - 'compressed': True, - 'encrypted': True}, - target='/var/tmp/backup directory') + self.make_backup(vms, target_vm=self.backupvm, + compressed=True, encrypted=True, + target='/var/tmp/backup directory') self.remove_vms(vms) p = self.backupvm.run("ls /var/tmp/backup*/qubes-backup*", passio_popen=True) @@ -177,12 +171,9 @@ class TC_10_BackupVMMixin(qubes.tests.BackupTestsMixin): def test_110_send_to_vm_command(self): vms = self.create_backup_vms() self.backupvm.start() - self.make_backup(vms, - do_kwargs={ - 'appvm': self.backupvm, - 'compressed': True, - 'encrypted': True}, - target='dd of=/var/tmp/backup-test') + self.make_backup(vms, target_vm=self.backupvm, + compressed=True, encrypted=True, + target='dd of=/var/tmp/backup-test') self.remove_vms(vms) self.restore_backup(source='dd if=/var/tmp/backup-test', appvm=self.backupvm) @@ -205,13 +196,10 @@ class TC_10_BackupVMMixin(qubes.tests.BackupTestsMixin): if retcode != 0: raise RuntimeError("Failed to prepare backup directory") with self.assertRaises(qubes.exc.QubesException): - self.make_backup(vms, - do_kwargs={ - 'appvm': self.backupvm, - 'compressed': False, - 'encrypted': True}, - target='/home/user/backup', - expect_failure=True) + self.make_backup(vms, target_vm=self.backupvm, + compressed=False, encrypted=True, + target='/home/user/backup', + expect_failure=True) def load_tests(loader, tests, pattern):