123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349 |
- import collections
- import glob
- import json
- import logging
- import os
- import shutil
- import subprocess
- import borgmatic.borg.pattern
- import borgmatic.config.paths
- import borgmatic.execute
- import borgmatic.hooks.command
- import borgmatic.hooks.data_source.snapshot
# Module-level logger, named after this module so that log output can be filtered per hook.
logger = logging.getLogger(__name__)
def use_streaming(hook_config, config):  # pragma: no cover
    '''
    Given a Btrfs configuration dict and a configuration dict, report whether this hook streams its
    dumps to Borg. Both arguments are ignored and the answer is always False.
    '''
    return False
def get_subvolume_mount_points(findmnt_command):
    '''
    Given a findmnt command to run (as a single space-separated string), get all Btrfs subvolume
    mount points and return them as a sorted tuple of paths.

    Raise ValueError if the command's output isn't valid JSON or if it's missing the expected
    "filesystems" or "target" keys. The underlying parsing error is chained as the cause of the
    ValueError so it remains visible in tracebacks.
    '''
    findmnt_output = borgmatic.execute.execute_command_and_capture_output(
        tuple(findmnt_command.split(' '))
        + (
            '-t',  # Filesystem type.
            'btrfs',
            '--json',
            '--list',  # Request a flat list instead of a nested subvolume hierarchy.
        )
    )

    try:
        return tuple(
            sorted(filesystem['target'] for filesystem in json.loads(findmnt_output)['filesystems'])
        )
    except json.JSONDecodeError as error:
        # Chain explicitly so the original decode error is recorded as the direct cause.
        raise ValueError(f'Invalid {findmnt_command} JSON output: {error}') from error
    except KeyError as error:
        raise ValueError(f'Invalid {findmnt_command} output: Missing key "{error}"') from error
# A Btrfs subvolume, identified by its mount point path, along with the configured patterns found
# inside it. The contained patterns default to an empty tuple.
Subvolume = collections.namedtuple(
    'Subvolume',
    ['path', 'contained_patterns'],
    defaults=[()],
)
def get_subvolumes(btrfs_command, findmnt_command, patterns=None):
    '''
    Given a Btrfs command to run, a findmnt command to run, and a sequence of configured patterns,
    work out which Btrfs subvolume mount points should be snapshotted by intersecting the current
    mount points with the paths of the given patterns.

    A subvolume is only included if it contains at least one root pattern that was sourced from
    borgmatic configuration (as opposed to generated elsewhere in borgmatic). If patterns is None,
    every subvolume is included instead.

    Return a tuple of Subvolume instances sorted by path, each carrying the patterns it contains.
    The Btrfs command is accepted for interface symmetry but isn't used here.
    '''
    include_everything = patterns is None
    unclaimed_patterns = set(patterns or ())
    matched_subvolumes = []

    # Visit mount points from last to first in sorted order so that longer (child) mount points get
    # first pick of the candidate patterns before their parents do. Patterns are consumed as they
    # are matched, so no two subvolumes end up with the same contained patterns.
    for mount_point in reversed(get_subvolume_mount_points(findmnt_command)):
        claimed_patterns = borgmatic.hooks.data_source.snapshot.get_contained_patterns(
            mount_point, unclaimed_patterns
        )

        if include_everything or any(
            pattern.type == borgmatic.borg.pattern.Pattern_type.ROOT
            and pattern.source == borgmatic.borg.pattern.Pattern_source.CONFIG
            for pattern in claimed_patterns
        ):
            matched_subvolumes.append(Subvolume(mount_point, claimed_patterns))

    matched_subvolumes.sort(key=lambda subvolume: subvolume.path)

    return tuple(matched_subvolumes)
# Name prefix of the per-process directory that holds a subvolume's snapshot. The current process
# ID gets appended to it.
BORGMATIC_SNAPSHOT_PREFIX = '.borgmatic-snapshot-'


def make_snapshot_path(subvolume_path):
    '''
    Given the path to a subvolume, build and return the path at which its snapshot should live: a
    process-specific snapshot directory inside the subvolume, followed by the subvolume path itself
    (minus any trailing path separators).
    '''
    snapshot_directory = os.path.join(subvolume_path, f'{BORGMATIC_SNAPSHOT_PREFIX}{os.getpid()}')

    # Repeat the subvolume path after the snapshot directory so that the snapshot ends up in the
    # Borg archive at the "original" subvolume path.
    original_path_suffix = subvolume_path.rstrip(os.path.sep)

    return snapshot_directory + original_path_suffix
def make_snapshot_exclude_pattern(subvolume_path):  # pragma: no cover
    '''
    Given the path to a subvolume, return a no-recurse fnmatch Pattern (marked as hook-sourced) for
    the snapshot directory that shows up embedded inside the subvolume's own snapshot.

    This works around a Btrfs quirk: When a snapshot is created as a child directory of the
    subvolume it snapshots, the snapshot's own initial directory component appears as an empty
    directory within the snapshot. For example, snapshotting a subvolume at /mnt into:

        /mnt/.borgmatic-snapshot-1234/mnt

    ... leaves an empty directory inside the snapshot at:

        /mnt/.borgmatic-snapshot-1234/mnt/.borgmatic-snapshot-1234

    The returned pattern targets that path so it can be kept out of the Borg archive.
    '''
    process_snapshot_directory = f'{BORGMATIC_SNAPSHOT_PREFIX}{os.getpid()}'
    embedded_directory_path = os.path.join(
        subvolume_path,
        process_snapshot_directory,
        subvolume_path.lstrip(os.path.sep),
        process_snapshot_directory,
    )

    return borgmatic.borg.pattern.Pattern(
        embedded_directory_path,
        borgmatic.borg.pattern.Pattern_type.NO_RECURSE,
        borgmatic.borg.pattern.Pattern_style.FNMATCH,
        source=borgmatic.borg.pattern.Pattern_source.HOOK,
    )
def make_borg_snapshot_pattern(subvolume_path, pattern):
    '''
    Given the path to a subvolume and a borgmatic.borg.pattern.Pattern instance whose path lies
    inside that subvolume, return a new hook-sourced Pattern with the same type, style, and device
    but with its path rewritten to point into the subvolume's snapshot directory, suitable for
    handing to Borg.

    If the pattern is a regular expression that starts with a caret, the caret is moved to the
    very front of the rewritten path so the regular expression stays anchored.
    '''
    is_anchored_regex = (
        pattern.style == borgmatic.borg.pattern.Pattern_style.REGULAR_EXPRESSION
        and pattern.path.startswith('^')
    )
    caret_prefix = '^' if is_anchored_regex else ''

    # Strip any leading carets and path separators so the original path can be joined underneath
    # the snapshot directory, where it ends up in the Borg archive at its "original" path.
    path_within_snapshot = pattern.path.lstrip('^').lstrip(os.path.sep)
    snapshot_root = os.path.join(subvolume_path, f'{BORGMATIC_SNAPSHOT_PREFIX}{os.getpid()}')

    snapshot_pattern_path = caret_prefix + os.path.join(
        snapshot_root,
        '.',  # Borg 1.4+ "slashdot" hack.
        path_within_snapshot,
    )

    return borgmatic.borg.pattern.Pattern(
        snapshot_pattern_path,
        pattern.type,
        pattern.style,
        pattern.device,
        source=borgmatic.borg.pattern.Pattern_source.HOOK,
    )
def snapshot_subvolume(btrfs_command, subvolume_path, snapshot_path):  # pragma: no cover
    '''
    Given a Btrfs command to run (as a single space-separated string), the path to a subvolume, and
    the destination path for a snapshot, create a read-only Btrfs snapshot of the subvolume at that
    destination. The snapshot's parent directory is created first (with mode 0o700) if needed.
    '''
    snapshot_parent_directory = os.path.dirname(snapshot_path)
    os.makedirs(snapshot_parent_directory, mode=0o700, exist_ok=True)

    snapshot_command = (
        *btrfs_command.split(' '),
        'subvolume',
        'snapshot',
        '-r',  # Read-only.
        subvolume_path,
        snapshot_path,
    )

    borgmatic.execute.execute_command(snapshot_command, output_log_level=logging.DEBUG)
def dump_data_sources(
    hook_config,
    config,
    config_paths,
    borgmatic_runtime_directory,
    patterns,
    dry_run,
):
    '''
    Given a Btrfs configuration dict, a configuration dict, the borgmatic configuration file paths,
    the borgmatic runtime directory, the configured patterns, and whether this is a dry run,
    auto-detect and snapshot any Btrfs subvolume mount points listed in the given patterns. Also
    update those patterns in place, replacing subvolume mount points with corresponding snapshot
    directories so they get stored in the Borg archive instead, and appending one exclude pattern
    per snapshotted subvolume.

    The configuration file paths and the runtime directory are accepted but not used by this hook.

    Return an empty sequence, since there are no ongoing dump processes from this hook.

    If this is a dry run, then don't actually snapshot anything and leave the patterns untouched.
    '''
    # Run the whole operation wrapped in any configured before/after command hooks.
    with borgmatic.hooks.command.Before_after_hooks(
        command_hooks=config.get('commands'),
        before_after='dump_data_sources',
        umask=config.get('umask'),
        dry_run=dry_run,
        hook_name='btrfs',
    ):
        dry_run_label = ' (dry run; not actually snapshotting anything)' if dry_run else ''
        logger.info(f'Snapshotting Btrfs subvolumes{dry_run_label}')

        # Based on the configured patterns, determine Btrfs subvolumes to backup. Only consider those
        # patterns that came from actual user configuration (as opposed to, say, other hooks).
        btrfs_command = hook_config.get('btrfs_command', 'btrfs')
        findmnt_command = hook_config.get('findmnt_command', 'findmnt')
        subvolumes = get_subvolumes(btrfs_command, findmnt_command, patterns)

        # Finding nothing is only worth a warning; the loop below is then simply a no-op.
        if not subvolumes:
            logger.warning(f'No Btrfs subvolumes found to snapshot{dry_run_label}')

        # Snapshot each subvolume, rewriting patterns to use their snapshot paths.
        for subvolume in subvolumes:
            logger.debug(f'Creating Btrfs snapshot for {subvolume.path} subvolume')

            snapshot_path = make_snapshot_path(subvolume.path)

            # On a dry run, stop after logging: no snapshot is made and no patterns are rewritten.
            if dry_run:
                continue

            snapshot_subvolume(btrfs_command, subvolume.path, snapshot_path)

            for pattern in subvolume.contained_patterns:
                snapshot_pattern = make_borg_snapshot_pattern(subvolume.path, pattern)

                # Attempt to update the pattern in place, since pattern order matters to Borg.
                try:
                    patterns[patterns.index(pattern)] = snapshot_pattern
                except ValueError:
                    # The original pattern isn't in the list, so add the rewritten one at the end.
                    patterns.append(snapshot_pattern)

            # Exclude the empty snapshot directory that shows up embedded within the snapshot.
            patterns.append(make_snapshot_exclude_pattern(subvolume.path))

        return []
def delete_snapshot(btrfs_command, snapshot_path):  # pragma: no cover
    '''
    Given a Btrfs command to run (as a single space-separated string) and the path of a snapshot,
    delete that snapshot by running the command's "subvolume delete" action on it.
    '''
    delete_command = (
        *btrfs_command.split(' '),
        'subvolume',
        'delete',
        snapshot_path,
    )

    borgmatic.execute.execute_command(delete_command, output_log_level=logging.DEBUG)
def remove_data_source_dumps(hook_config, config, borgmatic_runtime_directory, dry_run):
    '''
    Given a Btrfs configuration dict, a configuration dict, the borgmatic runtime directory, and
    whether this is a dry run, delete any Btrfs snapshots created by borgmatic. If this is a dry run
    or Btrfs isn't configured in borgmatic's configuration, then don't actually remove anything.

    The configuration dict and the runtime directory are accepted but not used here.

    This is best-effort cleanup: If the findmnt or Btrfs command can't be found or exits with an
    error, log that at debug level and return without raising, leaving any remaining snapshots in
    place.
    '''
    # A hook configuration of None means Btrfs isn't configured, so there's nothing to clean up.
    if hook_config is None:
        return

    dry_run_label = ' (dry run; not actually removing anything)' if dry_run else ''

    btrfs_command = hook_config.get('btrfs_command', 'btrfs')
    findmnt_command = hook_config.get('findmnt_command', 'findmnt')

    # Omitting patterns here requests all subvolumes rather than just those matching patterns.
    try:
        all_subvolumes = get_subvolumes(btrfs_command, findmnt_command)
    except FileNotFoundError as error:
        logger.debug(f'Could not find "{error.filename}" command')
        return
    except subprocess.CalledProcessError as error:
        logger.debug(error)
        return

    # Reversing the sorted subvolumes ensures that we remove longer mount point paths of child
    # subvolumes before the shorter mount point paths of parent subvolumes.
    for subvolume in reversed(all_subvolumes):
        # NOTE(review): presumably this swaps the process-specific snapshot directory for a glob so
        # that snapshots left behind by other borgmatic processes match too; confirm against
        # borgmatic.config.paths.
        subvolume_snapshots_glob = borgmatic.config.paths.replace_temporary_subdirectory_with_glob(
            os.path.normpath(make_snapshot_path(subvolume.path)),
            temporary_directory_prefix=BORGMATIC_SNAPSHOT_PREFIX,
        )

        logger.debug(
            f'Looking for snapshots to remove in {subvolume_snapshots_glob}{dry_run_label}'
        )

        for snapshot_path in glob.glob(subvolume_snapshots_glob):
            # Skip glob matches that aren't directories.
            if not os.path.isdir(snapshot_path):
                continue

            logger.debug(f'Deleting Btrfs snapshot {snapshot_path}{dry_run_label}')

            if dry_run:
                continue

            # A failure here abandons the rest of the cleanup rather than raising.
            try:
                delete_snapshot(btrfs_command, snapshot_path)
            except FileNotFoundError:
                logger.debug(f'Could not find "{btrfs_command}" command')
                return
            except subprocess.CalledProcessError as error:
                logger.debug(error)
                return

            # Remove the snapshot parent directory if it still exists. (It might not exist if the
            # snapshot was for "/".)
            # Splitting on the last occurrence of the subvolume path strips the trailing copy of it
            # from the snapshot path, leaving the snapshot directory that contained the snapshot.
            snapshot_parent_dir = snapshot_path.rsplit(subvolume.path, 1)[0]

            if os.path.isdir(snapshot_parent_dir):
                shutil.rmtree(snapshot_parent_dir)
def make_data_source_dump_patterns(
    hook_config, config, borgmatic_runtime_directory, name=None
):  # pragma: no cover
    '''
    Given a Btrfs configuration dict, a configuration dict, the borgmatic runtime directory, and an
    optional data source name, return an empty tuple of dump patterns. Restores aren't implemented
    for this hook, because stored files can be extracted directly with "extract".
    '''
    return ()
def restore_data_source_dump(
    hook_config,
    config,
    data_source,
    dry_run,
    extract_process,
    connection_params,
    borgmatic_runtime_directory,
):  # pragma: no cover
    '''
    Always raise NotImplementedError, regardless of the arguments given. Restores aren't
    implemented for this hook, because stored files can be extracted directly with "extract".
    '''
    raise NotImplementedError()
|