
When creating patterns for a "borg extract" during a restore, match directory-format dumps too. Also make dump restore ordering deterministic (#1208).

Dan Helfman 3 days ago
Parent
Commit
00e2284662
3 changed files with 57 additions and 41 deletions
  1. NEWS (+2 -2)
  2. borgmatic/actions/restore.py (+32 -34)
  3. borgmatic/hooks/data_source/dump.py (+23 -5)

+ 2 - 2
NEWS

@@ -1,6 +1,6 @@
 2.0.14.dev0
- * #1208: Fix for the database "restore" action restoring more databases than the "--database" flag
-   specifies.
+ * #1208: Fix for the "restore" action incorrectly extracting more database dumps than the
+   "--database" flag specifies.
  * #1212: Fix an error when restoring multiple directory-format database dumps at once.
 
 2.0.13

+ 32 - 34
borgmatic/actions/restore.py

@@ -273,7 +273,7 @@ def collect_dumps_from_archive(
     borgmatic runtime directory, query the archive for the names of data source dumps it contains
     and return them as a tuple of Dump instances.
     '''
-    dumps_from_archive = set()
+    dumps_from_archive = {}  # Use a dict as an ordered set.
 
     # There is (at most) one dump metadata file per data source hook. Load each.
     for dumps_metadata_path in borgmatic.borg.list.capture_archive_listing(
@@ -302,33 +302,30 @@ def collect_dumps_from_archive(
         if not dumps_metadata_path:
             continue
 
-        dumps_from_archive.update(
-            set(
-                borgmatic.hooks.data_source.dump.parse_data_source_dumps_metadata(
-                    borgmatic.borg.extract.extract_archive(
-                        global_arguments.dry_run,
-                        repository,
-                        archive,
-                        [dumps_metadata_path],
-                        config,
-                        local_borg_version,
-                        global_arguments,
-                        local_path=local_path,
-                        remote_path=remote_path,
-                        extract_to_stdout=True,
-                    )
-                    .stdout.read()
-                    .decode(),
-                    dumps_metadata_path,
-                )
+        for dump in borgmatic.hooks.data_source.dump.parse_data_source_dumps_metadata(
+            borgmatic.borg.extract.extract_archive(
+                global_arguments.dry_run,
+                repository,
+                archive,
+                [dumps_metadata_path],
+                config,
+                local_borg_version,
+                global_arguments,
+                local_path=local_path,
+                remote_path=remote_path,
+                extract_to_stdout=True,
             )
-        )
+            .stdout.read()
+            .decode(),
+            dumps_metadata_path,
+        ):
+            dumps_from_archive[dump] = None
 
     # If we've successfully loaded any dumps metadata, we're done.
     if dumps_from_archive:
         logger.debug('Collecting database dumps from archive data source dumps metadata files')
 
-        return dumps_from_archive
+        return tuple(dumps_from_archive.keys())
 
     # No dumps metadata files were found, so for backwards compatibility, fall back to parsing the
     # paths of dumps found in the archive to get their respective dump metadata.
@@ -392,11 +389,11 @@ def collect_dumps_from_archive(
             except (ValueError, TypeError):
                 port = None
 
-            dumps_from_archive.add(
+            dumps_from_archive[
                 Dump(
                     hook_name, data_source_name, None if hostname == 'localhost' else hostname, port
                 )
-            )
+            ] = None
 
             # We've successfully parsed the dump path, so no need to probe any further.
             break
@@ -405,13 +402,13 @@ def collect_dumps_from_archive(
                 f'Ignoring invalid data source dump path "{dump_path}" in archive {archive}',
             )
 
-    return dumps_from_archive
+    return tuple(dumps_from_archive.keys())
 
 
 def get_dumps_to_restore(restore_arguments, dumps_from_archive):
     '''
     Given restore arguments as an argparse.Namespace instance indicating which dumps to restore and
-    a set of Dump instances representing the dumps found in an archive, return a set of specific
+    a tuple of Dump instances representing the dumps found in an archive, return a tuple of specific
     Dump instances from the archive to restore. As part of this, replace any Dump having a data
     source name of "all" with multiple named Dump instances as appropriate.
 
@@ -456,11 +453,12 @@ def get_dumps_to_restore(restore_arguments, dumps_from_archive):
         }
     )
     missing_dumps = set()
-    dumps_to_restore = set()
+    dumps_to_restore = {}  # Use a dict as an ordered set.
 
     # If there's a requested "all" dump, add every dump from the archive to the dumps to restore.
     if any(dump for dump in requested_dumps if dump.data_source_name == 'all'):
-        dumps_to_restore.update(dumps_from_archive)
+        for dump in dumps_from_archive:
+            dumps_to_restore[dump] = None
 
     # If any archive dump matches a requested dump, add the archive dump to the dumps to restore.
     for requested_dump in requested_dumps:
@@ -476,7 +474,7 @@ def get_dumps_to_restore(restore_arguments, dumps_from_archive):
         if len(matching_dumps) == 0:
             missing_dumps.add(requested_dump)
         elif len(matching_dumps) == 1:
-            dumps_to_restore.add(matching_dumps[0])
+            dumps_to_restore[matching_dumps[0]] = None
         else:
             raise ValueError(
                 f'Cannot restore data source {render_dump_metadata(requested_dump)} because there are multiple matching dumps in the archive. Try adding flags to disambiguate.',
@@ -491,20 +489,20 @@ def get_dumps_to_restore(restore_arguments, dumps_from_archive):
             f"Cannot restore data source dump{'s' if len(missing_dumps) > 1 else ''} {rendered_dumps} missing from archive",
         )
 
-    return dumps_to_restore
+    return tuple(dumps_to_restore.keys())
 
 
 def ensure_requested_dumps_restored(dumps_to_restore, dumps_actually_restored):
     '''
-    Given a set of requested dumps to restore and a set of dumps actually restored, raise ValueError
-    if any requested dumps to restore weren't restored, indicating that they were missing from the
-    configuration.
+    Given a tuple of requested dumps to restore and a set of dumps actually restored, raise
+    ValueError if any requested dumps to restore weren't restored, indicating that they were missing
+    from the configuration.
     '''
     if not dumps_actually_restored:
         raise ValueError('No data source dumps were found to restore')
 
     missing_dumps = sorted(
-        dumps_to_restore - dumps_actually_restored,
+        set(dumps_to_restore) - dumps_actually_restored,
         key=lambda dump: dump.data_source_name,
     )
 

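For context on the dict-as-ordered-set change in borgmatic/actions/restore.py above: a plain set of Dump instances iterates in an arbitrary, hash-dependent order, while a dict keyed by the same instances de-duplicates like a set but preserves insertion order (guaranteed since Python 3.7), which is what makes the restore ordering deterministic. A minimal standalone sketch of the idea, using a simplified stand-in for the real Dump type and made-up hook and database names:

    import collections

    # Simplified stand-in for borgmatic.actions.restore.Dump (assumed here to be a
    # hashable namedtuple-like value; the real type has more fields).
    Dump = collections.namedtuple('Dump', ('hook_name', 'data_source_name'))

    dumps_from_archive = [
        Dump('postgresql_databases', 'users'),
        Dump('postgresql_databases', 'billing'),
        Dump('postgresql_databases', 'users'),  # Duplicate: collapses into one key below.
    ]

    # Dict used as an ordered set: keys de-duplicate, insertion order is preserved.
    dumps_to_restore = {}
    for dump in dumps_from_archive:
        dumps_to_restore[dump] = None

    assert tuple(dumps_to_restore.keys()) == (
        Dump('postgresql_databases', 'users'),
        Dump('postgresql_databases', 'billing'),
    )
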
+ 23 - 5
borgmatic/hooks/data_source/dump.py

@@ -2,6 +2,7 @@ import fnmatch
 import json
 import logging
 import os
+import re
 import shutil
 
 import borgmatic.actions.restore
@@ -114,16 +115,33 @@ def remove_data_source_dumps(dump_path, data_source_type_name, dry_run):
         shutil.rmtree(dump_path)
 
 
+END_OF_STRING_PATTERN = re.compile(r'\\z', flags=re.IGNORECASE)
+
+
 def convert_glob_patterns_to_borg_pattern(patterns):
     '''
     Convert a sequence of shell glob patterns like "/etc/*", "/tmp/*" to the corresponding Borg
     regular expression archive pattern as a single string like "re:etc/.*|tmp/.*".
     '''
-    # Remove the "\z" or "\Z" generated by fnmatch.translate() because we don't want the pattern to
-    # match only at the end of a path, as directory format dumps require extracting files with paths
-    # longer than the pattern. E.g., a pattern of "borgmatic/*/foo_databases/test" should also match
-    # paths like "borgmatic/*/foo_databases/test/toc.dat"
+    # This deserves some explanation. Here's what this code is doing for each shell glob pattern:
+    #
+    #  * Strip off the leading slash, since Borg doesn't store leading slashes in archives.
+    #  * Use fnmatch.translate() to convert the pattern to a Borg pattern.
+    #  * Remove the "\z" or "\Z" end-of-string special character generated by fnmatch.translate(),
+    #    because Borg doesn't like it. Replace it with a "$" end-of-string special character
+    #    instead. And yes, this is using a regular expression to modify a regular expression.
+    #  * Do the above for each of:
+    #    * The plain pattern. This supports the use case of a standard database where its name is a
+    #      filename in the path. Example: borgmatic/foo_databases/hostname/test
+    #    * The pattern with "/*" tacked onto the end of it. This supports the use case of a
+    #      directory-format database where its name is a directory name in the path. Example:
+    #      borgmatic/foo_databases/hostname/test/toc.dat
+    #
+    # Join the resulting transformed patterns together with "|" and return them as a string.
     return 're:' + '|'.join(
-        fnmatch.translate(pattern.lstrip('/')).replace('\\z', '').replace('\\Z', '') + '$'
+        re.sub(END_OF_STRING_PATTERN, '$', fnmatch.translate(stripped))
+        + '|'
+        + re.sub(END_OF_STRING_PATTERN, '$', fnmatch.translate(stripped + '/*'))
         for pattern in patterns
+        for stripped in (pattern.lstrip('/'),)
     )
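
To make the conversion above concrete, here is a standalone sketch of the same transformation (the constant and function mirror the additions to dump.py; the glob and archive member paths are made up, modeled on the examples in the comments). It demonstrates that the resulting regular expression matches both a plain dump file and a file inside a directory-format dump:

    import fnmatch
    import re

    END_OF_STRING_PATTERN = re.compile(r'\\z', flags=re.IGNORECASE)


    def convert_glob_patterns_to_borg_pattern(patterns):
        # For each glob: strip the leading slash, translate it to a regular expression,
        # swap the "\Z" anchor for "$", and add a second alternative with "/*" appended
        # so that members of directory-format dumps match too.
        return 're:' + '|'.join(
            re.sub(END_OF_STRING_PATTERN, '$', fnmatch.translate(stripped))
            + '|'
            + re.sub(END_OF_STRING_PATTERN, '$', fnmatch.translate(stripped + '/*'))
            for pattern in patterns
            for stripped in (pattern.lstrip('/'),)
        )


    borg_pattern = convert_glob_patterns_to_borg_pattern(['/borgmatic/*/foo_databases/test'])
    regex = re.compile(borg_pattern[len('re:'):])

    # A single-file dump matches, as it did before this change ...
    assert regex.match('borgmatic/12345/foo_databases/test')
    # ... and now so does a file inside a directory-format dump.
    assert regex.match('borgmatic/12345/foo_databases/test/toc.dat')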