Sfoglia il codice sorgente

Add --format option to `borg diff`, resolve issue #4634 (#7534)

diff: add --format option

also: refactoring/improvements of BaseFormatter
Tarrailt 2 anni fa
parent
commit
616d5e7330

+ 34 - 37
src/borg/archive.py

@@ -11,6 +11,7 @@ from functools import partial
 from getpass import getuser
 from io import BytesIO
 from itertools import groupby, zip_longest
+from typing import Iterator
 from shutil import get_terminal_size
 
 from .platformflags import is_win32
@@ -297,31 +298,24 @@ class DownloadPipeline:
         unpacker = msgpack.Unpacker(use_list=False)
         for data in self.fetch_many(ids):
             unpacker.feed(data)
-            items = [Item(internal_dict=item) for item in unpacker]
-            for item in items:
+            for _item in unpacker:
+                item = Item(internal_dict=_item)
                 if "chunks" in item:
                     item.chunks = [ChunkListEntry(*e) for e in item.chunks]
-
-            if filter:
-                items = [item for item in items if filter(item)]
-
-            if preload:
-                for item in items:
-                    if "chunks" in item:
-                        hlid = item.get("hlid", None)
-                        if hlid is None:
-                            preload_chunks = True
-                        else:
-                            if hlid in hlids_preloaded:
-                                preload_chunks = False
-                            else:
-                                # not having the hardlink's chunks already preloaded for other hardlink to same inode
-                                preload_chunks = True
-                                hlids_preloaded.add(hlid)
-                        if preload_chunks:
-                            self.repository.preload([c.id for c in item.chunks])
-
-            for item in items:
+                if filter and not filter(item):
+                    continue
+                if preload and "chunks" in item:
+                    hlid = item.get("hlid", None)
+                    if hlid is None:
+                        preload_chunks = True
+                    elif hlid in hlids_preloaded:
+                        preload_chunks = False
+                    else:
+                        # not having the hardlink's chunks already preloaded for other hardlink to same inode
+                        preload_chunks = True
+                        hlids_preloaded.add(hlid)
+                    if preload_chunks:
+                        self.repository.preload([c.id for c in item.chunks])
                 yield item
 
     def fetch_many(self, ids, is_preloaded=False):
@@ -631,10 +625,9 @@ Duration: {0.duration}
     def iter_items(self, filter=None, preload=False):
         # note: when calling this with preload=True, later fetch_many() must be called with
         # is_preloaded=True or the RemoteRepository code will leak memory!
-        for item in self.pipeline.unpack_many(
+        yield from self.pipeline.unpack_many(
             self.metadata.items, preload=preload, filter=lambda item: self.item_filter(item, filter)
-        ):
-            yield item
+        )
 
     def add_item(self, item, show_progress=True, stats=None):
         if show_progress and self.show_progress:
@@ -1123,55 +1116,59 @@ Duration: {0.duration}
             logger.warning("borg check --repair is required to free all space.")
 
     @staticmethod
-    def compare_archives_iter(archive1, archive2, matcher=None, can_compare_chunk_ids=False, content_only=False):
+    def compare_archives_iter(
+        archive1: "Archive", archive2: "Archive", matcher=None, can_compare_chunk_ids=False
+    ) -> Iterator[ItemDiff]:
         """
-        Yields tuples with a path and an ItemDiff instance describing changes/indicating equality.
+        Yields an ItemDiff instance describing changes/indicating equality.
 
         :param matcher: PatternMatcher class to restrict results to only matching paths.
         :param can_compare_chunk_ids: Whether --chunker-params are the same for both archives.
         """
 
-        def compare_items(item1, item2):
+        def compare_items(path: str, item1: Item, item2: Item):
             return ItemDiff(
+                path,
                 item1,
                 item2,
                 archive1.pipeline.fetch_many([c.id for c in item1.get("chunks", [])]),
                 archive2.pipeline.fetch_many([c.id for c in item2.get("chunks", [])]),
                 can_compare_chunk_ids=can_compare_chunk_ids,
-                content_only=content_only,
             )
 
-        orphans_archive1 = OrderedDict()
-        orphans_archive2 = OrderedDict()
+        orphans_archive1: OrderedDict[str, Item] = OrderedDict()
+        orphans_archive2: OrderedDict[str, Item] = OrderedDict()
+
+        assert matcher is not None, "matcher must be set"
 
         for item1, item2 in zip_longest(
             archive1.iter_items(lambda item: matcher.match(item.path)),
             archive2.iter_items(lambda item: matcher.match(item.path)),
         ):
             if item1 and item2 and item1.path == item2.path:
-                yield (item1.path, compare_items(item1, item2))
+                yield compare_items(item1.path, item1, item2)
                 continue
             if item1:
                 matching_orphan = orphans_archive2.pop(item1.path, None)
                 if matching_orphan:
-                    yield (item1.path, compare_items(item1, matching_orphan))
+                    yield compare_items(item1.path, item1, matching_orphan)
                 else:
                     orphans_archive1[item1.path] = item1
             if item2:
                 matching_orphan = orphans_archive1.pop(item2.path, None)
                 if matching_orphan:
-                    yield (matching_orphan.path, compare_items(matching_orphan, item2))
+                    yield compare_items(matching_orphan.path, matching_orphan, item2)
                 else:
                     orphans_archive2[item2.path] = item2
         # At this point orphans_* contain items that had no matching partner in the other archive
         for added in orphans_archive2.values():
             path = added.path
             deleted_item = Item.create_deleted(path)
-            yield (path, compare_items(deleted_item, added))
+            yield compare_items(path, deleted_item, added)
         for deleted in orphans_archive1.values():
             path = deleted.path
             deleted_item = Item.create_deleted(path)
-            yield (path, compare_items(deleted, deleted_item))
+            yield compare_items(path, deleted, deleted_item)
 
 
 class MetadataCollector:

+ 82 - 34
src/borg/archiver/diff_cmd.py

@@ -1,13 +1,14 @@
 import argparse
+import textwrap
 import json
+import sys
+import os
 
-from ._common import with_repository, with_archive, build_matcher
+from ._common import with_repository, with_archive, build_matcher, Highlander
 from ..archive import Archive
 from ..constants import *  # NOQA
-from ..helpers import archivename_validator
+from ..helpers import BaseFormatter, DiffFormatter, archivename_validator, BorgJsonEncoder
 from ..manifest import Manifest
-from ..helpers.parseformat import BorgJsonEncoder
-
 from ..logger import create_logger
 
 logger = create_logger()
@@ -18,14 +19,12 @@ class DiffMixIn:
     @with_archive
     def do_diff(self, args, repository, manifest, archive):
         """Diff contents of two archives"""
-
-        def print_json_output(diff, path):
-            print(json.dumps({"path": path, "changes": [j for j, str in diff]}, sort_keys=True, cls=BorgJsonEncoder))
-
-        def print_text_output(diff, path):
-            print("{:<19} {}".format(" ".join([str for j, str in diff]), path))
-
-        print_output = print_json_output if args.json_lines else print_text_output
+        if args.format is not None:
+            format = args.format
+        elif args.content_only:
+            format = "{content}{link}{directory}{blkdev}{chrdev}{fifo} {path}{NL}"
+        else:
+            format = os.environ.get("BORG_DIFF_FORMAT", "{change} {path}{NL}")
 
         archive1 = archive
         archive2 = Archive(manifest, args.other_name)
@@ -43,17 +42,36 @@ class DiffMixIn:
 
         matcher = build_matcher(args.patterns, args.paths)
 
-        diffs = Archive.compare_archives_iter(
-            archive1, archive2, matcher, can_compare_chunk_ids=can_compare_chunk_ids, content_only=args.content_only
+        diffs_iter = Archive.compare_archives_iter(
+            archive1, archive2, matcher, can_compare_chunk_ids=can_compare_chunk_ids
         )
         # Conversion to string and filtering for diff.equal to save memory if sorting
-        diffs = ((path, diff.changes()) for path, diff in diffs if not diff.equal)
+        diffs = (diff for diff in diffs_iter if not diff.equal(args.content_only))
 
         if args.sort:
-            diffs = sorted(diffs)
-
-        for path, diff in diffs:
-            print_output(diff, path)
+            diffs = sorted(diffs, key=lambda diff: diff.path)
+
+        formatter = DiffFormatter(format, args.content_only)
+        for diff in diffs:
+            if args.json_lines:
+                print(
+                    json.dumps(
+                        {
+                            "path": diff.path,
+                            "changes": [
+                                change.to_dict()
+                                for name, change in diff.changes().items()
+                                if not args.content_only or (name not in DiffFormatter.METADATA)
+                            ],
+                        },
+                        sort_keys=True,
+                        cls=BorgJsonEncoder,
+                    )
+                )
+            else:
+                res: str = formatter.format_item(diff)
+                if res.strip():
+                    sys.stdout.write(res)
 
         for pattern in matcher.get_unmatched_include_patterns():
             self.print_warning("Include pattern '%s' never matched.", pattern)
@@ -64,25 +82,48 @@ class DiffMixIn:
         from ._common import process_epilog
         from ._common import define_exclusion_group
 
-        diff_epilog = process_epilog(
-            """
-            This command finds differences (file contents, user/group/mode) between archives.
+        diff_epilog = (
+            process_epilog(
+                """
+        This command finds differences (file contents, metadata) between ARCHIVE1 and ARCHIVE2.
+
+        For more help on include/exclude patterns, see the :ref:`borg_patterns` command output.
+
+        .. man NOTES
+
+        The FORMAT specifier syntax
+        +++++++++++++++++++++++++++
+
+        The ``--format`` option uses python's `format string syntax
+        <https://docs.python.org/3.9/library/string.html#formatstrings>`_.
 
-            A repository location and an archive name must be specified for REPO::ARCHIVE1.
-            ARCHIVE2 is just another archive name in same repository (no repository location
-            allowed).
+        Examples:
+        ::
 
-            For archives created with Borg 1.1 or newer diff automatically detects whether
-            the archives are created with the same chunker params. If so, only chunk IDs
-            are compared, which is very fast.
+            $ borg diff --format '{content:30} {path}{NL}' ArchiveFoo ArchiveBar
+            modified:  +4.1 kB  -1.0 kB    file-diff
+            ...
 
-            For archives prior to Borg 1.1 chunk contents are compared by default.
-            If you did not create the archives with different chunker params,
-            pass ``--same-chunker-params``.
-            Note that the chunker params changed from Borg 0.xx to 1.0.
+            # {VAR:<NUMBER} - pad to NUMBER columns left-aligned.
+            # {VAR:>NUMBER} - pad to NUMBER columns right-aligned.
+            $ borg diff --format '{content:>30} {path}{NL}' ArchiveFoo ArchiveBar
+               modified:  +4.1 kB  -1.0 kB file-diff
+            ...
 
-            For more help on include/exclude patterns, see the :ref:`borg_patterns` command output.
-            """
+        The following keys are always available:
+
+
+        """
+            )
+            + BaseFormatter.keys_help()
+            + textwrap.dedent(
+                """
+
+        Keys available only when showing differences between archives:
+
+        """
+            )
+            + DiffFormatter.keys_help()
         )
         subparser = subparsers.add_parser(
             "diff",
@@ -107,6 +148,13 @@ class DiffMixIn:
             help="Override check of chunker parameters.",
         )
         subparser.add_argument("--sort", dest="sort", action="store_true", help="Sort the output lines by file path.")
+        subparser.add_argument(
+            "--format",
+            metavar="FORMAT",
+            dest="format",
+            action=Highlander,
+            help='specify format for differences between archives (default: "{change} {path}{NL}")',
+        )
         subparser.add_argument("--json-lines", action="store_true", help="Format output as JSON Lines. ")
         subparser.add_argument(
             "--content-only",

+ 2 - 3
src/borg/archiver/list_cmd.py

@@ -29,10 +29,9 @@ class ListMixIn:
 
         def _list_inner(cache):
             archive = Archive(manifest, args.name, cache=cache)
-
-            formatter = ItemFormatter(archive, format, json_lines=args.json_lines)
+            formatter = ItemFormatter(archive, format)
             for item in archive.iter_items(lambda item: matcher.match(item.path)):
-                sys.stdout.write(formatter.format_item(item))
+                sys.stdout.write(formatter.format_item(item, args.json_lines, sort=True))
 
         # Only load the cache if it will be used
         if ItemFormatter.format_needs_cache(format):

+ 2 - 2
src/borg/archiver/prune_cmd.py

@@ -89,7 +89,7 @@ class PruneMixIn:
             format = "{archive}"
         else:
             format = os.environ.get("BORG_PRUNE_FORMAT", "{archive:<36} {time} [{id}]")
-        formatter = ArchiveFormatter(format, repository, manifest, manifest.key, json=False, iec=args.iec)
+        formatter = ArchiveFormatter(format, repository, manifest, manifest.key, iec=args.iec)
 
         checkpoint_re = r"\.checkpoint(\.\d+)?"
         archives_checkpoints = manifest.archives.list(
@@ -169,7 +169,7 @@ class PruneMixIn:
                     or (args.list_pruned and archive in to_delete)
                     or (args.list_kept and archive not in to_delete)
                 ):
-                    list_logger.info(f"{log_message:<40} {formatter.format_item(archive)}")
+                    list_logger.info(f"{log_message:<40} {formatter.format_item(archive, jsonline=False)}")
             pi.finish()
             if sig_int:
                 # Ctrl-C / SIGINT: do not checkpoint (commit) again, we already have a checkpoint in this case.

+ 3 - 3
src/borg/archiver/rlist_cmd.py

@@ -23,15 +23,15 @@ class RListMixIn:
             format = "{archive}{NL}"
         else:
             format = os.environ.get("BORG_RLIST_FORMAT", "{archive:<36} {time} [{id}]{NL}")
-        formatter = ArchiveFormatter(format, repository, manifest, manifest.key, json=args.json, iec=args.iec)
+        formatter = ArchiveFormatter(format, repository, manifest, manifest.key, iec=args.iec)
 
         output_data = []
 
         for archive_info in manifest.archives.list_considering(args):
             if args.json:
-                output_data.append(formatter.get_item_data(archive_info))
+                output_data.append(formatter.get_item_data(archive_info, args.json))
             else:
-                sys.stdout.write(formatter.format_item(archive_info))
+                sys.stdout.write(formatter.format_item(archive_info, args.json))
 
         if args.json:
             json_print(basic_json_data(manifest, extra={"archives": output_data}))

+ 1 - 1
src/borg/helpers/__init__.py

@@ -28,7 +28,7 @@ from .parseformat import sizeof_fmt, sizeof_fmt_iec, sizeof_fmt_decimal, Locatio
 from .parseformat import format_line, replace_placeholders, PlaceholderError, relative_time_marker_validator
 from .parseformat import format_archive, parse_stringified_list, clean_lines
 from .parseformat import location_validator, archivename_validator, comment_validator
-from .parseformat import BaseFormatter, ArchiveFormatter, ItemFormatter, file_status
+from .parseformat import BaseFormatter, ArchiveFormatter, ItemFormatter, DiffFormatter, file_status
 from .parseformat import swidth_slice, ellipsis_truncate
 from .parseformat import BorgJsonEncoder, basic_json_data, json_print, json_dump, prepare_dump_dict
 from .parseformat import Highlander, MakePathSafeAction

+ 205 - 109
src/borg/helpers/parseformat.py

@@ -1,3 +1,4 @@
+import abc
 import argparse
 import base64
 import hashlib
@@ -8,6 +9,7 @@ import re
 import shlex
 import stat
 import uuid
+from typing import List, Dict, Set, Tuple, ClassVar, Any, TYPE_CHECKING, Literal
 from binascii import hexlify
 from collections import Counter, OrderedDict
 from datetime import datetime, timezone
@@ -27,6 +29,9 @@ from .. import __version_tuple__ as borg_version_tuple
 from ..constants import *  # NOQA
 from ..platformflags import is_win32
 
+if TYPE_CHECKING:
+    from ..item import ItemDiff
+
 
 def bin_to_hex(binary):
     return hexlify(binary).decode("ascii")
@@ -649,8 +654,10 @@ def archivename_validator(text):
     return validate_text(text)
 
 
-class BaseFormatter:
-    FIXED_KEYS = {
+class BaseFormatter(metaclass=abc.ABCMeta):
+    format: str
+    static_data: Dict[str, Any]
+    FIXED_KEYS: ClassVar[Dict[str, str]] = {
         # Formatting aids
         "LF": "\n",
         "SPACE": " ",
@@ -660,25 +667,49 @@ class BaseFormatter:
         "NEWLINE": "\n",
         "NL": "\n",  # \n is automatically converted to os.linesep on write
     }
+    KEY_DESCRIPTIONS: ClassVar[Dict[str, str]] = {
+        "NEWLINE": "OS dependent line separator",
+        "NL": "alias of NEWLINE",
+        "NUL": "NUL character for creating print0 / xargs -0 like output",
+        "SPACE": "space character",
+        "TAB": "tab character",
+        "CR": "carriage return character",
+        "LF": "line feed character",
+    }
+    KEY_GROUPS: ClassVar[Tuple[Tuple[str, ...], ...]] = (("NEWLINE", "NL", "NUL", "SPACE", "TAB", "CR", "LF"),)
 
-    def get_item_data(self, item):
-        raise NotImplementedError
+    def __init__(self, format: str, static: Dict[str, Any]) -> None:
+        self.format = partial_format(format, static)
+        self.static_data = static
 
-    def format_item(self, item):
-        return self.format.format_map(self.get_item_data(item))
+    @abc.abstractmethod
+    def get_item_data(self, item, jsonline=False) -> dict:
+        raise NotImplementedError
 
-    @staticmethod
-    def keys_help():
+    def format_item(self, item, jsonline=False, sort=False):
+        data = self.get_item_data(item, jsonline)
         return (
-            "- NEWLINE: OS dependent line separator\n"
-            "- NL: alias of NEWLINE\n"
-            "- NUL: NUL character for creating print0 / xargs -0 like output\n"
-            "- SPACE\n"
-            "- TAB\n"
-            "- CR\n"
-            "- LF"
+            f"{json.dumps(data, cls=BorgJsonEncoder, sort_keys=sort)}\n" if jsonline else self.format.format_map(data)
         )
 
+    @classmethod
+    def keys_help(cls):
+        help = []
+        keys: Set[str] = set()
+        keys.update(cls.KEY_DESCRIPTIONS.keys())
+        keys.update(key for group in cls.KEY_GROUPS for key in group)
+
+        for group in cls.KEY_GROUPS:
+            for key in group:
+                keys.remove(key)
+                text = "- " + key
+                if key in cls.KEY_DESCRIPTIONS:
+                    text += ": " + cls.KEY_DESCRIPTIONS[key]
+                help.append(text)
+            help.append("")
+        assert not keys, str(keys)
+        return "\n".join(help)
+
 
 class ArchiveFormatter(BaseFormatter):
     KEY_DESCRIPTIONS = {
@@ -703,47 +734,17 @@ class ArchiveFormatter(BaseFormatter):
         ("size", "nfiles"),
     )
 
-    @classmethod
-    def available_keys(cls):
-        from ..manifest import ArchiveInfo
-
-        fake_archive_info = ArchiveInfo("archivename", b"\1" * 32, datetime(1970, 1, 1, tzinfo=timezone.utc))
-        formatter = cls("", None, None, None)
-        keys = []
-        keys.extend(formatter.call_keys.keys())
-        keys.extend(formatter.get_item_data(fake_archive_info).keys())
-        return keys
-
-    @classmethod
-    def keys_help(cls):
-        help = []
-        keys = cls.available_keys()
-        for key in cls.FIXED_KEYS:
-            keys.remove(key)
-
-        for group in cls.KEY_GROUPS:
-            for key in group:
-                keys.remove(key)
-                text = "- " + key
-                if key in cls.KEY_DESCRIPTIONS:
-                    text += ": " + cls.KEY_DESCRIPTIONS[key]
-                help.append(text)
-            help.append("")
-        assert not keys, str(keys)
-        return "\n".join(help)
-
-    def __init__(self, format, repository, manifest, key, *, json=False, iec=False):
+    def __init__(self, format, repository, manifest, key, *, iec=False):
+        static_data = {}  # here could be stuff on repo level, above archive level
+        static_data.update(self.FIXED_KEYS)
+        super().__init__(format, static_data)
         self.repository = repository
         self.manifest = manifest
         self.key = key
         self.name = None
         self.id = None
         self._archive = None
-        self.json = json
         self.iec = iec
-        static_keys = {}  # here could be stuff on repo level, above archive level
-        static_keys.update(self.FIXED_KEYS)
-        self.format = partial_format(format, static_keys)
         self.format_keys = {f[1] for f in Formatter().parse(format)}
         self.call_keys = {
             "hostname": partial(self.get_meta, "hostname", ""),
@@ -755,20 +756,12 @@ class ArchiveFormatter(BaseFormatter):
             "end": self.get_ts_end,
         }
         self.used_call_keys = set(self.call_keys) & self.format_keys
-        if self.json:
-            self.item_data = {}
-            self.format_item = self.format_item_json
-        else:
-            self.item_data = static_keys
-
-    def format_item_json(self, item):
-        return json.dumps(self.get_item_data(item), cls=BorgJsonEncoder) + "\n"
 
-    def get_item_data(self, archive_info):
+    def get_item_data(self, archive_info, jsonline=False):
         self.name = archive_info.name
         self.id = archive_info.id
         item_data = {}
-        item_data.update(self.item_data)
+        item_data.update({} if jsonline else self.static_data)
         item_data.update(
             {
                 "name": archive_info.name,
@@ -812,15 +805,31 @@ class ItemFormatter(BaseFormatter):
     # shake_* is not provided because it uses an incompatible .digest() method to support variable length.
     hash_algorithms = set(hashlib.algorithms_guaranteed).union({"xxh64"}).difference({"shake_128", "shake_256"})
     KEY_DESCRIPTIONS = {
+        "type": "file type (file, dir, symlink, ...)",
+        "mode": "file mode (as in stat)",
+        "uid": "user id of file owner",
+        "gid": "group id of file owner",
+        "user": "user name of file owner",
+        "group": "group name of file owner",
         "path": "file path",
         "target": "link target for symlinks",
         "hlid": "hard link identity (same if hardlinking same fs object)",
+        "flags": "file flags",
         "extra": 'prepends {target} with " -> " for soft links and " link to " for hard links',
+        "size": "file size",
         "dsize": "deduplicated size",
         "num_chunks": "number of chunks in this file",
         "unique_chunks": "number of unique chunks in this file",
+        "mtime": "file modification time",
+        "ctime": "file change time",
+        "atime": "file access time",
+        "isomtime": "file modification time (ISO 8601 format)",
+        "isoctime": "file change time (ISO 8601 format)",
+        "isoatime": "file access time (ISO 8601 format)",
         "xxh64": "XXH64 checksum of this file (note: this is NOT a cryptographic hash!)",
         "health": 'either "healthy" (file ok) or "broken" (if file has all-zero replacement chunks)',
+        "archiveid": "internal ID of the archive",
+        "archivename": "name of the archive",
     }
     KEY_GROUPS = (
         ("type", "mode", "uid", "gid", "user", "group", "path", "target", "hlid", "flags"),
@@ -833,57 +842,19 @@ class ItemFormatter(BaseFormatter):
 
     KEYS_REQUIRING_CACHE = ("dsize", "unique_chunks")
 
-    @classmethod
-    def available_keys(cls):
-        class FakeArchive:
-            fpr = name = ""
-
-        from ..item import Item
-
-        fake_item = Item(mode=0, path="foo", user="", group="", mtime=0, uid=0, gid=0)
-        formatter = cls(FakeArchive, "")
-        keys = []
-        keys.extend(formatter.call_keys.keys())
-        keys.extend(formatter.get_item_data(fake_item).keys())
-        return keys
-
-    @classmethod
-    def keys_help(cls):
-        help = []
-        keys = cls.available_keys()
-        for key in cls.FIXED_KEYS:
-            keys.remove(key)
-
-        for group in cls.KEY_GROUPS:
-            for key in group:
-                keys.remove(key)
-                text = "- " + key
-                if key in cls.KEY_DESCRIPTIONS:
-                    text += ": " + cls.KEY_DESCRIPTIONS[key]
-                help.append(text)
-            help.append("")
-        assert not keys, str(keys)
-        return "\n".join(help)
-
     @classmethod
     def format_needs_cache(cls, format):
         format_keys = {f[1] for f in Formatter().parse(format)}
         return any(key in cls.KEYS_REQUIRING_CACHE for key in format_keys)
 
-    def __init__(self, archive, format, *, json_lines=False):
+    def __init__(self, archive, format):
         from ..checksums import StreamingXXH64
 
+        static_data = {"archivename": archive.name, "archiveid": archive.fpr}
+        static_data.update(self.FIXED_KEYS)
+        super().__init__(format, static_data)
         self.xxh64 = StreamingXXH64
         self.archive = archive
-        self.json_lines = json_lines
-        static_keys = {"archivename": archive.name, "archiveid": archive.fpr}
-        static_keys.update(self.FIXED_KEYS)
-        if self.json_lines:
-            self.item_data = {}
-            self.format_item = self.format_item_json
-        else:
-            self.item_data = static_keys
-        self.format = partial_format(format, static_keys)
         self.format_keys = {f[1] for f in Formatter().parse(format)}
         self.call_keys = {
             "size": self.calculate_size,
@@ -901,17 +872,14 @@ class ItemFormatter(BaseFormatter):
             self.call_keys[hash_function] = partial(self.hash_item, hash_function)
         self.used_call_keys = set(self.call_keys) & self.format_keys
 
-    def format_item_json(self, item):
-        return json.dumps(self.get_item_data(item), cls=BorgJsonEncoder, sort_keys=True) + "\n"
-
-    def get_item_data(self, item):
+    def get_item_data(self, item, jsonline=False):
         item_data = {}
-        item_data.update(self.item_data)
+        item_data.update({} if jsonline else self.static_data)
 
         item_data.update(text_to_json("path", item.path))
         target = item.get("target", "")
         item_data.update(text_to_json("target", target))
-        if not self.json_lines:
+        if not jsonline:
             item_data["extra"] = "" if not target else f" -> {item_data['target']}"
 
         hlid = item.get("hlid")
@@ -928,7 +896,7 @@ class ItemFormatter(BaseFormatter):
         item_data.update(text_to_json("user", item.get("user", str(item_data["uid"]))))
         item_data.update(text_to_json("group", item.get("group", str(item_data["gid"]))))
 
-        if self.json_lines:
+        if jsonline:
             item_data["healthy"] = "chunks_healthy" not in item
         else:
             item_data["health"] = "broken" if "chunks_healthy" in item else "healthy"
@@ -944,7 +912,7 @@ class ItemFormatter(BaseFormatter):
 
         item: The item to sum its unique chunks' metadata
         metadata_func: A function that takes a parameter of type ChunkIndexEntry and returns a number, used to return
-                       the metadata needed from the chunk
+        the metadata needed from the chunk
         """
         chunk_index = self.archive.cache.chunks
         chunks = item.get("chunks", [])
@@ -976,6 +944,134 @@ class ItemFormatter(BaseFormatter):
         return self.format_time(key, item).isoformat()
 
 
+class DiffFormatter(BaseFormatter):
+    KEY_DESCRIPTIONS = {
+        "path": "archived file path",
+        "change": "all available changes",
+        "content": "file content change",
+        "mode": "file mode change",
+        "type": "file type change",
+        "owner": "file owner (user/group) change",
+        "user": "file user change",
+        "group": "file group change",
+        "link": "file link change",
+        "directory": "file directory change",
+        "blkdev": "file block device change",
+        "chrdev": "file character device change",
+        "fifo": "file fifo change",
+        "mtime": "file modification time change",
+        "ctime": "file change time change",
+        "isomtime": "file modification time change (ISO 8601)",
+        "isoctime": "file creation time change (ISO 8601)",
+    }
+    KEY_GROUPS = (
+        ("path", "change"),
+        ("content", "mode", "type", "owner", "group", "user"),
+        ("link", "directory", "blkdev", "chrdev", "fifo"),
+        ("mtime", "ctime", "isomtime", "isoctime"),
+    )
+    METADATA = ("mode", "type", "owner", "group", "user", "mtime", "ctime")
+
+    def __init__(self, format, content_only=False):
+        static_data = {}
+        static_data.update(self.FIXED_KEYS)
+        super().__init__(format or "{content}{link}{directory}{blkdev}{chrdev}{fifo} {path}{NL}", static_data)
+        self.content_only = content_only
+        self.format_keys = {f[1] for f in Formatter().parse(format)}
+        self.call_keys = {
+            "content": self.format_content,
+            "mode": self.format_mode,
+            "type": partial(self.format_mode, filetype=True),
+            "owner": partial(self.format_owner),
+            "group": partial(self.format_owner, spec="group"),
+            "user": partial(self.format_owner, spec="user"),
+            "link": partial(self.format_other, "link"),
+            "directory": partial(self.format_other, "directory"),
+            "blkdev": partial(self.format_other, "blkdev"),
+            "chrdev": partial(self.format_other, "chrdev"),
+            "fifo": partial(self.format_other, "fifo"),
+            "mtime": partial(self.format_time, "mtime"),
+            "ctime": partial(self.format_time, "ctime"),
+            "isomtime": partial(self.format_iso_time, "mtime"),
+            "isoctime": partial(self.format_iso_time, "ctime"),
+        }
+        self.used_call_keys = set(self.call_keys) & self.format_keys
+        if self.content_only:
+            self.used_call_keys -= set(self.METADATA)
+
+    def get_item_data(self, item: "ItemDiff", jsonline=False) -> dict:
+        diff_data = {}
+        for key in self.used_call_keys:
+            diff_data[key] = self.call_keys[key](item)
+
+        change = []
+        for key in self.call_keys:
+            if key in ("isomtime", "isoctime"):
+                continue
+            if self.content_only and key in self.METADATA:
+                continue
+            change.append(self.call_keys[key](item))
+        diff_data["change"] = " ".join([v for v in change if v])
+        diff_data["path"] = item.path
+        diff_data.update({} if jsonline else self.static_data)
+        return diff_data
+
+    def format_other(self, key, diff: "ItemDiff"):
+        change = diff.changes().get(key)
+        return f"{change.diff_type}".ljust(27) if change else ""  # 27 is the length of the content change
+
+    def format_mode(self, diff: "ItemDiff", filetype=False):
+        change = diff.type() if filetype else diff.mode()
+        return f"[{change.diff_data['item1']} -> {change.diff_data['item2']}]" if change else ""
+
+    def format_owner(self, diff: "ItemDiff", spec: Literal["owner", "user", "group"] = "owner"):
+        if spec == "user":
+            change = diff.user()
+            return f"[{change.diff_data['item1']} -> {change.diff_data['item2']}]" if change else ""
+        if spec == "group":
+            change = diff.group()
+            return f"[{change.diff_data['item1']} -> {change.diff_data['item2']}]" if change else ""
+        if spec != "owner":
+            raise ValueError(f"Invalid owner spec: {spec}")
+        change = diff.owner()
+        if change:
+            return "[{}:{} -> {}:{}]".format(
+                change.diff_data["item1"][0],
+                change.diff_data["item1"][1],
+                change.diff_data["item2"][0],
+                change.diff_data["item2"][1],
+            )
+        return ""
+
+    def format_content(self, diff: "ItemDiff"):
+        change = diff.content()
+        if change:
+            if change.diff_type == "added":
+                return "{}: {:>20}".format(change.diff_type, format_file_size(change.diff_data["added"]))
+            if change.diff_type == "removed":
+                return "{}: {:>18}".format(change.diff_type, format_file_size(change.diff_data["removed"]))
+            if "added" not in change.diff_data and "removed" not in change.diff_data:
+                return "modified:  (can't get size)"
+            return "{}: {:>8} {:>8}".format(
+                change.diff_type,
+                format_file_size(change.diff_data["added"], precision=1, sign=True),
+                format_file_size(-change.diff_data["removed"], precision=1, sign=True),
+            )
+        return ""
+
+    def format_time(self, key, diff: "ItemDiff"):
+        change = diff.changes().get(key)
+        return f"[{key}: {change.diff_data['item1']} -> {change.diff_data['item2']}]" if change else ""
+
+    def format_iso_time(self, key, diff: "ItemDiff"):
+        change = diff.changes().get(key)
+        return (
+            f"[{key}: {change.diff_data['item1'].isoformat()} -> {change.diff_data['item2'].isoformat()}]"
+            if change
+            else ""
+        )
+
+
 def file_status(mode):
     if stat.S_ISREG(mode):
         return "A"

+ 30 - 3
src/borg/item.pyi

@@ -1,4 +1,4 @@
-from typing import FrozenSet, Set, NamedTuple, Tuple, Mapping, Dict, List, Iterator, Callable, Any
+from typing import FrozenSet, Set, NamedTuple, Tuple, Mapping, Dict, List, Iterator, Callable, Any, Optional
 
 from .helpers import StableDict
 
@@ -247,9 +247,36 @@ class ManifestItem(PropDict):
     @item_keys.setter
     def item_keys(self, val: Tuple) -> None: ...
 
+class DiffChange:
+    diff_type: str
+    diff_data: Dict[str, Any]
+    def __init__(self, diff_type: str, diff_data: Optional[Dict[str, Any]] = ...) -> None: ...
+    def to_dict(self) -> Dict[str, Any]: ...
+
 class ItemDiff:
-    def __init__(self, *args, **kwargs) -> None: ...
-    def _chunk_content_equal(self, c1: Iterator, c2: Iterator) -> bool: ...
+    path: str
+    def __init__(
+        self,
+        path: str,
+        item1: Item,
+        item2: Item,
+        chunk_1: Iterator,
+        chunk_2: Iterator,
+        numeric_ids: bool = ...,
+        can_compare_chunk_ids: bool = ...,
+    ) -> None: ...
+    def changes(self) -> Dict[str, DiffChange]: ...
+    def equal(self, content_only: bool = ...) -> bool: ...
+    def content(self) -> Optional[DiffChange]: ...
+    def ctime(self) -> Optional[DiffChange]: ...
+    def mtime(self) -> Optional[DiffChange]: ...
+    def mode(self) -> Optional[DiffChange]: ...
+    def type(self) -> Optional[DiffChange]: ...
+    def owner(self) -> Optional[DiffChange]: ...
+    def user(self) -> Optional[DiffChange]: ...
+    def group(self) -> Optional[DiffChange]: ...
+
+def chunk_content_equal(chunks_a: Iterator, chunks_b: Iterator) -> bool: ...
 
 class Key(PropDict):
     @property

+ 91 - 48
src/borg/item.pyx

@@ -620,66 +620,76 @@ cpdef _init_names():
 _init_names()
 
 
+class DiffChange:
+    """
+    Stores a change in a diff.
+
+    The diff_type denotes the type of change, e.g. "added", "removed", "modified".
+    The diff_data contains additional information about the change, e.g. the old and new mode.
+    """
+    def __init__(self, diff_type, diff_data=None):
+        self.diff_type = diff_type
+        self.diff_data = diff_data or {}
+
+    def to_dict(self):
+        return {"type": self.diff_type, **self.diff_data}
+
+
 class ItemDiff:
     """
     Comparison of two items from different archives.
 
     The items may have different paths and still be considered equal (e.g. for renames).
-    It does not include extended or time attributes in the comparison.
     """
 
-    def __init__(self, item1, item2, chunk_iterator1, chunk_iterator2, numeric_ids=False, can_compare_chunk_ids=False, content_only=False):
+    def __init__(self, path, item1, item2, chunk_1, chunk_2, numeric_ids=False, can_compare_chunk_ids=False):
+        self.path = path
         self._item1 = item1
         self._item2 = item2
-        self._content_only = content_only
         self._numeric_ids = numeric_ids
         self._can_compare_chunk_ids = can_compare_chunk_ids
-        self.equal = self._equal(chunk_iterator1, chunk_iterator2)
-        changes = []
+        self._chunk_1 = chunk_1
+        self._chunk_2 = chunk_2
+
+        self._changes = {}
 
         if self._item1.is_link() or self._item2.is_link():
-            changes.append(self._link_diff())
+            self._link_diff()
 
         if 'chunks' in self._item1 and 'chunks' in self._item2:
-            changes.append(self._content_diff())
+            self._content_diff()
 
         if self._item1.is_dir() or self._item2.is_dir():
-            changes.append(self._presence_diff('directory'))
+            self._presence_diff('directory')
 
         if self._item1.is_blk() or self._item2.is_blk():
-            changes.append(self._presence_diff('blkdev'))
+            self._presence_diff('blkdev')
 
         if self._item1.is_chr() or self._item2.is_chr():
-            changes.append(self._presence_diff('chrdev'))
+            self._presence_diff('chrdev')
 
         if self._item1.is_fifo() or self._item2.is_fifo():
-            changes.append(self._presence_diff('fifo'))
+            self._presence_diff('fifo')
 
-        if not self._content_only:
-            if not (self._item1.get('deleted') or self._item2.get('deleted')):
-                changes.append(self._owner_diff())
-                changes.append(self._mode_diff())
-                changes.extend(self._time_diffs())
+        if not (self._item1.get('deleted') or self._item2.get('deleted')):
+            self._owner_diff()
+            self._mode_diff()
+            self._time_diffs()
 
-        # filter out empty changes
-        self._changes = [ch for ch in changes if ch]
 
     def changes(self):
         return self._changes
 
     def __repr__(self):
-        if self.equal:
-            return 'equal'
-        return ' '.join(str for d, str in self._changes)
+        return (' '.join(self._changes.keys())) or 'equal'
 
-    def _equal(self, chunk_iterator1, chunk_iterator2):
+    def equal(self, content_only=False):
         # if both are deleted, there is nothing at path regardless of what was deleted
         if self._item1.get('deleted') and self._item2.get('deleted'):
             return True
 
         attr_list = ['deleted', 'target']
-
-        if not self._content_only:
+        if not content_only:
             attr_list += ['mode', 'ctime', 'mtime']
             attr_list += ['uid', 'gid'] if self._numeric_ids else ['user', 'group']
 
@@ -693,74 +703,107 @@ class ItemDiff:
                 return False
 
         if 'chunks' in self._item1 and 'chunks' in self._item2:
-            return self._content_equal(chunk_iterator1, chunk_iterator2)
+            return self._content_equal()
 
         return True
 
     def _presence_diff(self, item_type):
         if not self._item1.get('deleted') and self._item2.get('deleted'):
-            chg = 'removed ' + item_type
-            return ({"type": chg}, chg)
+            self._changes[item_type] = DiffChange(f"removed {item_type}")
+            return True
         if self._item1.get('deleted') and not self._item2.get('deleted'):
-            chg = 'added ' + item_type
-            return ({"type": chg}, chg)
+            self._changes[item_type] = DiffChange(f"added {item_type}")
+            return True
 
     def _link_diff(self):
-        pd = self._presence_diff('link')
-        if pd is not None:
-            return pd
+        if self._presence_diff('link'):
+            return True
         if 'target' in self._item1 and 'target' in self._item2 and self._item1.target != self._item2.target:
-            return ({"type": 'changed link'}, 'changed link')
+            self._changes['link'] = DiffChange('changed link')
+            return True
 
     def _content_diff(self):
         if self._item1.get('deleted'):
             sz = self._item2.get_size()
-            return ({"type": "added", "size": sz}, 'added {:>13}'.format(format_file_size(sz)))
+            self._changes['content'] = DiffChange("added", {"added": sz, "removed": 0})
+            return True
         if self._item2.get('deleted'):
             sz = self._item1.get_size()
-            return ({"type": "removed", "size": sz}, 'removed {:>11}'.format(format_file_size(sz)))
+            self._changes['content'] = DiffChange("removed", {"added": 0, "removed": sz})
+            return True
         if not self._can_compare_chunk_ids:
-            return ({"type": "modified"}, "modified")
+            self._changes['content'] = DiffChange("modified")
+            return True
         chunk_ids1 = {c.id for c in self._item1.chunks}
         chunk_ids2 = {c.id for c in self._item2.chunks}
         added_ids = chunk_ids2 - chunk_ids1
         removed_ids = chunk_ids1 - chunk_ids2
         added = self._item2.get_size(consider_ids=added_ids)
         removed = self._item1.get_size(consider_ids=removed_ids)
-        return ({"type": "modified", "added": added, "removed": removed},
-            '{:>9} {:>9}'.format(format_file_size(added, precision=1, sign=True),
-            format_file_size(-removed, precision=1, sign=True)))
+        self._changes['content'] = DiffChange("modified", {"added": added, "removed": removed})
+        return True
+
 
     def _owner_diff(self):
         u_attr, g_attr = ('uid', 'gid') if self._numeric_ids else ('user', 'group')
         u1, g1 = self._item1.get(u_attr), self._item1.get(g_attr)
         u2, g2 = self._item2.get(u_attr), self._item2.get(g_attr)
-        if (u1, g1) != (u2, g2):
-            return ({"type": "owner", "old_user": u1, "old_group": g1, "new_user": u2, "new_group": g2},
-                    '[{}:{} -> {}:{}]'.format(u1, g1, u2, g2))
+        if (u1, g1) == (u2, g2):
+            return False
+        self._changes['owner'] = DiffChange("changed owner", {"item1": (u1, g1), "item2": (u2, g2)})
+        if u1 != u2:
+            self._changes['user'] = DiffChange("changed user", {"item1": u1, "item2": u2})
+        if g1 != g2:
+            self._changes['group'] = DiffChange("changed group", {"item1": g1, "item2": g2})
+        return True
 
     def _mode_diff(self):
         if 'mode' in self._item1 and 'mode' in self._item2 and self._item1.mode != self._item2.mode:
             mode1 = stat.filemode(self._item1.mode)
             mode2 = stat.filemode(self._item2.mode)
-            return ({"type": "mode", "old_mode": mode1, "new_mode": mode2}, '[{} -> {}]'.format(mode1, mode2))
+            self._changes['mode'] = DiffChange("changed mode", {"item1": mode1, "item2": mode2})
+            if mode1[0] != mode2[0]:
+                self._changes['type'] = DiffChange("changed type", {"item1": mode1[0], "item2": mode2[0]})
 
     def _time_diffs(self):
-        changes = []
         attrs = ["ctime", "mtime"]
         for attr in attrs:
             if attr in self._item1 and attr in self._item2 and self._item1.get(attr) != self._item2.get(attr):
                 ts1 = OutputTimestamp(safe_timestamp(self._item1.get(attr)))
                 ts2 = OutputTimestamp(safe_timestamp(self._item2.get(attr)))
-                changes.append(({"type": attr, f"old_{attr}": ts1, f"new_{attr}": ts2}, '[{}: {} -> {}]'.format(attr, ts1, ts2)))
-        return changes
+                self._changes[attr] = DiffChange(attr, {"item1": ts1, "item2": ts2})
+        return True
+
+    def content(self):
+        return self._changes.get('content')
+
+    def ctime(self):
+        return self._changes.get('ctime')
+
+    def mtime(self):
+        return self._changes.get('mtime')
+
+    def mode(self):
+        return self._changes.get('mode')
+
+    def type(self):
+        return self._changes.get('type')
+
+    def owner(self):
+        return self._changes.get('owner')
+
+    def user(self):
+        return self._changes.get('user')
+
+    def group(self):
+        return self._changes.get('group')
 
-    def _content_equal(self, chunk_iterator1, chunk_iterator2):
+    def _content_equal(self):
         if self._can_compare_chunk_ids:
             return self._item1.chunks == self._item2.chunks
         if self._item1.get_size() != self._item2.get_size():
             return False
-        return chunks_contents_equal(chunk_iterator1, chunk_iterator2)
+        return chunks_contents_equal(self._chunk_1, self._chunk_2)
 
 
 def chunks_contents_equal(chunks_a, chunks_b):

+ 43 - 27
src/borg/testsuite/archiver/diff_cmd.py

@@ -72,22 +72,20 @@ class ArchiverTestCase(ArchiverTestCaseBase):
         self.cmd(f"--repo={self.repository_location}", "create", "test1b", "input", "--chunker-params", "16,18,17,4095")
 
         def do_asserts(output, can_compare_ids, content_only=False):
-            # File contents changed (deleted and replaced with a new file)
-            change = "B" if can_compare_ids else "{:<19}".format("modified")
-            lines = output.splitlines()
+            lines: list = output.splitlines()
             assert "file_replaced" in output  # added to debug #3494
+            change = "modified.*B" if can_compare_ids else r"modified:  \(can't get size\)"
             self.assert_line_exists(lines, f"{change}.*input/file_replaced")
-
             # File unchanged
             assert "input/file_unchanged" not in output
 
             # Directory replaced with a regular file
             if "BORG_TESTS_IGNORE_MODES" not in os.environ and not is_win32 and not content_only:
-                self.assert_line_exists(lines, "drwxr-xr-x -> -rwxr-xr-x.*input/dir_replaced_with_file")
+                self.assert_line_exists(lines, "[drwxr-xr-x -> -rwxr-xr-x].*input/dir_replaced_with_file")
 
             # Basic directory cases
-            assert "added directory     input/dir_added" in output
-            assert "removed directory   input/dir_removed" in output
+            assert "added directory             input/dir_added" in output
+            assert "removed directory           input/dir_removed" in output
 
             if are_symlinks_supported():
                 # Basic symlink cases
@@ -96,8 +94,9 @@ class ArchiverTestCase(ArchiverTestCaseBase):
                 self.assert_line_exists(lines, "removed link.*input/link_removed")
 
                 # Symlink replacing or being replaced
-                assert "input/dir_replaced_with_link" in output
-                assert "input/link_replaced_by_file" in output
+                if not content_only:
+                    assert "input/dir_replaced_with_link" in output
+                    assert "input/link_replaced_by_file" in output
 
                 # Symlink target removed. Should not affect the symlink at all.
                 assert "input/link_target_removed" not in output
@@ -105,7 +104,7 @@ class ArchiverTestCase(ArchiverTestCaseBase):
             # The inode has two links and the file contents changed. Borg
             # should notice the changes in both links. However, the symlink
             # pointing to the file is not changed.
-            change = "0 B" if can_compare_ids else "{:<19}".format("modified")
+            change = "modified.*0 B" if can_compare_ids else r"modified:  \(can't get size\)"
             self.assert_line_exists(lines, f"{change}.*input/empty")
             if are_hardlinks_supported():
                 self.assert_line_exists(lines, f"{change}.*input/hardlink_contents_changed")
@@ -114,18 +113,18 @@ class ArchiverTestCase(ArchiverTestCaseBase):
 
             # Added a new file and a hard link to it. Both links to the same
             # inode should appear as separate files.
-            assert "added       2.05 kB input/file_added" in output
+            assert "added:              2.05 kB input/file_added" in output
             if are_hardlinks_supported():
-                assert "added       2.05 kB input/hardlink_added" in output
+                assert "added:              2.05 kB input/hardlink_added" in output
 
             # check if a diff between nonexistent and empty new file is found
-            assert "added           0 B input/file_empty_added" in output
+            assert "added:                  0 B input/file_empty_added" in output
 
             # The inode has two links and both of them are deleted. They should
             # appear as two deleted files.
-            assert "removed       256 B input/file_removed" in output
+            assert "removed:              256 B input/file_removed" in output
             if are_hardlinks_supported():
-                assert "removed       256 B input/hardlink_removed" in output
+                assert "removed:              256 B input/hardlink_removed" in output
 
             if are_hardlinks_supported() and content_only:
                 # Another link (marked previously as the source in borg) to the
@@ -143,7 +142,7 @@ class ArchiverTestCase(ArchiverTestCaseBase):
                 chgsets = [j["changes"] for j in data if j["path"] == filename]
                 assert len(chgsets) < 2
                 # return a flattened list of changes for given filename
-                return [chg for chgset in chgsets for chg in chgset]
+                return sum(chgsets, [])
 
             # convert output to list of dicts
             joutput = [json.loads(line) for line in output.split("\n") if line]
@@ -157,7 +156,7 @@ class ArchiverTestCase(ArchiverTestCaseBase):
 
             # Directory replaced with a regular file
             if "BORG_TESTS_IGNORE_MODES" not in os.environ and not is_win32 and not content_only:
-                assert {"type": "mode", "old_mode": "drwxr-xr-x", "new_mode": "-rwxr-xr-x"} in get_changes(
+                assert {"type": "changed mode", "item1": "drwxr-xr-x", "item2": "-rwxr-xr-x"} in get_changes(
                     "input/dir_replaced_with_file", joutput
                 )
 
@@ -175,11 +174,11 @@ class ArchiverTestCase(ArchiverTestCaseBase):
 
                 if not content_only:
                     assert any(
-                        chg["type"] == "mode" and chg["new_mode"].startswith("l")
+                        chg["type"] == "changed mode" and chg["item1"].startswith("d") and chg["item2"].startswith("l")
                         for chg in get_changes("input/dir_replaced_with_link", joutput)
                     ), get_changes("input/dir_replaced_with_link", joutput)
                     assert any(
-                        chg["type"] == "mode" and chg["old_mode"].startswith("l")
+                        chg["type"] == "changed mode" and chg["item1"].startswith("l") and chg["item2"].startswith("-")
                         for chg in get_changes("input/link_replaced_by_file", joutput)
                     ), get_changes("input/link_replaced_by_file", joutput)
 
@@ -198,18 +197,18 @@ class ArchiverTestCase(ArchiverTestCaseBase):
 
             # Added a new file and a hard link to it. Both links to the same
             # inode should appear as separate files.
-            assert {"type": "added", "size": 2048} in get_changes("input/file_added", joutput)
+            assert {"added": 2048, "removed": 0, "type": "added"} in get_changes("input/file_added", joutput)
             if are_hardlinks_supported():
-                assert {"type": "added", "size": 2048} in get_changes("input/hardlink_added", joutput)
+                assert {"added": 2048, "removed": 0, "type": "added"} in get_changes("input/hardlink_added", joutput)
 
             # check if a diff between nonexistent and empty new file is found
-            assert {"type": "added", "size": 0} in get_changes("input/file_empty_added", joutput)
+            assert {"added": 0, "removed": 0, "type": "added"} in get_changes("input/file_empty_added", joutput)
 
             # The inode has two links and both of them are deleted. They should
             # appear as two deleted files.
-            assert {"type": "removed", "size": 256} in get_changes("input/file_removed", joutput)
+            assert {"added": 0, "removed": 256, "type": "removed"} in get_changes("input/file_removed", joutput)
             if are_hardlinks_supported():
-                assert {"type": "removed", "size": 256} in get_changes("input/hardlink_removed", joutput)
+                assert {"added": 0, "removed": 256, "type": "removed"} in get_changes("input/hardlink_removed", joutput)
 
             if are_hardlinks_supported() and content_only:
                 # Another link (marked previously as the source in borg) to the
@@ -251,14 +250,28 @@ class ArchiverTestCase(ArchiverTestCaseBase):
             time.sleep(1)  # HFS has a 1s timestamp granularity
         self.create_regular_file("test_file", size=15)
         self.cmd(f"--repo={self.repository_location}", "create", "archive2", "input")
-        output = self.cmd(f"--repo={self.repository_location}", "diff", "archive1", "archive2")
+        output = self.cmd(
+            f"--repo={self.repository_location}",
+            "diff",
+            "archive1",
+            "archive2",
+            "--format",
+            "'{mtime}{ctime} {path}{NL}'",
+        )
         self.assert_in("mtime", output)
         self.assert_in("ctime", output)  # Should show up on windows as well since it is a new file.
         if is_darwin:
             time.sleep(1)  # HFS has a 1s timestamp granularity
         os.chmod("input/test_file", 0o777)
         self.cmd(f"--repo={self.repository_location}", "create", "archive3", "input")
-        output = self.cmd(f"--repo={self.repository_location}", "diff", "archive2", "archive3")
+        output = self.cmd(
+            f"--repo={self.repository_location}",
+            "diff",
+            "archive2",
+            "archive3",
+            "--format",
+            "'{mtime}{ctime} {path}{NL}'",
+        )
         self.assert_not_in("mtime", output)
         # Checking platform because ctime should not be shown on windows since it wasn't recreated.
         if not is_win32:
@@ -294,7 +307,10 @@ class ArchiverTestCase(ArchiverTestCaseBase):
             "e_file_changed",
             "f_file_removed",
         ]
-        assert all(x in line for x, line in zip(expected, output.splitlines()))
+        assert isinstance(output, str)
+        outputs = output.splitlines()
+        assert len(outputs) == len(expected)
+        assert all(x in line for x, line in zip(expected, outputs))
 
 
 class RemoteArchiverTestCase(RemoteArchiverTestCaseBase, ArchiverTestCase):