Expose hash over ChunkListEntry to borg list --format {chunk_ids_$HASH} #5167

Draft
wants to merge 6 commits into base: master
32 changes: 29 additions & 3 deletions src/borg/helpers/parseformat.py
@@ -688,6 +688,8 @@ class ItemFormatter(BaseFormatter):
        ('size', 'csize', 'dsize', 'dcsize', 'num_chunks', 'unique_chunks'),
        ('mtime', 'ctime', 'atime', 'isomtime', 'isoctime', 'isoatime'),
        tuple(sorted(hash_algorithms)),
        tuple(['chunk_ids_%s' % alg for alg in sorted(hash_algorithms)] + [
            'chunker_params_%s' % alg for alg in sorted(hash_algorithms)]),
Member
The chunker params are the same within one archive, so I guess you do not want to show them for each file?

Contributor Author

Hmm, true, but this would make parsing the output of list harder. As it is now, you can just compare (item['chunk_ids_checksum'], item['chunker_params']) after parsing the output for each item.
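For context, a minimal sketch of that comparison, assuming the chunk_ids_sha256 / chunker_params_sha256 keys added by this PR and that --format keys show up as fields in --json-lines output (archive names are illustrative):

import json
import subprocess

def list_items(archive):
    # Gather (chunk id digest, chunker params digest) per path from borg list.
    fmt = '{path}{chunk_ids_sha256}{chunker_params_sha256}'
    out = subprocess.run(['borg', 'list', '--json-lines', '--format', fmt, archive],
                         check=True, capture_output=True, text=True).stdout
    return {item['path']: (item['chunk_ids_sha256'], item['chunker_params_sha256'])
            for item in map(json.loads, out.splitlines())}

old, new = list_items('repo::archive-1'), list_items('repo::archive-2')
# Paths present in both archives whose chunk lists (or chunker params) differ.
changed = sorted(path for path in old.keys() & new.keys() if old[path] != new[path])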

        ('archiveid', 'archivename', 'extra'),
        ('health', )
    )
@@ -765,6 +767,8 @@ def __init__(self, archive, format, *, json_lines=False):
        }
        for hash_function in self.hash_algorithms:
            self.add_key(hash_function, partial(self.hash_item, hash_function))
            self.call_keys['chunk_ids_%s' % hash_function] = partial(self.hash_chunks, hash_function)
            self.call_keys['chunker_params_%s' % hash_function] = partial(self.hash_chunker_params, hash_function)
        self.used_call_keys = set(self.call_keys) & self.format_keys

    def format_item_json(self, item):
@@ -834,13 +838,35 @@ def calculate_csize(self, item):
        # note: does not support hardlink slaves, they will be csize 0
        return item.get_size(compressed=True)

    def hash_item(self, hash_function, item):
        if 'chunks' not in item:
            return ""
    def prepare_hash_function(self, hash_function):
Contributor
This does not "prepare" the hash function in any way; it just picks one by its name, which is what you pass in rather than a function. Naming it something like get_hash_function(self, name) would be less misleading and more self-explanatory.

        if hash_function in hashlib.algorithms_guaranteed:
            hash = hashlib.new(hash_function)
        elif hash_function == 'xxh64':
            hash = self.xxh64()
        return hash
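Following up on the naming comment above, a hedged sketch of the suggested rename (get_hash_function is the reviewer's proposed name, not code from this PR; the explicit error for unknown names is an added assumption, since the current code would otherwise return an unbound variable):

    def get_hash_function(self, name):
        # Return a fresh hash object selected by algorithm name.
        if name in hashlib.algorithms_guaranteed:
            return hashlib.new(name)
        if name == 'xxh64':
            return self.xxh64()
        raise ValueError('unsupported hash algorithm: %s' % name)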

    def hash_chunker_params(self, hash_function, item):
        hash = self.prepare_hash_function(hash_function)

        chunker_params = self.archive.metadata.get('chunker_params')
        for info in chunker_params:
            hash.update(bytes(info))
        return hash.hexdigest()

    def hash_chunks(self, hash_function, item):
        if 'chunks' not in item:
            return ""
        hash = self.prepare_hash_function(hash_function)
        for chunk in item.chunks:
            hash.update(chunk.id)
            hash.update(bytes(chunk.size))
            hash.update(bytes(chunk.csize))
        return hash.hexdigest()

    def hash_item(self, hash_function, item):
        if 'chunks' not in item:
            return ""
        hash = self.prepare_hash_function(hash_function)
        for data in self.archive.pipeline.fetch_many([c.id for c in item.chunks]):
            hash.update(data)
        return hash.hexdigest()