qcow2: keep reference on zeroize with discard-no-unref enabled

author Jean-Louis Dupond <jean-louis@dupond.be>
Tue, 3 Oct 2023 12:52:37 +0000 (14:52 +0200)

committer Michael Tokarev <mjt@tls.msk.ru>
Thu, 9 Nov 2023 13:39:13 +0000 (16:39 +0300)

diff --git a/block/qcow2-cluster.c b/block/qcow2-cluster.c

index f4f6cd6ad020e63a6166d3389720ecfb2de30f48..fc764aea4dc6dc0020f498db2b9f875adb793645 100644 (file)
--- a/block/qcow2-cluster.c
+++ b/block/qcow2-cluster.c
@@ -1984,7 +1984,7 @@ static int discard_in_l2_slice(BlockDriverState *bs, uint64_t offset,
              /* If we keep the reference, pass on the discard still */
              bdrv_pdiscard(s->data_file, old_l2_entry & L2E_OFFSET_MASK,
                            s->cluster_size);
-       }
+        }
      }
  
      qcow2_cache_put(s->l2_table_cache, (void **) &l2_slice);
@@ -2062,9 +2062,15 @@ zero_in_l2_slice(BlockDriverState *bs, uint64_t offset,
          QCow2ClusterType type = qcow2_get_cluster_type(bs, old_l2_entry);
          bool unmap = (type == QCOW2_CLUSTER_COMPRESSED) ||
              ((flags & BDRV_REQ_MAY_UNMAP) && qcow2_cluster_is_allocated(type));
-        uint64_t new_l2_entry = unmap ? 0 : old_l2_entry;
+        bool keep_reference =
+            (s->discard_no_unref && type != QCOW2_CLUSTER_COMPRESSED);
+        uint64_t new_l2_entry = old_l2_entry;
          uint64_t new_l2_bitmap = old_l2_bitmap;
  
+        if (unmap && !keep_reference) {
+            new_l2_entry = 0;
+        }
+
          if (has_subclusters(s)) {
              new_l2_bitmap = QCOW_L2_BITMAP_ALL_ZEROES;
          } else {
@@ -2082,9 +2088,17 @@ zero_in_l2_slice(BlockDriverState *bs, uint64_t offset,
              set_l2_bitmap(s, l2_slice, l2_index + i, new_l2_bitmap);
          }
  
-        /* Then decrease the refcount */
          if (unmap) {
-            qcow2_free_any_cluster(bs, old_l2_entry, QCOW2_DISCARD_REQUEST);
+            if (!keep_reference) {
+                /* Then decrease the refcount */
+                qcow2_free_any_cluster(bs, old_l2_entry, QCOW2_DISCARD_REQUEST);
+            } else if (s->discard_passthrough[QCOW2_DISCARD_REQUEST] &&
+                       (type == QCOW2_CLUSTER_NORMAL ||
+                        type == QCOW2_CLUSTER_ZERO_ALLOC)) {
+                /* If we keep the reference, pass on the discard still */
+                bdrv_pdiscard(s->data_file, old_l2_entry & L2E_OFFSET_MASK,
+                            s->cluster_size);
+            }
          }
      }
  
diff --git a/qapi/block-core.json b/qapi/block-core.json

index 2b1d493d6e09470c03142c215887178c1a61eb21..bca1a0c37259c4341f28523cc0dbf0fc571ca6fe 100644 (file)
--- a/qapi/block-core.json
+++ b/qapi/block-core.json
@@ -3473,16 +3473,20 @@
  # @pass-discard-other: whether discard requests for the data source
  #     should be issued on other occasions where a cluster gets freed
  #
-# @discard-no-unref: when enabled, discards from the guest will not
-#     cause cluster allocations to be relinquished.  This prevents
-#     qcow2 fragmentation that would be caused by such discards.
-#     Besides potential performance degradation, such fragmentation
-#     can lead to increased allocation of clusters past the end of the
-#     image file, resulting in image files whose file length can grow
-#     much larger than their guest disk size would suggest.  If image
-#     file length is of concern (e.g. when storing qcow2 images
-#     directly on block devices), you should consider enabling this
-#     option.  (since 8.1)
+# @discard-no-unref: when enabled, data clusters will remain
+#     preallocated when they are no longer used, e.g. because they are
+#     discarded or converted to zero clusters.  As usual, whether the
+#     old data is discarded or kept on the protocol level (i.e. in the
+#     image file) depends on the setting of the pass-discard-request
+#     option.  Keeping the clusters preallocated prevents qcow2
+#     fragmentation that would otherwise be caused by freeing and
+#     re-allocating them later.  Besides potential performance
+#     degradation, such fragmentation can lead to increased allocation
+#     of clusters past the end of the image file, resulting in image
+#     files whose file length can grow much larger than their guest disk
+#     size would suggest.  If image file length is of concern (e.g. when
+#     storing qcow2 images directly on block devices), you should
+#     consider enabling this option.  (since 8.1)
  #
  # @overlap-check: which overlap checks to perform for writes to the
  #     image, defaults to 'cached' (since 2.2)
diff --git a/qemu-options.hx b/qemu-options.hx

index b56f6b2fb2f7d68f8eb3f8623e3156cda7630408..8073f5edf52105463812b87b4cf34099c2501aae 100644 (file)
--- a/qemu-options.hx
+++ b/qemu-options.hx
@@ -1436,9 +1436,13 @@ SRST
              (on/off; default: off)
  
          ``discard-no-unref``
-            When enabled, discards from the guest will not cause cluster
-            allocations to be relinquished. This prevents qcow2 fragmentation
-            that would be caused by such discards. Besides potential
+            When enabled, data clusters will remain preallocated when they are
+            no longer used, e.g. because they are discarded or converted to
+            zero clusters. As usual, whether the old data is discarded or kept
+            on the protocol level (i.e. in the image file) depends on the
+            setting of the pass-discard-request option. Keeping the clusters
+            preallocated prevents qcow2 fragmentation that would otherwise be
+            caused by freeing and re-allocating them later. Besides potential
              performance degradation, such fragmentation can lead to increased
              allocation of clusters past the end of the image file,
              resulting in image files whose file length can grow much larger
author	Jean-Louis Dupond <jean-louis@dupond.be>
	Tue, 3 Oct 2023 12:52:37 +0000 (14:52 +0200)
committer	Michael Tokarev <mjt@tls.msk.ru>
	Thu, 9 Nov 2023 13:39:13 +0000 (16:39 +0300)
block/qcow2-cluster.c		patch \| blob \| blame \| history
qapi/block-core.json		patch \| blob \| blame \| history
qemu-options.hx		patch \| blob \| blame \| history