]> git.ipfire.org Git - thirdparty/xfsprogs-dev.git/commitdiff
mkfs.xfs: format reflink enabled filesystems
authorDarrick J. Wong <darrick.wong@oracle.com>
Tue, 25 Oct 2016 22:14:36 +0000 (15:14 -0700)
committerDarrick J. Wong <darrick.wong@oracle.com>
Wed, 26 Oct 2016 23:41:08 +0000 (16:41 -0700)
Create the refcount btree at mkfs time and set the feature flag.

v2: Turn on the reflink feature when calculating the minimum log size.

Signed-off-by: Darrick J. Wong <darrick.wong@oracle.com>
include/xfs_multidisk.h
libxfs/libxfs_api_defs.h
man/man8/mkfs.xfs.8
mkfs/maxtrres.c
mkfs/xfs_mkfs.c

index 8dc30272acb820a580759e8ba615895d80d8783e..ce9bbced05621ddd6562c8c1bec7830ea3b027df 100644 (file)
@@ -68,6 +68,7 @@ extern void res_failed (int err);
 /* maxtrres.c */
 extern int max_trans_res(unsigned long agsize, int crcs_enabled, int dirversion,
                int sectorlog, int blocklog, int inodelog, int dirblocklog,
-               int logversion, int log_sunit, int finobt, int rmapbt);
+               int logversion, int log_sunit, int finobt, int rmapbt,
+               int reflink);
 
 #endif /* __XFS_MULTIDISK_H__ */
index e95763d56648cb89cda76d872e5c0b6191c44066..d60b6c2246866ca26f15d493ae3dc45d6274697c 100644 (file)
 #define xfs_refcount_lookup_le         libxfs_refcount_lookup_le
 #define xfs_refcount_get_rec           libxfs_refcount_get_rec
 #define xfs_rmap_lookup_le_range       libxfs_rmap_lookup_le_range
+#define xfs_refc_block                 libxfs_refc_block
 
 #endif /* __LIBXFS_API_DEFS_H__ */
index c44b3bd031eaa995b03939e14bbc2bc7cf951818..b2bc223b0e1f425b0a5fcd5af4f2160038459746 100644 (file)
@@ -213,6 +213,34 @@ for filesystems created with the (default)
 option set. When the option
 .B \-m crc=0
 is used, the reverse mapping btree feature is not supported and is disabled.
+.TP
+.BI reflink= value
+This option enables the use of a separate reference count btree index in each
+allocation group. The value is either 0 to disable the feature, or 1 to create
+a reference count btree in each allocation group.
+.IP
+The reference count btree enables the sharing of physical extents between
+the data forks of different files, which is commonly known as "reflink".
+Unlike traditional Unix filesystems which assume that every inode and
+logical block pair map to a unique physical block, a reflink-capable
+XFS filesystem removes the uniqueness requirement, allowing up to four
+billion arbitrary inode/logical block pairs to map to a physical block.
+If a program tries to write to a multiply-referenced block in a file, the write
+will be redirected to a new block, and that file's logical-to-physical
+mapping will be changed to the new block ("copy on write").  This feature
+enables the creation of per-file snapshots and deduplication.  It is only
+available for the data forks of regular files.
+.IP
+By default,
+.B mkfs.xfs
+will not create reference count btrees and therefore will not enable the
+reflink feature.  This feature is only available for filesystems created with
+the (default)
+.B \-m crc=1
+option set. When the option
+.B \-m crc=0
+is used, the reference count btree feature is not supported and reflink is
+disabled.
 .RE
 .TP
 .BI \-d " data_section_options"
index d7978b65fc597293f964df8d2145349fa1421519..fba7818ab17095066c36ea3fd119399e7dcb374b 100644 (file)
@@ -39,7 +39,8 @@ max_trans_res(
        int             logversion,
        int             log_sunit,
        int             finobt,
-       int             rmapbt)
+       int             rmapbt,
+       int             reflink)
 {
        xfs_sb_t        *sbp;
        xfs_mount_t     mount;
@@ -75,6 +76,8 @@ max_trans_res(
                sbp->sb_features_ro_compat |= XFS_SB_FEAT_RO_COMPAT_FINOBT;
        if (rmapbt)
                sbp->sb_features_ro_compat |= XFS_SB_FEAT_RO_COMPAT_RMAPBT;
+       if (reflink)
+               sbp->sb_features_ro_compat |= XFS_SB_FEAT_RO_COMPAT_REFLINK;
 
        libxfs_mount(&mount, sbp, 0,0,0,0);
        maxfsb = libxfs_log_calc_minimum_size(&mount);
index 580119e5ef01a4b91db19a1b950767ff04c3f36f..fc565c0dd635efe4f3be847af5d954f49898d5ab 100644 (file)
@@ -672,6 +672,8 @@ struct opt_params mopts = {
                "uuid",
 #define M_RMAPBT       3
                "rmapbt",
+#define M_REFLINK      4
+               "reflink",
                NULL
        },
        .subopt_params = {
@@ -697,6 +699,12 @@ struct opt_params mopts = {
                  .maxval = 1,
                  .defaultval = 0,
                },
+               { .index = M_REFLINK,
+                 .conflicts = { LAST_CONFLICT },
+                 .minval = 0,
+                 .maxval = 1,
+                 .defaultval = 0,
+               },
        },
 };
 
@@ -1155,6 +1163,7 @@ struct sb_feat_args {
        bool    dirftype;
        bool    parent_pointers;
        bool    rmapbt;
+       bool    reflink;
 };
 
 static void
@@ -1227,6 +1236,8 @@ sb_set_features(
                sbp->sb_features_ro_compat = XFS_SB_FEAT_RO_COMPAT_FINOBT;
        if (fp->rmapbt)
                sbp->sb_features_ro_compat |= XFS_SB_FEAT_RO_COMPAT_RMAPBT;
+       if (fp->reflink)
+               sbp->sb_features_ro_compat |= XFS_SB_FEAT_RO_COMPAT_REFLINK;
 
        /*
         * Sparse inode chunk support has two main inode alignment requirements.
@@ -1488,6 +1499,7 @@ main(
                .dirftype = true,
                .parent_pointers = false,
                .rmapbt = false,
+               .reflink = false,
        };
 
        platform_uuid_generate(&uuid);
@@ -1776,6 +1788,10 @@ main(
                                        sb_feat.rmapbt = getnum(
                                                value, &mopts, M_RMAPBT);
                                        break;
+                               case M_REFLINK:
+                                       sb_feat.reflink = getnum(
+                                               value, &mopts, M_REFLINK);
+                                       break;
                                default:
                                        unknown('m', value);
                                }
@@ -2115,6 +2131,13 @@ _("rmapbt not supported without CRC support\n"));
                        usage();
                }
                sb_feat.rmapbt = false;
+
+               if (sb_feat.reflink) {
+                       fprintf(stderr,
+_("reflink not supported without CRC support\n"));
+                       usage();
+               }
+               sb_feat.reflink = false;
        }
 
 
@@ -2599,7 +2622,7 @@ an AG size that is one stripe unit smaller, for example %llu.\n"),
                                   sb_feat.crcs_enabled, sb_feat.dir_version,
                                   sectorlog, blocklog, inodelog, dirblocklog,
                                   sb_feat.log_version, lsunit, sb_feat.finobt,
-                                  sb_feat.rmapbt);
+                                  sb_feat.rmapbt, sb_feat.reflink);
        ASSERT(min_logblocks);
        min_logblocks = MAX(XFS_MIN_LOG_BLOCKS, min_logblocks);
        if (!logsize && dblocks >= (1024*1024*1024) >> blocklog)
@@ -2734,7 +2757,7 @@ _("size %s specified for log subvolume is too large, maximum is %lld blocks\n"),
                printf(_(
                   "meta-data=%-22s isize=%-6d agcount=%lld, agsize=%lld blks\n"
                   "         =%-22s sectsz=%-5u attr=%u, projid32bit=%u\n"
-                  "         =%-22s crc=%-8u finobt=%u, sparse=%u, rmapbt=%u\n"
+                  "         =%-22s crc=%-8u finobt=%u, sparse=%u, rmapbt=%u, reflink=%u\n"
                   "data     =%-22s bsize=%-6u blocks=%llu, imaxpct=%u\n"
                   "         =%-22s sunit=%-6u swidth=%u blks\n"
                   "naming   =version %-14u bsize=%-6u ascii-ci=%d ftype=%d\n"
@@ -2745,7 +2768,7 @@ _("size %s specified for log subvolume is too large, maximum is %lld blocks\n"),
                        "", sectorsize, sb_feat.attr_version,
                                    !sb_feat.projid16bit,
                        "", sb_feat.crcs_enabled, sb_feat.finobt, sb_feat.spinodes,
-                       sb_feat.rmapbt,
+                       sb_feat.rmapbt, sb_feat.reflink,
                        "", blocksize, (long long)dblocks, imaxpct,
                        "", dsunit, dswidth,
                        sb_feat.dir_version, dirblocksize, sb_feat.nci,
@@ -2933,7 +2956,12 @@ _("size %s specified for log subvolume is too large, maximum is %lld blocks\n"),
                        agf->agf_levels[XFS_BTNUM_RMAPi] = cpu_to_be32(1);
                        agf->agf_rmap_blocks = cpu_to_be32(1);
                }
-
+               if (xfs_sb_version_hasreflink(&mp->m_sb)) {
+                       agf->agf_refcount_root = cpu_to_be32(
+                                       libxfs_refc_block(mp));
+                       agf->agf_refcount_level = cpu_to_be32(1);
+                       agf->agf_refcount_blocks = cpu_to_be32(1);
+               }
                agf->agf_flfirst = 0;
                agf->agf_fllast = cpu_to_be32(XFS_AGFL_SIZE(mp) - 1);
                agf->agf_flcount = 0;
@@ -3101,6 +3129,24 @@ _("size %s specified for log subvolume is too large, maximum is %lld blocks\n"),
 
                libxfs_writebuf(buf, LIBXFS_EXIT_ON_FAILURE);
 
+               /*
+                * refcount btree root block
+                */
+               if (xfs_sb_version_hasreflink(&mp->m_sb)) {
+                       buf = libxfs_getbuf(mp->m_ddev_targp,
+                                       XFS_AGB_TO_DADDR(mp, agno,
+                                               libxfs_refc_block(mp)),
+                                       bsize);
+                       buf->b_ops = &xfs_refcountbt_buf_ops;
+
+                       block = XFS_BUF_TO_BLOCK(buf);
+                       memset(block, 0, blocksize);
+                       libxfs_btree_init_block(mp, buf, XFS_REFC_CRC_MAGIC, 0,
+                                               0, agno, XFS_BTREE_CRC_BLOCKS);
+
+                       libxfs_writebuf(buf, LIBXFS_EXIT_ON_FAILURE);
+               }
+
                /*
                 * INO btree root block
                 */
@@ -3189,9 +3235,21 @@ _("size %s specified for log subvolume is too large, maximum is %lld blocks\n"),
                        rrec->rm_offset = 0;
                        be16_add_cpu(&block->bb_numrecs, 1);
 
+                       /* account for refcount btree root */
+                       if (xfs_sb_version_hasreflink(&mp->m_sb)) {
+                               rrec = XFS_RMAP_REC_ADDR(block, 5);
+                               rrec->rm_startblock = cpu_to_be32(
+                                                       libxfs_refc_block(mp));
+                               rrec->rm_blockcount = cpu_to_be32(1);
+                               rrec->rm_owner = cpu_to_be64(XFS_RMAP_OWN_REFC);
+                               rrec->rm_offset = 0;
+                               be16_add_cpu(&block->bb_numrecs, 1);
+                       }
+
                        /* account for the log space */
                        if (loginternal && agno == logagno) {
-                               rrec = XFS_RMAP_REC_ADDR(block, 5);
+                               rrec = XFS_RMAP_REC_ADDR(block,
+                                       be16_to_cpu(block->bb_numrecs) + 1);
                                rrec->rm_startblock = cpu_to_be32(
                                                XFS_FSB_TO_AGBNO(mp, logstart));
                                rrec->rm_blockcount = cpu_to_be32(logblocks);
@@ -3446,7 +3504,7 @@ usage( void )
 {
        fprintf(stderr, _("Usage: %s\n\
 /* blocksize */                [-b log=n|size=num]\n\
-/* metadata */         [-m crc=0|1,finobt=0|1,uuid=xxx,rmapbt=0|1]\n\
+/* metadata */         [-m crc=0|1,finobt=0|1,uuid=xxx,rmapbt=0|1,reflink=0|1]\n\
 /* data subvol */      [-d agcount=n,agsize=n,file,name=xxx,size=num,\n\
                            (sunit=value,swidth=value|su=num,sw=num|noalign),\n\
                            sectlog=n|sectsize=num\n\