www.infradead.org Git - users/hch/xfs.git/commitdiff
xfs: wire up a new inode fork type for the realtime rmap
author Darrick J. Wong <djwong@kernel.org>
Thu, 15 Aug 2024 18:48:53 +0000 (11:48 -0700)
committer Darrick J. Wong <djwong@kernel.org>
Fri, 16 Aug 2024 21:54:24 +0000 (14:54 -0700)
Plumb in the pieces we need to embed the root of the realtime rmap
btree in an inode's data fork, complete with new fork type and
on-disk interpretation functions.

Signed-off-by: Darrick J. Wong <djwong@kernel.org>
fs/xfs/libxfs/xfs_format.h
fs/xfs/libxfs/xfs_inode_fork.c
fs/xfs/libxfs/xfs_ondisk.h
fs/xfs/libxfs/xfs_rtrmap_btree.c
fs/xfs/libxfs/xfs_rtrmap_btree.h
fs/xfs/xfs_inode_item_recover.c

index 34210674f5411e1adc2f0e4cf74753308a217b72..45e8924a0c1f38c60fa2adba20f71438681c2280 100644 (file)
@@ -1734,6 +1734,14 @@ typedef __be32 xfs_rmap_ptr_t;
  */
 #define        XFS_RTRMAP_CRC_MAGIC    0x4d415052      /* 'MAPR' */
 
+/*
+ * rtrmap root header, on-disk form only.
+ *
+ * This compact header sits at the start of the inode data fork when the
+ * fork holds a realtime rmap btree root.  The records (leaf root) or the
+ * keys followed by the pointers (node root) come right after it.  Both
+ * fields are stored big-endian.
+ */
+struct xfs_rtrmap_root {
+       __be16          bb_level;       /* 0 is a leaf */
+       __be16          bb_numrecs;     /* current # of data records */
+};
+
 /* inode-based btree pointer type */
 typedef __be64 xfs_rtrmap_ptr_t;
 
index e188723745836d86ce70a3907c275d9b58a3da23..ae25b1bc81c659b067ffc896040db057d8edec23 100644 (file)
@@ -27,6 +27,7 @@
 #include "xfs_errortag.h"
 #include "xfs_health.h"
 #include "xfs_symlink_remote.h"
+#include "xfs_rtrmap_btree.h"
 
 struct kmem_cache *xfs_ifork_cache;
 
@@ -276,8 +277,7 @@ xfs_iformat_data_fork(
                         */
                        if (!xfs_has_rmapbt(ip->i_mount))
                                return -EFSCORRUPTED;
-                       ASSERT(0); /* to be implemented later */
-                       return -EFSCORRUPTED;
+                       return xfs_iformat_rtrmap(ip, dip);
                default:
                        xfs_inode_verifier_error(ip, -EFSCORRUPTED, __func__,
                                        dip, sizeof(*dip), __this_address);
@@ -665,7 +665,9 @@ xfs_iflush_fork(
                break;
 
        case XFS_DINODE_FMT_RMAP:
-               ASSERT(0); /* to be implemented later */
+               ASSERT(whichfork == XFS_DATA_FORK);
+               if (iip->ili_fields & brootflag[whichfork])
+                       xfs_iflush_rtrmap(ip, dip);
                break;
 
        default:
index 7368e7ac319516510edae246cfd151d0d3b81607..8a0171860268041640adca462fed18844795c2ae 100644 (file)
@@ -78,6 +78,7 @@ xfs_check_ondisk_structs(void)
        XFS_CHECK_STRUCT_SIZE(union xfs_suminfo_raw,            4);
        XFS_CHECK_STRUCT_SIZE(struct xfs_rtbuf_blkinfo,         48);
        XFS_CHECK_STRUCT_SIZE(xfs_rtrmap_ptr_t,                 8);
+       XFS_CHECK_STRUCT_SIZE(struct xfs_rtrmap_root,           4);
 
        /*
         * m68k has problems with xfs_attr_leaf_name_remote_t, but we pad it to
index a0d246bd9ff2be012525f2f1b851af58fabe76e0..177fa62cce98e6335caa8155d0e1ee6d2c51961d 100644 (file)
@@ -82,6 +82,39 @@ xfs_rtrmapbt_get_maxrecs(
        return cur->bc_mp->m_rtrmap_mxr[level != 0];
 }
 
+/*
+ * Calculate number of records in the ondisk realtime rmap btree inode root.
+ *
+ * @blocklen is the number of bytes available for the root, including the
+ * struct xfs_rtrmap_root header, which is subtracted before dividing.
+ * A leaf root holds rmap records; a node root needs, per entry, two
+ * struct xfs_rmap_key plus one xfs_rtrmap_ptr_t.
+ *
+ * NOTE(review): @blocklen is unsigned and is not checked against the header
+ * size here, so callers presumably always pass at least
+ * sizeof(struct xfs_rtrmap_root) bytes -- confirm.
+ */
+unsigned int
+xfs_rtrmapbt_droot_maxrecs(
+       unsigned int            blocklen,
+       bool                    leaf)
+{
+       blocklen -= sizeof(struct xfs_rtrmap_root);
+
+       if (leaf)
+               return blocklen / sizeof(struct xfs_rmap_rec);
+       return blocklen / (2 * sizeof(struct xfs_rmap_key) +
+                       sizeof(xfs_rtrmap_ptr_t));
+}
+
+/*
+ * Get the maximum records we could store in the on-disk format.
+ *
+ * For non-root nodes this is equivalent to xfs_rtrmapbt_get_maxrecs, but
+ * for the root node this checks the available space in the dinode fork
+ * so that we can resize the in-memory buffer to match it.  After a
+ * resize to the maximum size this function returns the same value
+ * as xfs_rtrmapbt_get_maxrecs for the root node, too.
+ *
+ * The root is the block at level cur->bc_nlevels - 1; its capacity is
+ * computed from cur->bc_ino.forksize.  Every other level uses the
+ * per-mount limits in m_rtrmap_mxr[], indexed 0 for a leaf (level 0)
+ * and 1 for a node.
+ */
+STATIC int
+xfs_rtrmapbt_get_dmaxrecs(
+       struct xfs_btree_cur    *cur,
+       int                     level)
+{
+       if (level != cur->bc_nlevels - 1)
+               return cur->bc_mp->m_rtrmap_mxr[level != 0];
+       return xfs_rtrmapbt_droot_maxrecs(cur->bc_ino.forksize, level == 0);
+}
+
 /*
  * Convert the ondisk record's offset field into the ondisk key's offset field.
  * Fork and bmbt are significant parts of the rmap record key, but written
@@ -374,6 +407,64 @@ xfs_rtrmapbt_keys_contiguous(
                                 be32_to_cpu(key2->rmap.rm_startblock));
 }
 
+/*
+ * Move the rtrmap btree root from one incore buffer to another.
+ *
+ * @src_broot/@src_bytes and @dst_broot/@dst_bytes describe the old and new
+ * root buffers and their sizes in bytes; the two buffers may be the same
+ * one.  @level and @numrecs describe what the root currently holds.
+ *
+ * The location of the pointer array is derived from each buffer's size, so
+ * for a node root the pointers are moved even when the buffer itself stays
+ * put.  When the buffers differ, the block header and the records (leaf)
+ * or keys (node) are copied across as well.
+ *
+ * The function asserts that the ondisk form of the source root fits in the
+ * inode fork selected by @whichfork.
+ */
+static void
+xfs_rtrmapbt_broot_move(
+       struct xfs_inode        *ip,
+       int                     whichfork,
+       struct xfs_btree_block  *dst_broot,
+       size_t                  dst_bytes,
+       struct xfs_btree_block  *src_broot,
+       size_t                  src_bytes,
+       unsigned int            level,
+       unsigned int            numrecs)
+{
+       struct xfs_mount        *mp = ip->i_mount;
+       void                    *dptr;
+       void                    *sptr;
+
+       ASSERT(xfs_rtrmap_droot_space(src_broot) <=
+                       xfs_inode_fork_size(ip, whichfork));
+
+       /*
+        * We always have to move the pointers because they are not butted
+        * against the btree block header.
+        *
+        * NOTE(review): the element size used below is sizeof(xfs_fsblock_t)
+        * while the pointers are addressed as xfs_rtrmap_ptr_t; presumably
+        * the two types have the same width -- confirm.
+        */
+       if (numrecs && level > 0) {
+               sptr = xfs_rtrmap_broot_ptr_addr(mp, src_broot, 1, src_bytes);
+               dptr = xfs_rtrmap_broot_ptr_addr(mp, dst_broot, 1, dst_bytes);
+               memmove(dptr, sptr, numrecs * sizeof(xfs_fsblock_t));
+       }
+
+       if (src_broot == dst_broot)
+               return;
+
+       /*
+        * If the root is being totally relocated, we have to migrate the block
+        * header and the keys/records that come after it.
+        */
+       memcpy(dst_broot, src_broot, XFS_RTRMAP_BLOCK_LEN);
+
+       if (!numrecs)
+               return;
+
+       if (level == 0) {
+               sptr = xfs_rtrmap_rec_addr(src_broot, 1);
+               dptr = xfs_rtrmap_rec_addr(dst_broot, 1);
+               memcpy(dptr, sptr, numrecs * sizeof(struct xfs_rmap_rec));
+       } else {
+               sptr = xfs_rtrmap_key_addr(src_broot, 1);
+               dptr = xfs_rtrmap_key_addr(dst_broot, 1);
+               memcpy(dptr, sptr, numrecs * 2 * sizeof(struct xfs_rmap_key));
+       }
+}
+
+static const struct xfs_ifork_broot_ops xfs_rtrmapbt_iroot_ops = {
+       .maxrecs                = xfs_rtrmapbt_maxrecs, /* records for a block length */
+       .size                   = xfs_rtrmap_broot_space_calc, /* incore root bytes */
+       .move                   = xfs_rtrmapbt_broot_move, /* relocate root contents */
+};
+
 const struct xfs_btree_ops xfs_rtrmapbt_ops = {
        .name                   = "rtrmap",
        .type                   = XFS_BTREE_TYPE_INODE,
@@ -393,6 +484,7 @@ const struct xfs_btree_ops xfs_rtrmapbt_ops = {
        .free_block             = xfs_btree_free_metafile_block,
        .get_minrecs            = xfs_rtrmapbt_get_minrecs,
        .get_maxrecs            = xfs_rtrmapbt_get_maxrecs,
+       .get_dmaxrecs           = xfs_rtrmapbt_get_dmaxrecs,
        .init_key_from_rec      = xfs_rtrmapbt_init_key_from_rec,
        .init_high_key_from_rec = xfs_rtrmapbt_init_high_key_from_rec,
        .init_rec_from_cur      = xfs_rtrmapbt_init_rec_from_cur,
@@ -403,6 +495,7 @@ const struct xfs_btree_ops xfs_rtrmapbt_ops = {
        .keys_inorder           = xfs_rtrmapbt_keys_inorder,
        .recs_inorder           = xfs_rtrmapbt_recs_inorder,
        .keys_contiguous        = xfs_rtrmapbt_keys_contiguous,
+       .iroot_ops              = &xfs_rtrmapbt_iroot_ops,
 };
 
 /* Allocate a new rt rmap btree cursor. */
@@ -585,3 +678,130 @@ xfs_rtrmapbt_calc_reserves(
        return max_t(xfs_filblks_t, mp->m_rgblocks >> 6,
                        xfs_rtrmapbt_max_size(mp, mp->m_rgblocks));
 }
+
+/*
+ * Convert on-disk form of btree root to in-memory form.
+ *
+ * @dblock is the ondisk root and @dblocklen the number of bytes of fork
+ * space that holds it.  @rblock is the incore root buffer; nothing is
+ * allocated here, so it must already be big enough for the level and
+ * record count stored in @dblock (see xfs_rtrmap_broot_space).
+ *
+ * The incore block header is initialized with xfs_btree_init_block() and
+ * then bb_level and bb_numrecs are copied over without byte swapping.
+ * For a node root, the ondisk pointers are located using the maximum
+ * record count for @dblocklen, whereas the incore pointers are located
+ * from the incore root size.
+ */
+STATIC void
+xfs_rtrmapbt_from_disk(
+       struct xfs_inode        *ip,
+       struct xfs_rtrmap_root  *dblock,
+       unsigned int            dblocklen,
+       struct xfs_btree_block  *rblock)
+{
+       struct xfs_mount        *mp = ip->i_mount;
+       struct xfs_rmap_key     *fkp;
+       __be64                  *fpp;
+       struct xfs_rmap_key     *tkp;
+       __be64                  *tpp;
+       struct xfs_rmap_rec     *frp;
+       struct xfs_rmap_rec     *trp;
+       unsigned int            rblocklen = xfs_rtrmap_broot_space(mp, dblock);
+       unsigned int            numrecs;
+       unsigned int            maxrecs;
+
+       xfs_btree_init_block(mp, rblock, &xfs_rtrmapbt_ops, 0, 0, ip->i_ino);
+
+       rblock->bb_level = dblock->bb_level;
+       rblock->bb_numrecs = dblock->bb_numrecs;
+       numrecs = be16_to_cpu(dblock->bb_numrecs);
+
+       if (be16_to_cpu(rblock->bb_level) > 0) {
+               maxrecs = xfs_rtrmapbt_droot_maxrecs(dblocklen, false);
+               fkp = xfs_rtrmap_droot_key_addr(dblock, 1);
+               tkp = xfs_rtrmap_key_addr(rblock, 1);
+               fpp = xfs_rtrmap_droot_ptr_addr(dblock, 1, maxrecs);
+               tpp = xfs_rtrmap_broot_ptr_addr(mp, rblock, 1, rblocklen);
+               memcpy(tkp, fkp, 2 * sizeof(*fkp) * numrecs);
+               memcpy(tpp, fpp, sizeof(*fpp) * numrecs);
+       } else {
+               frp = xfs_rtrmap_droot_rec_addr(dblock, 1);
+               trp = xfs_rtrmap_rec_addr(rblock, 1);
+               memcpy(trp, frp, sizeof(*frp) * numrecs);
+       }
+}
+
+/*
+ * Load a realtime reverse mapping btree root in from disk.
+ *
+ * Reads the level and record count from the root header in @dip's data
+ * fork.  The root is rejected if its level exceeds mp->m_rtrmap_maxlevels
+ * or if the ondisk space computed for that level and record count is
+ * larger than the data fork.  Otherwise the incore root of @ip's data fork
+ * is allocated and filled in from the ondisk root.
+ *
+ * Returns 0 on success, or -EFSCORRUPTED if the header fails those checks.
+ *
+ * NOTE(review): the result of xfs_iroot_alloc() is not checked here;
+ * presumably it cannot fail -- confirm.
+ */
+int
+xfs_iformat_rtrmap(
+       struct xfs_inode        *ip,
+       struct xfs_dinode       *dip)
+{
+       struct xfs_mount        *mp = ip->i_mount;
+       struct xfs_ifork        *ifp = xfs_ifork_ptr(ip, XFS_DATA_FORK);
+       struct xfs_rtrmap_root  *dfp = XFS_DFORK_PTR(dip, XFS_DATA_FORK);
+       unsigned int            numrecs;
+       unsigned int            level;
+       int                     dsize;
+
+       dsize = XFS_DFORK_SIZE(dip, mp, XFS_DATA_FORK);
+       numrecs = be16_to_cpu(dfp->bb_numrecs);
+       level = be16_to_cpu(dfp->bb_level);
+
+       if (level > mp->m_rtrmap_maxlevels ||
+           xfs_rtrmap_droot_space_calc(level, numrecs) > dsize)
+               return -EFSCORRUPTED;
+
+       xfs_iroot_alloc(ip, XFS_DATA_FORK,
+                       xfs_rtrmap_broot_space_calc(mp, level, numrecs));
+       xfs_rtrmapbt_from_disk(ip, dfp, dsize, ifp->if_broot);
+       return 0;
+}
+
+/*
+ * Convert in-memory form of btree root to on-disk form.
+ *
+ * @rblock is the incore root and @rblocklen its size in bytes, which is
+ * used to locate the incore pointer array.  @dblock is the destination
+ * ondisk root and @dblocklen the fork space available for it, which is
+ * used to compute the maximum record count that locates the ondisk
+ * pointer array.
+ *
+ * The incore header is asserted to carry the rtrmap magic, the mount's
+ * metadata UUID, a null daddr and null sibling pointers.  Only bb_level
+ * and bb_numrecs are carried into the ondisk header, without byte
+ * swapping, followed by the records (leaf) or the keys and pointers (node).
+ */
+void
+xfs_rtrmapbt_to_disk(
+       struct xfs_mount        *mp,
+       struct xfs_btree_block  *rblock,
+       unsigned int            rblocklen,
+       struct xfs_rtrmap_root  *dblock,
+       unsigned int            dblocklen)
+{
+       struct xfs_rmap_key     *fkp;
+       __be64                  *fpp;
+       struct xfs_rmap_key     *tkp;
+       __be64                  *tpp;
+       struct xfs_rmap_rec     *frp;
+       struct xfs_rmap_rec     *trp;
+       unsigned int            numrecs;
+       unsigned int            maxrecs;
+
+       ASSERT(rblock->bb_magic == cpu_to_be32(XFS_RTRMAP_CRC_MAGIC));
+       ASSERT(uuid_equal(&rblock->bb_u.l.bb_uuid, &mp->m_sb.sb_meta_uuid));
+       ASSERT(rblock->bb_u.l.bb_blkno == cpu_to_be64(XFS_BUF_DADDR_NULL));
+       ASSERT(rblock->bb_u.l.bb_leftsib == cpu_to_be64(NULLFSBLOCK));
+       ASSERT(rblock->bb_u.l.bb_rightsib == cpu_to_be64(NULLFSBLOCK));
+
+       dblock->bb_level = rblock->bb_level;
+       dblock->bb_numrecs = rblock->bb_numrecs;
+       numrecs = be16_to_cpu(rblock->bb_numrecs);
+
+       if (be16_to_cpu(rblock->bb_level) > 0) {
+               maxrecs = xfs_rtrmapbt_droot_maxrecs(dblocklen, false);
+               fkp = xfs_rtrmap_key_addr(rblock, 1);
+               tkp = xfs_rtrmap_droot_key_addr(dblock, 1);
+               fpp = xfs_rtrmap_broot_ptr_addr(mp, rblock, 1, rblocklen);
+               tpp = xfs_rtrmap_droot_ptr_addr(dblock, 1, maxrecs);
+               memcpy(tkp, fkp, 2 * sizeof(*fkp) * numrecs);
+               memcpy(tpp, fpp, sizeof(*fpp) * numrecs);
+       } else {
+               frp = xfs_rtrmap_rec_addr(rblock, 1);
+               trp = xfs_rtrmap_droot_rec_addr(dblock, 1);
+               memcpy(trp, frp, sizeof(*frp) * numrecs);
+       }
+}
+
+/*
+ * Flush a realtime reverse mapping btree root out to disk.
+ *
+ * Converts the incore root of @ip's data fork into ondisk form, writing
+ * it into the data fork area of @dip.  The incore root is asserted to
+ * exist, to be non-empty, and to have an ondisk form that fits in the
+ * inode's data fork.
+ */
+void
+xfs_iflush_rtrmap(
+       struct xfs_inode        *ip,
+       struct xfs_dinode       *dip)
+{
+       struct xfs_ifork        *ifp = xfs_ifork_ptr(ip, XFS_DATA_FORK);
+       struct xfs_rtrmap_root  *dfp = XFS_DFORK_PTR(dip, XFS_DATA_FORK);
+
+       ASSERT(ifp->if_broot != NULL);
+       ASSERT(ifp->if_broot_bytes > 0);
+       ASSERT(xfs_rtrmap_droot_space(ifp->if_broot) <=
+                       xfs_inode_fork_size(ip, XFS_DATA_FORK));
+       xfs_rtrmapbt_to_disk(ip->i_mount, ifp->if_broot, ifp->if_broot_bytes,
+                       dfp, XFS_DFORK_SIZE(dip, ip->i_mount, XFS_DATA_FORK));
+}
index bb0ebc07f47e0f6245a77422d1d73455c65a6103..39471df846abc19bca9009c2d8cd3704fa0cf797 100644 (file)
@@ -26,6 +26,7 @@ void xfs_rtrmapbt_commit_staged_btree(struct xfs_btree_cur *cur,
 unsigned int xfs_rtrmapbt_maxrecs(struct xfs_mount *mp, unsigned int blocklen,
                bool leaf);
 void xfs_rtrmapbt_compute_maxlevels(struct xfs_mount *mp);
+unsigned int xfs_rtrmapbt_droot_maxrecs(unsigned int blocklen, bool leaf);
 
 /*
  * Addresses of records, keys, and pointers within an incore rtrmapbt block.
@@ -82,4 +83,115 @@ void xfs_rtrmapbt_destroy_cur_cache(void);
 
 xfs_filblks_t xfs_rtrmapbt_calc_reserves(struct xfs_mount *mp);
 
+/*
+ * Addresses of key, pointers, and records within an ondisk rtrmapbt block.
+ *
+ * All three helpers take a 1-based @index and compute the address relative
+ * to the first byte after the struct xfs_rtrmap_root header.  Records are
+ * packed back to back, each key slot is 2 * sizeof(struct xfs_rmap_key)
+ * bytes wide, and the pointer array starts after @maxrecs key slots.
+ */
+
+static inline struct xfs_rmap_rec *
+xfs_rtrmap_droot_rec_addr(
+       struct xfs_rtrmap_root  *block,
+       unsigned int            index)
+{
+       return (struct xfs_rmap_rec *)
+               ((char *)(block + 1) +
+                (index - 1) * sizeof(struct xfs_rmap_rec));
+}
+
+static inline struct xfs_rmap_key *
+xfs_rtrmap_droot_key_addr(
+       struct xfs_rtrmap_root  *block,
+       unsigned int            index)
+{
+       return (struct xfs_rmap_key *)
+               ((char *)(block + 1) +
+                (index - 1) * 2 * sizeof(struct xfs_rmap_key));
+}
+
+static inline xfs_rtrmap_ptr_t *
+xfs_rtrmap_droot_ptr_addr(
+       struct xfs_rtrmap_root  *block,
+       unsigned int            index,
+       unsigned int            maxrecs)
+{
+       return (xfs_rtrmap_ptr_t *)
+               ((char *)(block + 1) +
+                maxrecs * 2 * sizeof(struct xfs_rmap_key) +
+                (index - 1) * sizeof(xfs_rtrmap_ptr_t));
+}
+
+/*
+ * Address of pointers within the incore btree root.
+ *
+ * These are to be used when we know the size of the block and
+ * we don't have a cursor.
+ *
+ * @block_size is the size in bytes of the incore root @bb; it is turned
+ * into a node record count with xfs_rtrmapbt_maxrecs() and handed, along
+ * with @index, to xfs_rtrmap_ptr_addr().
+ */
+static inline xfs_rtrmap_ptr_t *
+xfs_rtrmap_broot_ptr_addr(
+       struct xfs_mount        *mp,
+       struct xfs_btree_block  *bb,
+       unsigned int            index,
+       unsigned int            block_size)
+{
+       return xfs_rtrmap_ptr_addr(bb, index,
+                       xfs_rtrmapbt_maxrecs(mp, block_size, false));
+}
+
+/*
+ * Compute the space required for the incore btree root containing the given
+ * number of records.
+ *
+ * The result is XFS_RTRMAP_BLOCK_LEN for the block header plus, per record,
+ * either one struct xfs_rmap_rec (@level == 0) or two struct xfs_rmap_key
+ * and one xfs_rtrmap_ptr_t (@level > 0).  @mp does not take part in the
+ * calculation.
+ */
+static inline size_t
+xfs_rtrmap_broot_space_calc(
+       struct xfs_mount        *mp,
+       unsigned int            level,
+       unsigned int            nrecs)
+{
+       size_t                  sz = XFS_RTRMAP_BLOCK_LEN;
+
+       if (level > 0)
+               return sz + nrecs * (2 * sizeof(struct xfs_rmap_key) +
+                                        sizeof(xfs_rtrmap_ptr_t));
+       return sz + nrecs * sizeof(struct xfs_rmap_rec);
+}
+
+/*
+ * Compute the space required for the incore btree root given the ondisk
+ * btree root block.
+ *
+ * The level and record count are read from the big-endian fields of the
+ * ondisk header @bb and passed to xfs_rtrmap_broot_space_calc().
+ */
+static inline size_t
+xfs_rtrmap_broot_space(struct xfs_mount *mp, struct xfs_rtrmap_root *bb)
+{
+       return xfs_rtrmap_broot_space_calc(mp, be16_to_cpu(bb->bb_level),
+                       be16_to_cpu(bb->bb_numrecs));
+}
+
+/*
+ * Compute the space required for the ondisk root block.
+ *
+ * The result is sizeof(struct xfs_rtrmap_root) for the header plus, per
+ * record, either one struct xfs_rmap_rec (@level == 0) or two
+ * struct xfs_rmap_key and one xfs_rtrmap_ptr_t (@level > 0).
+ */
+static inline size_t
+xfs_rtrmap_droot_space_calc(
+       unsigned int            level,
+       unsigned int            nrecs)
+{
+       size_t                  sz = sizeof(struct xfs_rtrmap_root);
+
+       if (level > 0)
+               return sz + nrecs * (2 * sizeof(struct xfs_rmap_key) +
+                                        sizeof(xfs_rtrmap_ptr_t));
+       return sz + nrecs * sizeof(struct xfs_rmap_rec);
+}
+
+/*
+ * Compute the space required for the ondisk root block given an incore root
+ * block.
+ *
+ * The level and record count are read from the big-endian fields of the
+ * incore block header @bb and passed to xfs_rtrmap_droot_space_calc().
+ */
+static inline size_t
+xfs_rtrmap_droot_space(struct xfs_btree_block *bb)
+{
+       return xfs_rtrmap_droot_space_calc(be16_to_cpu(bb->bb_level),
+                       be16_to_cpu(bb->bb_numrecs));
+}
+
+int xfs_iformat_rtrmap(struct xfs_inode *ip, struct xfs_dinode *dip);
+void xfs_rtrmapbt_to_disk(struct xfs_mount *mp, struct xfs_btree_block *rblock,
+               unsigned int rblocklen, struct xfs_rtrmap_root *dblock,
+               unsigned int dblocklen);
+void xfs_iflush_rtrmap(struct xfs_inode *ip, struct xfs_dinode *dip);
+
 #endif /* __XFS_RTRMAP_BTREE_H__ */
index 5ab111a30dfacda1e62d6f995f341b3bb55fc34b..26543e1b7599086a0045b9b3e22b8b52c0cab156 100644 (file)
@@ -22,6 +22,7 @@
 #include "xfs_log_recover.h"
 #include "xfs_icache.h"
 #include "xfs_bmap_btree.h"
+#include "xfs_rtrmap_btree.h"
 
 STATIC void
 xlog_recover_inode_ra_pass2(
@@ -269,6 +270,31 @@ xlog_dinode_verify_extent_counts(
        return 0;
 }
 
+static inline int
+xlog_recover_inode_dbroot(
+       struct xfs_mount        *mp,
+       void                    *src,
+       unsigned int            len,
+       struct xfs_dinode       *dip)
+{
+       void                    *dfork = XFS_DFORK_DPTR(dip);   /* ondisk data fork */
+       unsigned int            dsize = XFS_DFORK_DSIZE(dip, mp);       /* its size */
+
+       switch (dip->di_format) {       /* fork format selects the converter */
+       case XFS_DINODE_FMT_BTREE:
+               xfs_bmbt_to_bmdr(mp, src, len, dfork, dsize);
+               break;
+       case XFS_DINODE_FMT_RMAP:
+               xfs_rtrmapbt_to_disk(mp, src, len, dfork, dsize);
+               break;
+       default:
+               ASSERT(0);      /* no converter for any other format */
+               return -EFSCORRUPTED;
+       }
+
+       return 0;
+}
+
 STATIC int
 xlog_recover_inode_commit_pass2(
        struct xlog                     *log,
@@ -479,9 +505,9 @@ xlog_recover_inode_commit_pass2(
                break;
 
        case XFS_ILOG_DBROOT:
-               xfs_bmbt_to_bmdr(mp, (struct xfs_btree_block *)src, len,
-                                (struct xfs_bmdr_block *)XFS_DFORK_DPTR(dip),
-                                XFS_DFORK_DSIZE(dip, mp));
+               error = xlog_recover_inode_dbroot(mp, src, len, dip);
+               if (error)
+                       goto out_release;
                break;
 
        default: