Re: [PATCH 028/119] xfs: define the on-disk rmap btree format

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 



On Thu, Jun 16, 2016 at 06:20:52PM -0700, Darrick J. Wong wrote:
> From: Dave Chinner <dchinner@xxxxxxxxxx>
> 
> Now we have all the surrounding call infrastructure in place, we can
> start filling out the rmap btree implementation. Start with the
> on-disk btree format; add everything needed to read, write and
> manipulate rmap btree blocks. This prepares the way for adding the
> btree operations implementation.
> 
> [darrick: record owner and offset info in rmap btree]
> [darrick: fork, bmbt and unwritten state in rmap btree]
> [darrick: flags are a separate field in xfs_rmap_irec]
> [darrick: calculate maxlevels separately]
> [darrick: move the 'unwritten' bit into unused parts of rm_offset]
> 
> Signed-off-by: Dave Chinner <dchinner@xxxxxxxxxx>
> Signed-off-by: Darrick J. Wong <darrick.wong@xxxxxxxxxx>
> Reviewed-by: Dave Chinner <dchinner@xxxxxxxxxx>
> Signed-off-by: Dave Chinner <david@xxxxxxxxxxxxx>
> ---
>  fs/xfs/Makefile                |    1 
>  fs/xfs/libxfs/xfs_btree.c      |    3 +
>  fs/xfs/libxfs/xfs_btree.h      |   18 ++--
>  fs/xfs/libxfs/xfs_format.h     |  140 +++++++++++++++++++++++++++++++
>  fs/xfs/libxfs/xfs_rmap_btree.c |  180 ++++++++++++++++++++++++++++++++++++++++
>  fs/xfs/libxfs/xfs_rmap_btree.h |   32 +++++++
>  fs/xfs/libxfs/xfs_sb.c         |    6 +
>  fs/xfs/libxfs/xfs_shared.h     |    2 
>  fs/xfs/xfs_mount.c             |    2 
>  fs/xfs/xfs_mount.h             |    3 +
>  fs/xfs/xfs_ondisk.h            |    3 +
>  fs/xfs/xfs_trace.h             |    2 
>  12 files changed, 384 insertions(+), 8 deletions(-)
>  create mode 100644 fs/xfs/libxfs/xfs_rmap_btree.c
> 
> 
...
> diff --git a/fs/xfs/libxfs/xfs_rmap_btree.c b/fs/xfs/libxfs/xfs_rmap_btree.c
> new file mode 100644
> index 0000000..7a35c78
> --- /dev/null
> +++ b/fs/xfs/libxfs/xfs_rmap_btree.c
> @@ -0,0 +1,180 @@
...
> +static bool
> +xfs_rmapbt_verify(
> +	struct xfs_buf		*bp)
> +{
> +	struct xfs_mount	*mp = bp->b_target->bt_mount;
> +	struct xfs_btree_block	*block = XFS_BUF_TO_BLOCK(bp);
> +	struct xfs_perag	*pag = bp->b_pag;
> +	unsigned int		level;
> +
> +	/*
> +	 * magic number and level verification
> +	 *
> +	 * During growfs operations, we can't verify the exact level or owner as
> +	 * the perag is not fully initialised and hence not attached to the
> +	 * buffer.  In this case, check against the maximum tree depth.
> +	 *
> +	 * Similarly, during log recovery we will have a perag structure
> +	 * attached, but the agf information will not yet have been initialised
> +	 * from the on disk AGF. Again, we can only check against maximum limits
> +	 * in this case.
> +	 */
> +	if (block->bb_magic != cpu_to_be32(XFS_RMAP_CRC_MAGIC))
> +		return false;
> +
> +	if (!xfs_sb_version_hasrmapbt(&mp->m_sb))
> +		return false;
> +	if (!xfs_btree_sblock_v5hdr_verify(bp))
> +		return false;
> +
> +	level = be16_to_cpu(block->bb_level);
> +	if (pag && pag->pagf_init) {
> +		if (level >= pag->pagf_levels[XFS_BTNUM_RMAPi])
> +			return false;
> +	} else if (level >= mp->m_rmap_maxlevels)
> +		return false;

It looks like the above (level >= mp->m_rmap_maxlevels) check could be
independent (rather than an 'else). Otherwise looks good:

Reviewed-by: Brian Foster <bfoster@xxxxxxxxxx>

> +
> +	return xfs_btree_sblock_verify(bp, mp->m_rmap_mxr[level != 0]);
> +}
> +
> +static void
> +xfs_rmapbt_read_verify(
> +	struct xfs_buf	*bp)
> +{
> +	if (!xfs_btree_sblock_verify_crc(bp))
> +		xfs_buf_ioerror(bp, -EFSBADCRC);
> +	else if (!xfs_rmapbt_verify(bp))
> +		xfs_buf_ioerror(bp, -EFSCORRUPTED);
> +
> +	if (bp->b_error) {
> +		trace_xfs_btree_corrupt(bp, _RET_IP_);
> +		xfs_verifier_error(bp);
> +	}
> +}
> +
> +static void
> +xfs_rmapbt_write_verify(
> +	struct xfs_buf	*bp)
> +{
> +	if (!xfs_rmapbt_verify(bp)) {
> +		trace_xfs_btree_corrupt(bp, _RET_IP_);
> +		xfs_buf_ioerror(bp, -EFSCORRUPTED);
> +		xfs_verifier_error(bp);
> +		return;
> +	}
> +	xfs_btree_sblock_calc_crc(bp);
> +
> +}
> +
> +const struct xfs_buf_ops xfs_rmapbt_buf_ops = {
> +	.name			= "xfs_rmapbt",
> +	.verify_read		= xfs_rmapbt_read_verify,
> +	.verify_write		= xfs_rmapbt_write_verify,
> +};
> +
> +static const struct xfs_btree_ops xfs_rmapbt_ops = {
> +	.rec_len		= sizeof(struct xfs_rmap_rec),
> +	.key_len		= sizeof(struct xfs_rmap_key),
> +
> +	.dup_cursor		= xfs_rmapbt_dup_cursor,
> +	.buf_ops		= &xfs_rmapbt_buf_ops,
> +};
> +
> +/*
> + * Allocate a new allocation btree cursor.
> + */
> +struct xfs_btree_cur *
> +xfs_rmapbt_init_cursor(
> +	struct xfs_mount	*mp,
> +	struct xfs_trans	*tp,
> +	struct xfs_buf		*agbp,
> +	xfs_agnumber_t		agno)
> +{
> +	struct xfs_agf		*agf = XFS_BUF_TO_AGF(agbp);
> +	struct xfs_btree_cur	*cur;
> +
> +	cur = kmem_zone_zalloc(xfs_btree_cur_zone, KM_NOFS);
> +	cur->bc_tp = tp;
> +	cur->bc_mp = mp;
> +	cur->bc_btnum = XFS_BTNUM_RMAP;
> +	cur->bc_flags = XFS_BTREE_CRC_BLOCKS;
> +	cur->bc_blocklog = mp->m_sb.sb_blocklog;
> +	cur->bc_ops = &xfs_rmapbt_ops;
> +	cur->bc_nlevels = be32_to_cpu(agf->agf_levels[XFS_BTNUM_RMAP]);
> +
> +	cur->bc_private.a.agbp = agbp;
> +	cur->bc_private.a.agno = agno;
> +
> +	return cur;
> +}
> +
> +/*
> + * Calculate number of records in an rmap btree block.
> + */
> +int
> +xfs_rmapbt_maxrecs(
> +	struct xfs_mount	*mp,
> +	int			blocklen,
> +	int			leaf)
> +{
> +	blocklen -= XFS_RMAP_BLOCK_LEN;
> +
> +	if (leaf)
> +		return blocklen / sizeof(struct xfs_rmap_rec);
> +	return blocklen /
> +		(sizeof(struct xfs_rmap_key) + sizeof(xfs_rmap_ptr_t));
> +}
> +
> +/* Compute the maximum height of an rmap btree. */
> +void
> +xfs_rmapbt_compute_maxlevels(
> +	struct xfs_mount		*mp)
> +{
> +	mp->m_rmap_maxlevels = xfs_btree_compute_maxlevels(mp,
> +			mp->m_rmap_mnr, mp->m_sb.sb_agblocks);
> +}
> diff --git a/fs/xfs/libxfs/xfs_rmap_btree.h b/fs/xfs/libxfs/xfs_rmap_btree.h
> index a3b8f90..462767f 100644
> --- a/fs/xfs/libxfs/xfs_rmap_btree.h
> +++ b/fs/xfs/libxfs/xfs_rmap_btree.h
> @@ -19,6 +19,38 @@
>  #define	__XFS_RMAP_BTREE_H__
>  
>  struct xfs_buf;
> +struct xfs_btree_cur;
> +struct xfs_mount;
> +
> +/* rmaps only exist on crc enabled filesystems */
> +#define XFS_RMAP_BLOCK_LEN	XFS_BTREE_SBLOCK_CRC_LEN
> +
> +/*
> + * Record, key, and pointer address macros for btree blocks.
> + *
> + * (note that some of these may appear unused, but they are used in userspace)
> + */
> +#define XFS_RMAP_REC_ADDR(block, index) \
> +	((struct xfs_rmap_rec *) \
> +		((char *)(block) + XFS_RMAP_BLOCK_LEN + \
> +		 (((index) - 1) * sizeof(struct xfs_rmap_rec))))
> +
> +#define XFS_RMAP_KEY_ADDR(block, index) \
> +	((struct xfs_rmap_key *) \
> +		((char *)(block) + XFS_RMAP_BLOCK_LEN + \
> +		 ((index) - 1) * sizeof(struct xfs_rmap_key)))
> +
> +#define XFS_RMAP_PTR_ADDR(block, index, maxrecs) \
> +	((xfs_rmap_ptr_t *) \
> +		((char *)(block) + XFS_RMAP_BLOCK_LEN + \
> +		 (maxrecs) * sizeof(struct xfs_rmap_key) + \
> +		 ((index) - 1) * sizeof(xfs_rmap_ptr_t)))
> +
> +struct xfs_btree_cur *xfs_rmapbt_init_cursor(struct xfs_mount *mp,
> +				struct xfs_trans *tp, struct xfs_buf *bp,
> +				xfs_agnumber_t agno);
> +int xfs_rmapbt_maxrecs(struct xfs_mount *mp, int blocklen, int leaf);
> +extern void xfs_rmapbt_compute_maxlevels(struct xfs_mount *mp);
>  
>  int xfs_rmap_alloc(struct xfs_trans *tp, struct xfs_buf *agbp,
>  		   xfs_agnumber_t agno, xfs_agblock_t bno, xfs_extlen_t len,
> diff --git a/fs/xfs/libxfs/xfs_sb.c b/fs/xfs/libxfs/xfs_sb.c
> index a544686..f86226b 100644
> --- a/fs/xfs/libxfs/xfs_sb.c
> +++ b/fs/xfs/libxfs/xfs_sb.c
> @@ -37,6 +37,7 @@
>  #include "xfs_alloc_btree.h"
>  #include "xfs_ialloc_btree.h"
>  #include "xfs_log.h"
> +#include "xfs_rmap_btree.h"
>  
>  /*
>   * Physical superblock buffer manipulations. Shared with libxfs in userspace.
> @@ -734,6 +735,11 @@ xfs_sb_mount_common(
>  	mp->m_bmap_dmnr[0] = mp->m_bmap_dmxr[0] / 2;
>  	mp->m_bmap_dmnr[1] = mp->m_bmap_dmxr[1] / 2;
>  
> +	mp->m_rmap_mxr[0] = xfs_rmapbt_maxrecs(mp, sbp->sb_blocksize, 1);
> +	mp->m_rmap_mxr[1] = xfs_rmapbt_maxrecs(mp, sbp->sb_blocksize, 0);
> +	mp->m_rmap_mnr[0] = mp->m_rmap_mxr[0] / 2;
> +	mp->m_rmap_mnr[1] = mp->m_rmap_mxr[1] / 2;
> +
>  	mp->m_bsize = XFS_FSB_TO_BB(mp, 1);
>  	mp->m_ialloc_inos = (int)MAX((__uint16_t)XFS_INODES_PER_CHUNK,
>  					sbp->sb_inopblock);
> diff --git a/fs/xfs/libxfs/xfs_shared.h b/fs/xfs/libxfs/xfs_shared.h
> index 16002b5..0c5b30b 100644
> --- a/fs/xfs/libxfs/xfs_shared.h
> +++ b/fs/xfs/libxfs/xfs_shared.h
> @@ -38,6 +38,7 @@ extern const struct xfs_buf_ops xfs_agi_buf_ops;
>  extern const struct xfs_buf_ops xfs_agf_buf_ops;
>  extern const struct xfs_buf_ops xfs_agfl_buf_ops;
>  extern const struct xfs_buf_ops xfs_allocbt_buf_ops;
> +extern const struct xfs_buf_ops xfs_rmapbt_buf_ops;
>  extern const struct xfs_buf_ops xfs_attr3_leaf_buf_ops;
>  extern const struct xfs_buf_ops xfs_attr3_rmt_buf_ops;
>  extern const struct xfs_buf_ops xfs_bmbt_buf_ops;
> @@ -116,6 +117,7 @@ int	xfs_log_calc_minimum_size(struct xfs_mount *);
>  #define	XFS_INO_BTREE_REF	3
>  #define	XFS_ALLOC_BTREE_REF	2
>  #define	XFS_BMAP_BTREE_REF	2
> +#define	XFS_RMAP_BTREE_REF	2
>  #define	XFS_DIR_BTREE_REF	2
>  #define	XFS_INO_REF		2
>  #define	XFS_ATTR_BTREE_REF	1
> diff --git a/fs/xfs/xfs_mount.c b/fs/xfs/xfs_mount.c
> index b4153f0..8af1c88 100644
> --- a/fs/xfs/xfs_mount.c
> +++ b/fs/xfs/xfs_mount.c
> @@ -42,6 +42,7 @@
>  #include "xfs_trace.h"
>  #include "xfs_icache.h"
>  #include "xfs_sysfs.h"
> +#include "xfs_rmap_btree.h"
>  
>  
>  static DEFINE_MUTEX(xfs_uuid_table_mutex);
> @@ -680,6 +681,7 @@ xfs_mountfs(
>  	xfs_bmap_compute_maxlevels(mp, XFS_DATA_FORK);
>  	xfs_bmap_compute_maxlevels(mp, XFS_ATTR_FORK);
>  	xfs_ialloc_compute_maxlevels(mp);
> +	xfs_rmapbt_compute_maxlevels(mp);
>  
>  	xfs_set_maxicount(mp);
>  
> diff --git a/fs/xfs/xfs_mount.h b/fs/xfs/xfs_mount.h
> index 0537b1f..0ed0f29 100644
> --- a/fs/xfs/xfs_mount.h
> +++ b/fs/xfs/xfs_mount.h
> @@ -116,9 +116,12 @@ typedef struct xfs_mount {
>  	uint			m_bmap_dmnr[2];	/* min bmap btree records */
>  	uint			m_inobt_mxr[2];	/* max inobt btree records */
>  	uint			m_inobt_mnr[2];	/* min inobt btree records */
> +	uint			m_rmap_mxr[2];	/* max rmap btree records */
> +	uint			m_rmap_mnr[2];	/* min rmap btree records */
>  	uint			m_ag_maxlevels;	/* XFS_AG_MAXLEVELS */
>  	uint			m_bm_maxlevels[2]; /* XFS_BM_MAXLEVELS */
>  	uint			m_in_maxlevels;	/* max inobt btree levels. */
> +	uint			m_rmap_maxlevels; /* max rmap btree levels */
>  	xfs_extlen_t		m_ag_prealloc_blocks; /* reserved ag blocks */
>  	struct radix_tree_root	m_perag_tree;	/* per-ag accounting info */
>  	spinlock_t		m_perag_lock;	/* lock for m_perag_tree */
> diff --git a/fs/xfs/xfs_ondisk.h b/fs/xfs/xfs_ondisk.h
> index 0272301..48d544f 100644
> --- a/fs/xfs/xfs_ondisk.h
> +++ b/fs/xfs/xfs_ondisk.h
> @@ -47,11 +47,14 @@ xfs_check_ondisk_structs(void)
>  	XFS_CHECK_STRUCT_SIZE(struct xfs_dsymlink_hdr,		56);
>  	XFS_CHECK_STRUCT_SIZE(struct xfs_inobt_key,		4);
>  	XFS_CHECK_STRUCT_SIZE(struct xfs_inobt_rec,		16);
> +	XFS_CHECK_STRUCT_SIZE(struct xfs_rmap_key,		20);
> +	XFS_CHECK_STRUCT_SIZE(struct xfs_rmap_rec,		24);
>  	XFS_CHECK_STRUCT_SIZE(struct xfs_timestamp,		8);
>  	XFS_CHECK_STRUCT_SIZE(xfs_alloc_key_t,			8);
>  	XFS_CHECK_STRUCT_SIZE(xfs_alloc_ptr_t,			4);
>  	XFS_CHECK_STRUCT_SIZE(xfs_alloc_rec_t,			8);
>  	XFS_CHECK_STRUCT_SIZE(xfs_inobt_ptr_t,			4);
> +	XFS_CHECK_STRUCT_SIZE(xfs_rmap_ptr_t,			4);
>  
>  	/* dir/attr trees */
>  	XFS_CHECK_STRUCT_SIZE(struct xfs_attr3_leaf_hdr,	80);
> diff --git a/fs/xfs/xfs_trace.h b/fs/xfs/xfs_trace.h
> index 4872fbd..b4ee9c8 100644
> --- a/fs/xfs/xfs_trace.h
> +++ b/fs/xfs/xfs_trace.h
> @@ -2444,6 +2444,8 @@ DECLARE_EVENT_CLASS(xfs_rmap_class,
>  		__entry->owner = oinfo->oi_owner;
>  		__entry->offset = oinfo->oi_offset;
>  		__entry->flags = oinfo->oi_flags;
> +		if (unwritten)
> +			__entry->flags |= XFS_RMAP_UNWRITTEN;
>  	),
>  	TP_printk("dev %d:%d agno %u agbno %u len %u owner %lld offset %llu flags 0x%lx",
>  		  MAJOR(__entry->dev), MINOR(__entry->dev),
> 
> _______________________________________________
> xfs mailing list
> xfs@xxxxxxxxxxx
> http://oss.sgi.com/mailman/listinfo/xfs
--
To unsubscribe from this list: send the line "unsubscribe linux-fsdevel" in
the body of a message to majordomo@xxxxxxxxxxxxxxx
More majordomo info at  http://vger.kernel.org/majordomo-info.html



[Index of Archives]     [Linux Ext4 Filesystem]     [Union Filesystem]     [Filesystem Testing]     [Ceph Users]     [Ecryptfs]     [AutoFS]     [Kernel Newbies]     [Share Photos]     [Security]     [Netfilter]     [Bugtraq]     [Yosemite News]     [MIPS Linux]     [ARM Linux]     [Linux Security]     [Linux Cachefs]     [Reiser Filesystem]     [Linux RAID]     [Samba]     [Device Mapper]     [CEPH Development]
  Powered by Linux