Re: [PATCH 07/15] xfs: automatic dfops buffer relogging

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 



On Mon, Jul 30, 2018 at 01:20:37PM -0700, Darrick J. Wong wrote:
> On Mon, Jul 30, 2018 at 12:45:12PM -0400, Brian Foster wrote:
> > Buffers that are held across deferred operations are explicitly
> > joined to the dfops structure to ensure appropriate relogging.
> > While buffers are currently joined explicitly, we can detect the
> > conditions that require relogging at dfops finish time by inspecting
> > the transaction item list for held buffers.
> > 
> > Replace the xfs_defer_bjoin() infrastructure with such detection and
> > automatic relogging of held buffers. This eliminates the need for
> > the per-dfops buffer list, replaced by an on-stack variant in
> > xfs_defer_trans_roll().
> > 
> > Signed-off-by: Brian Foster <bfoster@xxxxxxxxxx>
> > ---
> >  fs/xfs/libxfs/xfs_attr.c  |  1 -
> >  fs/xfs/libxfs/xfs_defer.c | 55 ++++++++++++++++-----------------------
> >  fs/xfs/libxfs/xfs_defer.h |  1 -
> >  fs/xfs/xfs_dquot.c        |  1 -
> >  fs/xfs/xfs_trans.h        |  1 -
> >  5 files changed, 23 insertions(+), 36 deletions(-)
> > 
...
> > diff --git a/fs/xfs/libxfs/xfs_defer.c b/fs/xfs/libxfs/xfs_defer.c
> > index 0306187b5f56..d0ee55048a7a 100644
> > --- a/fs/xfs/libxfs/xfs_defer.c
> > +++ b/fs/xfs/libxfs/xfs_defer.c
...
> > @@ -235,9 +240,21 @@ xfs_defer_trans_roll(
> >  	for (i = 0; i < XFS_DEFER_OPS_NR_INODES && dop->dop_inodes[i]; i++)
> >  		xfs_trans_log_inode(*tp, dop->dop_inodes[i], XFS_ILOG_CORE);
> >  
> > -	/* Hold the (previously bjoin'd) buffer locked across the roll. */
> > -	for (i = 0; i < XFS_DEFER_OPS_NR_BUFS && dop->dop_bufs[i]; i++)
> > -		xfs_trans_dirty_buf(*tp, dop->dop_bufs[i]);
> > +	list_for_each_entry(lip, &(*tp)->t_items, li_trans) {
> > +		switch (lip->li_type) {
> > +		case XFS_LI_BUF:
> > +			bli = container_of(lip, struct xfs_buf_log_item,
> > +					   bli_item);
> > +			if (bli->bli_flags & XFS_BLI_HOLD) {
> > +				ASSERT(bpcount < XFS_DEFER_OPS_NR_BUFS);
> 
> This is a bit of a behavior change -- previously if we overflowed the
> array we'd bail out with -EFSCORRUPTED rather than go corrupting
> whatever came after dop_bufs.  Granted, we were pretty terrible about
> checking the return values, but I think this ought to be:
> 
> if (bpcount >= XFS_DEFER_OPS_NR_BUFS) {
> 	ASSERT(0);
> 	return -EFSCORRUPTED;
> }
> 
> rather than corrupting the on-stack array if we happen to bhold too many
> buffers to the transaction.
> 

Yup, good point. I'll fix up the error checking in both of these
patches.

Brian

> --D
> 
> > +				xfs_trans_dirty_buf(*tp, bli->bli_buf);
> > +				bplist[bpcount++] = bli->bli_buf;
> > +			}
> > +			break;
> > +		default:
> > +			break;
> > +		}
> > +	}
> >  
> >  	trace_xfs_defer_trans_roll((*tp)->t_mountp, dop, _RET_IP_);
> >  
> > @@ -255,9 +272,9 @@ xfs_defer_trans_roll(
> >  		xfs_trans_ijoin(*tp, dop->dop_inodes[i], 0);
> >  
> >  	/* Rejoin the buffers and dirty them so the log moves forward. */
> > -	for (i = 0; i < XFS_DEFER_OPS_NR_BUFS && dop->dop_bufs[i]; i++) {
> > -		xfs_trans_bjoin(*tp, dop->dop_bufs[i]);
> > -		xfs_trans_bhold(*tp, dop->dop_bufs[i]);
> > +	for (i = 0; i < bpcount; i++) {
> > +		xfs_trans_bjoin(*tp, bplist[i]);
> > +		xfs_trans_bhold(*tp, bplist[i]);
> >  	}
> >  
> >  	return error;
> > @@ -295,30 +312,6 @@ xfs_defer_ijoin(
> >  	return -EFSCORRUPTED;
> >  }
> >  
> > -/*
> > - * Add this buffer to the deferred op.  Each joined buffer is relogged
> > - * each time we roll the transaction.
> > - */
> > -int
> > -xfs_defer_bjoin(
> > -	struct xfs_defer_ops		*dop,
> > -	struct xfs_buf			*bp)
> > -{
> > -	int				i;
> > -
> > -	for (i = 0; i < XFS_DEFER_OPS_NR_BUFS; i++) {
> > -		if (dop->dop_bufs[i] == bp)
> > -			return 0;
> > -		else if (dop->dop_bufs[i] == NULL) {
> > -			dop->dop_bufs[i] = bp;
> > -			return 0;
> > -		}
> > -	}
> > -
> > -	ASSERT(0);
> > -	return -EFSCORRUPTED;
> > -}
> > -
> >  /*
> >   * Reset an already used dfops after finish.
> >   */
> > @@ -331,7 +324,6 @@ xfs_defer_reset(
> >  	ASSERT(!xfs_defer_has_unfinished_work(dop));
> >  
> >  	memset(dop->dop_inodes, 0, sizeof(dop->dop_inodes));
> > -	memset(dop->dop_bufs, 0, sizeof(dop->dop_bufs));
> >  
> >  	/*
> >  	 * Low mode state transfers across transaction rolls to mirror dfops
> > @@ -594,7 +586,6 @@ xfs_defer_move(
> >  	list_splice_init(&src->dop_pending, &dst->dop_pending);
> >  
> >  	memcpy(dst->dop_inodes, src->dop_inodes, sizeof(dst->dop_inodes));
> > -	memcpy(dst->dop_bufs, src->dop_bufs, sizeof(dst->dop_bufs));
> >  
> >  	/*
> >  	 * Low free space mode was historically controlled by a dfops field.
> > diff --git a/fs/xfs/libxfs/xfs_defer.h b/fs/xfs/libxfs/xfs_defer.h
> > index 8908a2716774..4a8bb838adf2 100644
> > --- a/fs/xfs/libxfs/xfs_defer.h
> > +++ b/fs/xfs/libxfs/xfs_defer.h
> > @@ -43,7 +43,6 @@ void xfs_defer_cancel(struct xfs_trans *);
> >  void xfs_defer_init(struct xfs_trans *tp, struct xfs_defer_ops *dop);
> >  bool xfs_defer_has_unfinished_work(struct xfs_defer_ops *dop);
> >  int xfs_defer_ijoin(struct xfs_defer_ops *dop, struct xfs_inode *ip);
> > -int xfs_defer_bjoin(struct xfs_defer_ops *dop, struct xfs_buf *bp);
> >  void xfs_defer_move(struct xfs_trans *dtp, struct xfs_trans *stp);
> >  
> >  /* Description of a deferred type. */
> > diff --git a/fs/xfs/xfs_dquot.c b/fs/xfs/xfs_dquot.c
> > index da5c55cec966..e1196854dbcd 100644
> > --- a/fs/xfs/xfs_dquot.c
> > +++ b/fs/xfs/xfs_dquot.c
> > @@ -362,7 +362,6 @@ xfs_dquot_disk_alloc(
> >  	 * manually or by committing the transaction.
> >  	 */
> >  	xfs_trans_bhold(tp, bp);
> > -	error = xfs_defer_bjoin(tp->t_dfops, bp);
> >  	if (error) {
> >  		xfs_trans_bhold_release(tp, bp);
> >  		xfs_trans_brelse(tp, bp);
> > diff --git a/fs/xfs/xfs_trans.h b/fs/xfs/xfs_trans.h
> > index 7e493221160e..581456c79197 100644
> > --- a/fs/xfs/xfs_trans.h
> > +++ b/fs/xfs/xfs_trans.h
> > @@ -100,7 +100,6 @@ struct xfs_defer_ops {
> >  
> >  	/* relog these with each roll */
> >  	struct xfs_inode	*dop_inodes[XFS_DEFER_OPS_NR_INODES];
> > -	struct xfs_buf		*dop_bufs[XFS_DEFER_OPS_NR_BUFS];
> >  };
> >  
> >  /*
> > -- 
> > 2.17.1
> > 
> > --
> > To unsubscribe from this list: send the line "unsubscribe linux-xfs" in
> > the body of a message to majordomo@xxxxxxxxxxxxxxx
> > More majordomo info at  http://vger.kernel.org/majordomo-info.html
> --
> To unsubscribe from this list: send the line "unsubscribe linux-xfs" in
> the body of a message to majordomo@xxxxxxxxxxxxxxx
> More majordomo info at  http://vger.kernel.org/majordomo-info.html
--
To unsubscribe from this list: send the line "unsubscribe linux-xfs" in
the body of a message to majordomo@xxxxxxxxxxxxxxx
More majordomo info at  http://vger.kernel.org/majordomo-info.html



[Index of Archives]     [XFS Filesystem Development (older mail)]     [Linux Filesystem Development]     [Linux Audio Users]     [Yosemite Trails]     [Linux Kernel]     [Linux RAID]     [Linux SCSI]


  Powered by Linux