On Fri, Sep 30, 2016 at 03:22:14PM -0400, Brian Foster wrote: > On Thu, Sep 29, 2016 at 08:07:45PM -0700, Darrick J. Wong wrote: > > Provide a mechanism for higher levels to create BUI/BUD items, submit > > them to the log, and a stub function to deal with recovered BUI items. > > These parts will be connected to the rmapbt in a later patch. > > > > Signed-off-by: Darrick J. Wong <darrick.wong@xxxxxxxxxx> > > --- > > v2: Only support one item per BUI. > > --- > > fs/xfs/Makefile | 1 > > fs/xfs/libxfs/xfs_bmap.h | 14 ++++ > > fs/xfs/xfs_bmap_item.c | 69 ++++++++++++++++++ > > fs/xfs/xfs_bmap_item.h | 1 > > fs/xfs/xfs_log_recover.c | 177 ++++++++++++++++++++++++++++++++++++++++++++++ > > fs/xfs/xfs_trans.h | 13 +++ > > fs/xfs/xfs_trans_bmap.c | 84 ++++++++++++++++++++++ > > 7 files changed, 359 insertions(+) > > create mode 100644 fs/xfs/xfs_trans_bmap.c > > > > > ... > > diff --git a/fs/xfs/xfs_bmap_item.c b/fs/xfs/xfs_bmap_item.c > > index ea736af..4e46b63 100644 > > --- a/fs/xfs/xfs_bmap_item.c > > +++ b/fs/xfs/xfs_bmap_item.c > ... > > @@ -372,3 +378,66 @@ xfs_bud_init( > > > > return budp; > > } > > + > > +/* > > + * Process a bmap update intent item that was recovered from the log. > > + * We need to update some inode's bmbt. > > + */ > > +int > > +xfs_bui_recover( > > + struct xfs_mount *mp, > > + struct xfs_bui_log_item *buip) > > +{ > > + int error = 0; > > + struct xfs_map_extent *bmap; > > + xfs_fsblock_t startblock_fsb; > > + xfs_fsblock_t inode_fsb; > > + bool op_ok; > > + > > + ASSERT(!test_bit(XFS_BUI_RECOVERED, &buip->bui_flags)); > > + > > + /* Only one mapping operation per BUI... */ > > + if (buip->bui_format.bui_nextents != XFS_BUI_MAX_FAST_EXTENTS) { > > + set_bit(XFS_BUI_RECOVERED, &buip->bui_flags); > > + xfs_bui_release(buip); > > + return -EIO; > > + } > > + > > + /* > > + * First check the validity of the extent described by the > > + * BUI. If anything is bad, then toss the BUI. 
> > + */ > > + bmap = &buip->bui_format.bui_extents[0]; > > + startblock_fsb = XFS_BB_TO_FSB(mp, > > + XFS_FSB_TO_DADDR(mp, bmap->me_startblock)); > > + inode_fsb = XFS_BB_TO_FSB(mp, XFS_FSB_TO_DADDR(mp, > > + XFS_INO_TO_FSB(mp, bmap->me_owner))); > > + switch (bmap->me_flags & XFS_BMAP_EXTENT_TYPE_MASK) { > > + case XFS_BMAP_MAP: > > + case XFS_BMAP_UNMAP: > > + op_ok = true; > > + break; > > + default: > > + op_ok = false; > > + break; > > + } > > + if (!op_ok || startblock_fsb == 0 || > > + bmap->me_len == 0 || > > + inode_fsb == 0 || > > + startblock_fsb >= mp->m_sb.sb_dblocks || > > + bmap->me_len >= mp->m_sb.sb_agblocks || > > + inode_fsb >= mp->m_sb.sb_agblocks || > > Did you mean sb_dblocks here? Yes, thank you. I'll fix that. --D > > Brian > > > + (bmap->me_flags & ~XFS_BMAP_EXTENT_FLAGS)) { > > + /* > > + * This will pull the BUI from the AIL and > > + * free the memory associated with it. > > + */ > > + set_bit(XFS_BUI_RECOVERED, &buip->bui_flags); > > + xfs_bui_release(buip); > > + return -EIO; > > + } > > + > > + set_bit(XFS_BUI_RECOVERED, &buip->bui_flags); > > + xfs_bui_release(buip); > > + return error; > > +} > > diff --git a/fs/xfs/xfs_bmap_item.h b/fs/xfs/xfs_bmap_item.h > > index 57c13d3..c867daa 100644 > > --- a/fs/xfs/xfs_bmap_item.h > > +++ b/fs/xfs/xfs_bmap_item.h > > @@ -93,5 +93,6 @@ struct xfs_bud_log_item *xfs_bud_init(struct xfs_mount *, > > struct xfs_bui_log_item *); > > void xfs_bui_item_free(struct xfs_bui_log_item *); > > void xfs_bui_release(struct xfs_bui_log_item *); > > +int xfs_bui_recover(struct xfs_mount *mp, struct xfs_bui_log_item *buip); > > > > #endif /* __XFS_BMAP_ITEM_H__ */ > > diff --git a/fs/xfs/xfs_log_recover.c b/fs/xfs/xfs_log_recover.c > > index 622881a..9697e94 100644 > > --- a/fs/xfs/xfs_log_recover.c > > +++ b/fs/xfs/xfs_log_recover.c > > @@ -46,6 +46,7 @@ > > #include "xfs_rmap_item.h" > > #include "xfs_buf_item.h" > > #include "xfs_refcount_item.h" > > +#include "xfs_bmap_item.h" > > > > #define 
BLK_AVG(blk1, blk2) ((blk1+blk2) >> 1) > > > > @@ -1927,6 +1928,8 @@ xlog_recover_reorder_trans( > > case XFS_LI_RUD: > > case XFS_LI_CUI: > > case XFS_LI_CUD: > > + case XFS_LI_BUI: > > + case XFS_LI_BUD: > > trace_xfs_log_recover_item_reorder_tail(log, > > trans, item, pass); > > list_move_tail(&item->ri_list, &inode_list); > > @@ -3671,6 +3674,125 @@ xlog_recover_cud_pass2( > > } > > > > /* > > + * Copy a BUI format buffer from the given buf, and into the destination > > + * BUI format structure. The BUI/BUD items were designed not to need any > > + * special alignment handling. > > + */ > > +static int > > +xfs_bui_copy_format( > > + struct xfs_log_iovec *buf, > > + struct xfs_bui_log_format *dst_bui_fmt) > > +{ > > + struct xfs_bui_log_format *src_bui_fmt; > > + uint len; > > + > > + src_bui_fmt = buf->i_addr; > > + len = xfs_bui_log_format_sizeof(src_bui_fmt->bui_nextents); > > + > > + if (buf->i_len == len) { > > + memcpy(dst_bui_fmt, src_bui_fmt, len); > > + return 0; > > + } > > + return -EFSCORRUPTED; > > +} > > + > > +/* > > + * This routine is called to create an in-core extent bmap update > > + * item from the bui format structure which was logged on disk. > > + * It allocates an in-core bui, copies the extents from the format > > + * structure into it, and adds the bui to the AIL with the given > > + * LSN.
> > + */ > > +STATIC int > > +xlog_recover_bui_pass2( > > + struct xlog *log, > > + struct xlog_recover_item *item, > > + xfs_lsn_t lsn) > > +{ > > + int error; > > + struct xfs_mount *mp = log->l_mp; > > + struct xfs_bui_log_item *buip; > > + struct xfs_bui_log_format *bui_formatp; > > + > > + bui_formatp = item->ri_buf[0].i_addr; > > + > > + if (bui_formatp->bui_nextents != XFS_BUI_MAX_FAST_EXTENTS) > > + return -EFSCORRUPTED; > > + buip = xfs_bui_init(mp); > > + error = xfs_bui_copy_format(&item->ri_buf[0], &buip->bui_format); > > + if (error) { > > + xfs_bui_item_free(buip); > > + return error; > > + } > > + atomic_set(&buip->bui_next_extent, bui_formatp->bui_nextents); > > + > > + spin_lock(&log->l_ailp->xa_lock); > > + /* > > + * The BUI has two references. One for the BUD and one for BUI to ensure > > + * it makes it into the AIL. Insert the BUI into the AIL directly and > > + * drop the BUI reference. Note that xfs_trans_ail_update() drops the > > + * AIL lock. > > + */ > > + xfs_trans_ail_update(log->l_ailp, &buip->bui_item, lsn); > > + xfs_bui_release(buip); > > + return 0; > > +} > > + > > + > > +/* > > + * This routine is called when a BUD format structure is found in a committed > > + * transaction in the log. Its purpose is to cancel the corresponding BUI if it > > + * was still in the log. To do this it searches the AIL for the BUI with an id > > + * equal to that in the BUD format structure. If we find it we drop the BUD > > + * reference, which removes the BUI from the AIL and frees it.
> > + */ > > +STATIC int > > +xlog_recover_bud_pass2( > > + struct xlog *log, > > + struct xlog_recover_item *item) > > +{ > > + struct xfs_bud_log_format *bud_formatp; > > + struct xfs_bui_log_item *buip = NULL; > > + struct xfs_log_item *lip; > > + __uint64_t bui_id; > > + struct xfs_ail_cursor cur; > > + struct xfs_ail *ailp = log->l_ailp; > > + > > + bud_formatp = item->ri_buf[0].i_addr; > > + if (item->ri_buf[0].i_len != sizeof(struct xfs_bud_log_format)) > > + return -EFSCORRUPTED; > > + bui_id = bud_formatp->bud_bui_id; > > + > > + /* > > + * Search for the BUI with the id in the BUD format structure in the > > + * AIL. > > + */ > > + spin_lock(&ailp->xa_lock); > > + lip = xfs_trans_ail_cursor_first(ailp, &cur, 0); > > + while (lip != NULL) { > > + if (lip->li_type == XFS_LI_BUI) { > > + buip = (struct xfs_bui_log_item *)lip; > > + if (buip->bui_format.bui_id == bui_id) { > > + /* > > + * Drop the BUD reference to the BUI. This > > + * removes the BUI from the AIL and frees it. > > + */ > > + spin_unlock(&ailp->xa_lock); > > + xfs_bui_release(buip); > > + spin_lock(&ailp->xa_lock); > > + break; > > + } > > + } > > + lip = xfs_trans_ail_cursor_next(ailp, &cur); > > + } > > + > > + xfs_trans_ail_cursor_done(&cur); > > + spin_unlock(&ailp->xa_lock); > > + > > + return 0; > > +} > > + > > +/* > > * This routine is called when an inode create format structure is found in a > > * committed transaction in the log. It's purpose is to initialise the inodes > > * being allocated on disk. 
This requires us to get inode cluster buffers that > > @@ -3899,6 +4021,8 @@ xlog_recover_ra_pass2( > > case XFS_LI_RUD: > > case XFS_LI_CUI: > > case XFS_LI_CUD: > > + case XFS_LI_BUI: > > + case XFS_LI_BUD: > > default: > > break; > > } > > @@ -3926,6 +4050,8 @@ xlog_recover_commit_pass1( > > case XFS_LI_RUD: > > case XFS_LI_CUI: > > case XFS_LI_CUD: > > + case XFS_LI_BUI: > > + case XFS_LI_BUD: > > /* nothing to do in pass 1 */ > > return 0; > > default: > > @@ -3964,6 +4090,10 @@ xlog_recover_commit_pass2( > > return xlog_recover_cui_pass2(log, item, trans->r_lsn); > > case XFS_LI_CUD: > > return xlog_recover_cud_pass2(log, item); > > + case XFS_LI_BUI: > > + return xlog_recover_bui_pass2(log, item, trans->r_lsn); > > + case XFS_LI_BUD: > > + return xlog_recover_bud_pass2(log, item); > > case XFS_LI_DQUOT: > > return xlog_recover_dquot_pass2(log, buffer_list, item, > > trans->r_lsn); > > @@ -4591,6 +4721,46 @@ xlog_recover_cancel_cui( > > spin_lock(&ailp->xa_lock); > > } > > > > +/* Recover the BUI if necessary. */ > > +STATIC int > > +xlog_recover_process_bui( > > + struct xfs_mount *mp, > > + struct xfs_ail *ailp, > > + struct xfs_log_item *lip) > > +{ > > + struct xfs_bui_log_item *buip; > > + int error; > > + > > + /* > > + * Skip BUIs that we've already processed. > > + */ > > + buip = container_of(lip, struct xfs_bui_log_item, bui_item); > > + if (test_bit(XFS_BUI_RECOVERED, &buip->bui_flags)) > > + return 0; > > + > > + spin_unlock(&ailp->xa_lock); > > + error = xfs_bui_recover(mp, buip); > > + spin_lock(&ailp->xa_lock); > > + > > + return error; > > +} > > + > > +/* Release the BUI since we're cancelling everything. 
*/ > > +STATIC void > > +xlog_recover_cancel_bui( > > + struct xfs_mount *mp, > > + struct xfs_ail *ailp, > > + struct xfs_log_item *lip) > > +{ > > + struct xfs_bui_log_item *buip; > > + > > + buip = container_of(lip, struct xfs_bui_log_item, bui_item); > > + > > + spin_unlock(&ailp->xa_lock); > > + xfs_bui_release(buip); > > + spin_lock(&ailp->xa_lock); > > +} > > + > > /* Is this log item a deferred action intent? */ > > static inline bool xlog_item_is_intent(struct xfs_log_item *lip) > > { > > @@ -4598,6 +4768,7 @@ static inline bool xlog_item_is_intent(struct xfs_log_item *lip) > > case XFS_LI_EFI: > > case XFS_LI_RUI: > > case XFS_LI_CUI: > > + case XFS_LI_BUI: > > return true; > > default: > > return false; > > @@ -4664,6 +4835,9 @@ xlog_recover_process_intents( > > case XFS_LI_CUI: > > error = xlog_recover_process_cui(log->l_mp, ailp, lip); > > break; > > + case XFS_LI_BUI: > > + error = xlog_recover_process_bui(log->l_mp, ailp, lip); > > + break; > > } > > if (error) > > goto out; > > @@ -4714,6 +4888,9 @@ xlog_recover_cancel_intents( > > case XFS_LI_CUI: > > xlog_recover_cancel_cui(log->l_mp, ailp, lip); > > break; > > + case XFS_LI_BUI: > > + xlog_recover_cancel_bui(log->l_mp, ailp, lip); > > + break; > > } > > > > lip = xfs_trans_ail_cursor_next(ailp, &cur); > > diff --git a/fs/xfs/xfs_trans.h b/fs/xfs/xfs_trans.h > > index a7a87d2..7cf02d3 100644 > > --- a/fs/xfs/xfs_trans.h > > +++ b/fs/xfs/xfs_trans.h > > @@ -39,6 +39,7 @@ struct xfs_btree_cur; > > struct xfs_cui_log_item; > > struct xfs_cud_log_item; > > struct xfs_defer_ops; > > +struct xfs_bui_log_item; > > > > typedef struct xfs_log_item { > > struct list_head li_ail; /* AIL pointers */ > > @@ -263,4 +264,16 @@ int xfs_trans_log_finish_refcount_update(struct xfs_trans *tp, > > xfs_extlen_t blockcount, xfs_extlen_t *adjusted, > > struct xfs_btree_cur **pcur); > > > > +/* mapping updates */ > > +enum xfs_bmap_intent_type; > > + > > +void xfs_bmap_update_init_defer_op(void); > > +struct 
xfs_bud_log_item *xfs_trans_get_bud(struct xfs_trans *tp, > > + struct xfs_bui_log_item *buip); > > +int xfs_trans_log_finish_bmap_update(struct xfs_trans *tp, > > + struct xfs_bud_log_item *rudp, struct xfs_defer_ops *dfops, > > + enum xfs_bmap_intent_type type, struct xfs_inode *ip, > > + int whichfork, xfs_fileoff_t startoff, xfs_fsblock_t startblock, > > + xfs_filblks_t blockcount, xfs_exntst_t state); > > + > > #endif /* __XFS_TRANS_H__ */ > > diff --git a/fs/xfs/xfs_trans_bmap.c b/fs/xfs/xfs_trans_bmap.c > > new file mode 100644 > > index 0000000..656d669 > > --- /dev/null > > +++ b/fs/xfs/xfs_trans_bmap.c > > @@ -0,0 +1,84 @@ > > +/* > > + * Copyright (C) 2016 Oracle. All Rights Reserved. > > + * > > + * Author: Darrick J. Wong <darrick.wong@xxxxxxxxxx> > > + * > > + * This program is free software; you can redistribute it and/or > > + * modify it under the terms of the GNU General Public License > > + * as published by the Free Software Foundation; either version 2 > > + * of the License, or (at your option) any later version. > > + * > > + * This program is distributed in the hope that it would be useful, > > + * but WITHOUT ANY WARRANTY; without even the implied warranty of > > + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the > > + * GNU General Public License for more details. > > + * > > + * You should have received a copy of the GNU General Public License > > + * along with this program; if not, write the Free Software Foundation, > > + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA. 
> > + */ > > +#include "xfs.h" > > +#include "xfs_fs.h" > > +#include "xfs_shared.h" > > +#include "xfs_format.h" > > +#include "xfs_log_format.h" > > +#include "xfs_trans_resv.h" > > +#include "xfs_mount.h" > > +#include "xfs_defer.h" > > +#include "xfs_trans.h" > > +#include "xfs_trans_priv.h" > > +#include "xfs_bmap_item.h" > > +#include "xfs_alloc.h" > > +#include "xfs_bmap.h" > > +#include "xfs_inode.h" > > + > > +/* > > + * This routine is called to allocate a "bmap update done" > > + * log item. > > + */ > > +struct xfs_bud_log_item * > > +xfs_trans_get_bud( > > + struct xfs_trans *tp, > > + struct xfs_bui_log_item *buip) > > +{ > > + struct xfs_bud_log_item *budp; > > + > > + budp = xfs_bud_init(tp->t_mountp, buip); > > + xfs_trans_add_item(tp, &budp->bud_item); > > + return budp; > > +} > > + > > +/* > > + * Finish a bmap update and log it to the BUD. Note that the > > + * transaction is marked dirty regardless of whether the bmap update > > + * succeeds or fails to support the BUI/BUD lifecycle rules. > > + */ > > +int > > +xfs_trans_log_finish_bmap_update( > > + struct xfs_trans *tp, > > + struct xfs_bud_log_item *budp, > > + struct xfs_defer_ops *dop, > > + enum xfs_bmap_intent_type type, > > + struct xfs_inode *ip, > > + int whichfork, > > + xfs_fileoff_t startoff, > > + xfs_fsblock_t startblock, > > + xfs_filblks_t blockcount, > > + xfs_exntst_t state) > > +{ > > + int error; > > + > > + error = -EFSCORRUPTED; > > + > > + /* > > + * Mark the transaction dirty, even on error. This ensures the > > + * transaction is aborted, which: > > + * > > + * 1.) releases the BUI and frees the BUD > > + * 2.)
shuts down the filesystem > > + */ > > + tp->t_flags |= XFS_TRANS_DIRTY; > > + budp->bud_item.li_desc->lid_flags |= XFS_LID_DIRTY; > > + > > + return error; > > +} > > > > -- > > To unsubscribe from this list: send the line "unsubscribe linux-xfs" in > > the body of a message to majordomo@xxxxxxxxxxxxxxx > > More majordomo info at http://vger.kernel.org/majordomo-info.html -- To unsubscribe from this list: send the line "unsubscribe linux-xfs" in the body of a message to majordomo@xxxxxxxxxxxxxxx More majordomo info at http://vger.kernel.org/majordomo-info.html