diff options
Diffstat (limited to 'fs/xfs/libxfs')
| -rw-r--r-- | fs/xfs/libxfs/xfs_ag.c | 2 | ||||
| -rw-r--r-- | fs/xfs/libxfs/xfs_alloc.c | 289 | ||||
| -rw-r--r-- | fs/xfs/libxfs/xfs_alloc.h | 24 | ||||
| -rw-r--r-- | fs/xfs/libxfs/xfs_attr_leaf.c | 2 | ||||
| -rw-r--r-- | fs/xfs/libxfs/xfs_bmap.c | 8 | ||||
| -rw-r--r-- | fs/xfs/libxfs/xfs_bmap_btree.c | 3 | ||||
| -rw-r--r-- | fs/xfs/libxfs/xfs_da_format.h | 75 | ||||
| -rw-r--r-- | fs/xfs/libxfs/xfs_fs.h | 4 | ||||
| -rw-r--r-- | fs/xfs/libxfs/xfs_ialloc.c | 32 | ||||
| -rw-r--r-- | fs/xfs/libxfs/xfs_ialloc_btree.c | 3 | ||||
| -rw-r--r-- | fs/xfs/libxfs/xfs_refcount.c | 22 | ||||
| -rw-r--r-- | fs/xfs/libxfs/xfs_refcount_btree.c | 8 | ||||
| -rw-r--r-- | fs/xfs/libxfs/xfs_rmap.c | 10 | ||||
| -rw-r--r-- | fs/xfs/libxfs/xfs_sb.c | 56 | 
14 files changed, 365 insertions, 173 deletions
| diff --git a/fs/xfs/libxfs/xfs_ag.c b/fs/xfs/libxfs/xfs_ag.c index ee84835ebc66..e9cc481b4ddf 100644 --- a/fs/xfs/libxfs/xfs_ag.c +++ b/fs/xfs/libxfs/xfs_ag.c @@ -985,7 +985,7 @@ xfs_ag_shrink_space(  			goto resv_err;  		err2 = __xfs_free_extent_later(*tpp, args.fsbno, delta, NULL, -				true); +				XFS_AG_RESV_NONE, true);  		if (err2)  			goto resv_err; diff --git a/fs/xfs/libxfs/xfs_alloc.c b/fs/xfs/libxfs/xfs_alloc.c index c20fe99405d8..3069194527dd 100644 --- a/fs/xfs/libxfs/xfs_alloc.c +++ b/fs/xfs/libxfs/xfs_alloc.c @@ -1536,7 +1536,8 @@ xfs_alloc_ag_vextent_lastblock(   */  STATIC int  xfs_alloc_ag_vextent_near( -	struct xfs_alloc_arg	*args) +	struct xfs_alloc_arg	*args, +	uint32_t		alloc_flags)  {  	struct xfs_alloc_cur	acur = {};  	int			error;		/* error code */ @@ -1555,6 +1556,8 @@ xfs_alloc_ag_vextent_near(  	if (args->agbno > args->max_agbno)  		args->agbno = args->max_agbno; +	/* Retry once quickly if we find busy extents before blocking. */ +	alloc_flags |= XFS_ALLOC_FLAG_TRYFLUSH;  restart:  	len = 0; @@ -1610,9 +1613,20 @@ restart:  	 */  	if (!acur.len) {  		if (acur.busy) { +			/* +			 * Our only valid extents must have been busy. Flush and +			 * retry the allocation again. If we get an -EAGAIN +			 * error, we're being told that a deadlock was avoided +			 * and the current transaction needs committing before +			 * the allocation can be retried. +			 */  			trace_xfs_alloc_near_busy(args); -			xfs_extent_busy_flush(args->mp, args->pag, -					      acur.busy_gen); +			error = xfs_extent_busy_flush(args->tp, args->pag, +					acur.busy_gen, alloc_flags); +			if (error) +				goto out; + +			alloc_flags &= ~XFS_ALLOC_FLAG_TRYFLUSH;  			goto restart;  		}  		trace_xfs_alloc_size_neither(args); @@ -1635,22 +1649,25 @@ out:   * and of the form k * prod + mod unless there's nothing that large.   * Return the starting a.g. block, or NULLAGBLOCK if we can't do it.   */ -STATIC int				/* error */ +static int  xfs_alloc_ag_vextent_size( -	xfs_alloc_arg_t	*args)		/* allocation argument structure */ +	struct xfs_alloc_arg	*args, +	uint32_t		alloc_flags)  { -	struct xfs_agf	*agf = args->agbp->b_addr; -	struct xfs_btree_cur *bno_cur;	/* cursor for bno btree */ -	struct xfs_btree_cur *cnt_cur;	/* cursor for cnt btree */ -	int		error;		/* error result */ -	xfs_agblock_t	fbno;		/* start of found freespace */ -	xfs_extlen_t	flen;		/* length of found freespace */ -	int		i;		/* temp status variable */ -	xfs_agblock_t	rbno;		/* returned block number */ -	xfs_extlen_t	rlen;		/* length of returned extent */ -	bool		busy; -	unsigned	busy_gen; +	struct xfs_agf		*agf = args->agbp->b_addr; +	struct xfs_btree_cur	*bno_cur; +	struct xfs_btree_cur	*cnt_cur; +	xfs_agblock_t		fbno;		/* start of found freespace */ +	xfs_extlen_t		flen;		/* length of found freespace */ +	xfs_agblock_t		rbno;		/* returned block number */ +	xfs_extlen_t		rlen;		/* length of returned extent */ +	bool			busy; +	unsigned		busy_gen; +	int			error; +	int			i; +	/* Retry once quickly if we find busy extents before blocking. */ +	alloc_flags |= XFS_ALLOC_FLAG_TRYFLUSH;  restart:  	/*  	 * Allocate and initialize a cursor for the by-size btree. @@ -1708,19 +1725,25 @@ restart:  			error = xfs_btree_increment(cnt_cur, 0, &i);  			if (error)  				goto error0; -			if (i == 0) { -				/* -				 * Our only valid extents must have been busy. -				 * Make it unbusy by forcing the log out and -				 * retrying. -				 */ -				xfs_btree_del_cursor(cnt_cur, -						     XFS_BTREE_NOERROR); -				trace_xfs_alloc_size_busy(args); -				xfs_extent_busy_flush(args->mp, -							args->pag, busy_gen); -				goto restart; -			} +			if (i) +				continue; + +			/* +			 * Our only valid extents must have been busy. Flush and +			 * retry the allocation again. If we get an -EAGAIN +			 * error, we're being told that a deadlock was avoided +			 * and the current transaction needs committing before +			 * the allocation can be retried. +			 */ +			trace_xfs_alloc_size_busy(args); +			error = xfs_extent_busy_flush(args->tp, args->pag, +					busy_gen, alloc_flags); +			if (error) +				goto error0; + +			alloc_flags &= ~XFS_ALLOC_FLAG_TRYFLUSH; +			xfs_btree_del_cursor(cnt_cur, XFS_BTREE_NOERROR); +			goto restart;  		}  	} @@ -1800,9 +1823,21 @@ restart:  	args->len = rlen;  	if (rlen < args->minlen) {  		if (busy) { -			xfs_btree_del_cursor(cnt_cur, XFS_BTREE_NOERROR); +			/* +			 * Our only valid extents must have been busy. Flush and +			 * retry the allocation again. If we get an -EAGAIN +			 * error, we're being told that a deadlock was avoided +			 * and the current transaction needs committing before +			 * the allocation can be retried. +			 */  			trace_xfs_alloc_size_busy(args); -			xfs_extent_busy_flush(args->mp, args->pag, busy_gen); +			error = xfs_extent_busy_flush(args->tp, args->pag, +					busy_gen, alloc_flags); +			if (error) +				goto error0; + +			alloc_flags &= ~XFS_ALLOC_FLAG_TRYFLUSH; +			xfs_btree_del_cursor(cnt_cur, XFS_BTREE_NOERROR);  			goto restart;  		}  		goto out_nominleft; @@ -2435,23 +2470,25 @@ static int  xfs_defer_agfl_block(  	struct xfs_trans		*tp,  	xfs_agnumber_t			agno, -	xfs_fsblock_t			agbno, +	xfs_agblock_t			agbno,  	struct xfs_owner_info		*oinfo)  {  	struct xfs_mount		*mp = tp->t_mountp;  	struct xfs_extent_free_item	*xefi; +	xfs_fsblock_t			fsbno = XFS_AGB_TO_FSB(mp, agno, agbno);  	ASSERT(xfs_extfree_item_cache != NULL);  	ASSERT(oinfo != NULL); +	if (XFS_IS_CORRUPT(mp, !xfs_verify_fsbno(mp, fsbno))) +		return -EFSCORRUPTED; +  	xefi = kmem_cache_zalloc(xfs_extfree_item_cache,  			       GFP_KERNEL | __GFP_NOFAIL); -	xefi->xefi_startblock = XFS_AGB_TO_FSB(mp, agno, agbno); +	xefi->xefi_startblock = fsbno;  	xefi->xefi_blockcount = 1;  	xefi->xefi_owner = oinfo->oi_owner; - -	if (XFS_IS_CORRUPT(mp, !xfs_verify_fsbno(mp, xefi->xefi_startblock))) -		return -EFSCORRUPTED; +	xefi->xefi_agresv = XFS_AG_RESV_AGFL;  	trace_xfs_agfl_free_defer(mp, agno, 0, agbno, 1); @@ -2470,6 +2507,7 @@ __xfs_free_extent_later(  	xfs_fsblock_t			bno,  	xfs_filblks_t			len,  	const struct xfs_owner_info	*oinfo, +	enum xfs_ag_resv_type		type,  	bool				skip_discard)  {  	struct xfs_extent_free_item	*xefi; @@ -2490,6 +2528,7 @@ __xfs_free_extent_later(  	ASSERT(agbno + len <= mp->m_sb.sb_agblocks);  #endif  	ASSERT(xfs_extfree_item_cache != NULL); +	ASSERT(type != XFS_AG_RESV_AGFL);  	if (XFS_IS_CORRUPT(mp, !xfs_verify_fsbext(mp, bno, len)))  		return -EFSCORRUPTED; @@ -2498,6 +2537,7 @@ __xfs_free_extent_later(  			       GFP_KERNEL | __GFP_NOFAIL);  	xefi->xefi_startblock = bno;  	xefi->xefi_blockcount = (xfs_extlen_t)len; +	xefi->xefi_agresv = type;  	if (skip_discard)  		xefi->xefi_flags |= XFS_EFI_SKIP_DISCARD;  	if (oinfo) { @@ -2568,7 +2608,7 @@ out:  int			/* error */  xfs_alloc_fix_freelist(  	struct xfs_alloc_arg	*args,	/* allocation argument structure */ -	int			flags)	/* XFS_ALLOC_FLAG_... */ +	uint32_t		alloc_flags)  {  	struct xfs_mount	*mp = args->mp;  	struct xfs_perag	*pag = args->pag; @@ -2584,7 +2624,7 @@ xfs_alloc_fix_freelist(  	ASSERT(tp->t_flags & XFS_TRANS_PERM_LOG_RES);  	if (!xfs_perag_initialised_agf(pag)) { -		error = xfs_alloc_read_agf(pag, tp, flags, &agbp); +		error = xfs_alloc_read_agf(pag, tp, alloc_flags, &agbp);  		if (error) {  			/* Couldn't lock the AGF so skip this AG. */  			if (error == -EAGAIN) @@ -2600,13 +2640,13 @@ xfs_alloc_fix_freelist(  	 */  	if (xfs_perag_prefers_metadata(pag) &&  	    (args->datatype & XFS_ALLOC_USERDATA) && -	    (flags & XFS_ALLOC_FLAG_TRYLOCK)) { -		ASSERT(!(flags & XFS_ALLOC_FLAG_FREEING)); +	    (alloc_flags & XFS_ALLOC_FLAG_TRYLOCK)) { +		ASSERT(!(alloc_flags & XFS_ALLOC_FLAG_FREEING));  		goto out_agbp_relse;  	}  	need = xfs_alloc_min_freelist(mp, pag); -	if (!xfs_alloc_space_available(args, need, flags | +	if (!xfs_alloc_space_available(args, need, alloc_flags |  			XFS_ALLOC_FLAG_CHECK))  		goto out_agbp_relse; @@ -2615,7 +2655,7 @@ xfs_alloc_fix_freelist(  	 * Can fail if we're not blocking on locks, and it's held.  	 */  	if (!agbp) { -		error = xfs_alloc_read_agf(pag, tp, flags, &agbp); +		error = xfs_alloc_read_agf(pag, tp, alloc_flags, &agbp);  		if (error) {  			/* Couldn't lock the AGF so skip this AG. */  			if (error == -EAGAIN) @@ -2630,7 +2670,7 @@ xfs_alloc_fix_freelist(  	/* If there isn't enough total space or single-extent, reject it. */  	need = xfs_alloc_min_freelist(mp, pag); -	if (!xfs_alloc_space_available(args, need, flags)) +	if (!xfs_alloc_space_available(args, need, alloc_flags))  		goto out_agbp_relse;  #ifdef DEBUG @@ -2668,11 +2708,12 @@ xfs_alloc_fix_freelist(  	 */  	memset(&targs, 0, sizeof(targs));  	/* struct copy below */ -	if (flags & XFS_ALLOC_FLAG_NORMAP) +	if (alloc_flags & XFS_ALLOC_FLAG_NORMAP)  		targs.oinfo = XFS_RMAP_OINFO_SKIP_UPDATE;  	else  		targs.oinfo = XFS_RMAP_OINFO_AG; -	while (!(flags & XFS_ALLOC_FLAG_NOSHRINK) && pag->pagf_flcount > need) { +	while (!(alloc_flags & XFS_ALLOC_FLAG_NOSHRINK) && +			pag->pagf_flcount > need) {  		error = xfs_alloc_get_freelist(pag, tp, agbp, &bno, 0);  		if (error)  			goto out_agbp_relse; @@ -2700,7 +2741,7 @@ xfs_alloc_fix_freelist(  		targs.resv = XFS_AG_RESV_AGFL;  		/* Allocate as many blocks as possible at once. */ -		error = xfs_alloc_ag_vextent_size(&targs); +		error = xfs_alloc_ag_vextent_size(&targs, alloc_flags);  		if (error)  			goto out_agflbp_relse; @@ -2710,7 +2751,7 @@ xfs_alloc_fix_freelist(  		 * on a completely full ag.  		 */  		if (targs.agbno == NULLAGBLOCK) { -			if (flags & XFS_ALLOC_FLAG_FREEING) +			if (alloc_flags & XFS_ALLOC_FLAG_FREEING)  				break;  			goto out_agflbp_relse;  		} @@ -2916,6 +2957,47 @@ xfs_alloc_put_freelist(  }  /* + * Check that this AGF/AGI header's sequence number and length matches the AG + * number and size in fsblocks. + */ +xfs_failaddr_t +xfs_validate_ag_length( +	struct xfs_buf		*bp, +	uint32_t		seqno, +	uint32_t		length) +{ +	struct xfs_mount	*mp = bp->b_mount; +	/* +	 * During growfs operations, the perag is not fully initialised, +	 * so we can't use it for any useful checking. growfs ensures we can't +	 * use it by using uncached buffers that don't have the perag attached +	 * so we can detect and avoid this problem. +	 */ +	if (bp->b_pag && seqno != bp->b_pag->pag_agno) +		return __this_address; + +	/* +	 * Only the last AG in the filesystem is allowed to be shorter +	 * than the AG size recorded in the superblock. +	 */ +	if (length != mp->m_sb.sb_agblocks) { +		/* +		 * During growfs, the new last AG can get here before we +		 * have updated the superblock. Give it a pass on the seqno +		 * check. +		 */ +		if (bp->b_pag && seqno != mp->m_sb.sb_agcount - 1) +			return __this_address; +		if (length < XFS_MIN_AG_BLOCKS) +			return __this_address; +		if (length > mp->m_sb.sb_agblocks) +			return __this_address; +	} + +	return NULL; +} + +/*   * Verify the AGF is consistent.   *   * We do not verify the AGFL indexes in the AGF are fully consistent here @@ -2934,6 +3016,9 @@ xfs_agf_verify(  {  	struct xfs_mount	*mp = bp->b_mount;  	struct xfs_agf		*agf = bp->b_addr; +	xfs_failaddr_t		fa; +	uint32_t		agf_seqno = be32_to_cpu(agf->agf_seqno); +	uint32_t		agf_length = be32_to_cpu(agf->agf_length);  	if (xfs_has_crc(mp)) {  		if (!uuid_equal(&agf->agf_uuid, &mp->m_sb.sb_meta_uuid)) @@ -2945,18 +3030,26 @@ xfs_agf_verify(  	if (!xfs_verify_magic(bp, agf->agf_magicnum))  		return __this_address; -	if (!(XFS_AGF_GOOD_VERSION(be32_to_cpu(agf->agf_versionnum)) && -	      be32_to_cpu(agf->agf_freeblks) <= be32_to_cpu(agf->agf_length) && -	      be32_to_cpu(agf->agf_flfirst) < xfs_agfl_size(mp) && -	      be32_to_cpu(agf->agf_fllast) < xfs_agfl_size(mp) && -	      be32_to_cpu(agf->agf_flcount) <= xfs_agfl_size(mp))) +	if (!XFS_AGF_GOOD_VERSION(be32_to_cpu(agf->agf_versionnum)))  		return __this_address; -	if (be32_to_cpu(agf->agf_length) > mp->m_sb.sb_dblocks) +	/* +	 * Both agf_seqno and agf_length need to validated before anything else +	 * block number related in the AGF or AGFL can be checked. +	 */ +	fa = xfs_validate_ag_length(bp, agf_seqno, agf_length); +	if (fa) +		return fa; + +	if (be32_to_cpu(agf->agf_flfirst) >= xfs_agfl_size(mp)) +		return __this_address; +	if (be32_to_cpu(agf->agf_fllast) >= xfs_agfl_size(mp)) +		return __this_address; +	if (be32_to_cpu(agf->agf_flcount) > xfs_agfl_size(mp))  		return __this_address;  	if (be32_to_cpu(agf->agf_freeblks) < be32_to_cpu(agf->agf_longest) || -	    be32_to_cpu(agf->agf_freeblks) > be32_to_cpu(agf->agf_length)) +	    be32_to_cpu(agf->agf_freeblks) > agf_length)  		return __this_address;  	if (be32_to_cpu(agf->agf_levels[XFS_BTNUM_BNO]) < 1 || @@ -2967,38 +3060,28 @@ xfs_agf_verify(  						mp->m_alloc_maxlevels)  		return __this_address; -	if (xfs_has_rmapbt(mp) && -	    (be32_to_cpu(agf->agf_levels[XFS_BTNUM_RMAP]) < 1 || -	     be32_to_cpu(agf->agf_levels[XFS_BTNUM_RMAP]) > -						mp->m_rmap_maxlevels)) -		return __this_address; - -	if (xfs_has_rmapbt(mp) && -	    be32_to_cpu(agf->agf_rmap_blocks) > be32_to_cpu(agf->agf_length)) +	if (xfs_has_lazysbcount(mp) && +	    be32_to_cpu(agf->agf_btreeblks) > agf_length)  		return __this_address; -	/* -	 * during growfs operations, the perag is not fully initialised, -	 * so we can't use it for any useful checking. growfs ensures we can't -	 * use it by using uncached buffers that don't have the perag attached -	 * so we can detect and avoid this problem. -	 */ -	if (bp->b_pag && be32_to_cpu(agf->agf_seqno) != bp->b_pag->pag_agno) -		return __this_address; +	if (xfs_has_rmapbt(mp)) { +		if (be32_to_cpu(agf->agf_rmap_blocks) > agf_length) +			return __this_address; -	if (xfs_has_lazysbcount(mp) && -	    be32_to_cpu(agf->agf_btreeblks) > be32_to_cpu(agf->agf_length)) -		return __this_address; +		if (be32_to_cpu(agf->agf_levels[XFS_BTNUM_RMAP]) < 1 || +		    be32_to_cpu(agf->agf_levels[XFS_BTNUM_RMAP]) > +							mp->m_rmap_maxlevels) +			return __this_address; +	} -	if (xfs_has_reflink(mp) && -	    be32_to_cpu(agf->agf_refcount_blocks) > -	    be32_to_cpu(agf->agf_length)) -		return __this_address; +	if (xfs_has_reflink(mp)) { +		if (be32_to_cpu(agf->agf_refcount_blocks) > agf_length) +			return __this_address; -	if (xfs_has_reflink(mp) && -	    (be32_to_cpu(agf->agf_refcount_level) < 1 || -	     be32_to_cpu(agf->agf_refcount_level) > mp->m_refc_maxlevels)) -		return __this_address; +		if (be32_to_cpu(agf->agf_refcount_level) < 1 || +		    be32_to_cpu(agf->agf_refcount_level) > mp->m_refc_maxlevels) +			return __this_address; +	}  	return NULL;  } @@ -3226,7 +3309,7 @@ xfs_alloc_vextent_check_args(  static int  xfs_alloc_vextent_prepare_ag(  	struct xfs_alloc_arg	*args, -	uint32_t		flags) +	uint32_t		alloc_flags)  {  	bool			need_pag = !args->pag;  	int			error; @@ -3235,7 +3318,7 @@ xfs_alloc_vextent_prepare_ag(  		args->pag = xfs_perag_get(args->mp, args->agno);  	args->agbp = NULL; -	error = xfs_alloc_fix_freelist(args, flags); +	error = xfs_alloc_fix_freelist(args, alloc_flags);  	if (error) {  		trace_xfs_alloc_vextent_nofix(args);  		if (need_pag) @@ -3357,6 +3440,7 @@ xfs_alloc_vextent_this_ag(  {  	struct xfs_mount	*mp = args->mp;  	xfs_agnumber_t		minimum_agno; +	uint32_t		alloc_flags = 0;  	int			error;  	ASSERT(args->pag != NULL); @@ -3375,9 +3459,9 @@ xfs_alloc_vextent_this_ag(  		return error;  	} -	error = xfs_alloc_vextent_prepare_ag(args, 0); +	error = xfs_alloc_vextent_prepare_ag(args, alloc_flags);  	if (!error && args->agbp) -		error = xfs_alloc_ag_vextent_size(args); +		error = xfs_alloc_ag_vextent_size(args, alloc_flags);  	return xfs_alloc_vextent_finish(args, minimum_agno, error, false);  } @@ -3406,20 +3490,20 @@ xfs_alloc_vextent_iterate_ags(  	xfs_agnumber_t		minimum_agno,  	xfs_agnumber_t		start_agno,  	xfs_agblock_t		target_agbno, -	uint32_t		flags) +	uint32_t		alloc_flags)  {  	struct xfs_mount	*mp = args->mp;  	xfs_agnumber_t		restart_agno = minimum_agno;  	xfs_agnumber_t		agno;  	int			error = 0; -	if (flags & XFS_ALLOC_FLAG_TRYLOCK) +	if (alloc_flags & XFS_ALLOC_FLAG_TRYLOCK)  		restart_agno = 0;  restart:  	for_each_perag_wrap_range(mp, start_agno, restart_agno,  			mp->m_sb.sb_agcount, agno, args->pag) {  		args->agno = agno; -		error = xfs_alloc_vextent_prepare_ag(args, flags); +		error = xfs_alloc_vextent_prepare_ag(args, alloc_flags);  		if (error)  			break;  		if (!args->agbp) { @@ -3433,10 +3517,10 @@ restart:  		 */  		if (args->agno == start_agno && target_agbno) {  			args->agbno = target_agbno; -			error = xfs_alloc_ag_vextent_near(args); +			error = xfs_alloc_ag_vextent_near(args, alloc_flags);  		} else {  			args->agbno = 0; -			error = xfs_alloc_ag_vextent_size(args); +			error = xfs_alloc_ag_vextent_size(args, alloc_flags);  		}  		break;  	} @@ -3453,8 +3537,8 @@ restart:  	 * constraining flags by the caller, drop them and retry the allocation  	 * without any constraints being set.  	 */ -	if (flags) { -		flags = 0; +	if (alloc_flags & XFS_ALLOC_FLAG_TRYLOCK) { +		alloc_flags &= ~XFS_ALLOC_FLAG_TRYLOCK;  		restart_agno = minimum_agno;  		goto restart;  	} @@ -3482,6 +3566,7 @@ xfs_alloc_vextent_start_ag(  	xfs_agnumber_t		start_agno;  	xfs_agnumber_t		rotorstep = xfs_rotorstep;  	bool			bump_rotor = false; +	uint32_t		alloc_flags = XFS_ALLOC_FLAG_TRYLOCK;  	int			error;  	ASSERT(args->pag == NULL); @@ -3508,7 +3593,7 @@ xfs_alloc_vextent_start_ag(  	start_agno = max(minimum_agno, XFS_FSB_TO_AGNO(mp, target));  	error = xfs_alloc_vextent_iterate_ags(args, minimum_agno, start_agno, -			XFS_FSB_TO_AGBNO(mp, target), XFS_ALLOC_FLAG_TRYLOCK); +			XFS_FSB_TO_AGBNO(mp, target), alloc_flags);  	if (bump_rotor) {  		if (args->agno == start_agno) @@ -3535,6 +3620,7 @@ xfs_alloc_vextent_first_ag(  	struct xfs_mount	*mp = args->mp;  	xfs_agnumber_t		minimum_agno;  	xfs_agnumber_t		start_agno; +	uint32_t		alloc_flags = XFS_ALLOC_FLAG_TRYLOCK;  	int			error;  	ASSERT(args->pag == NULL); @@ -3553,7 +3639,7 @@ xfs_alloc_vextent_first_ag(  	start_agno = max(minimum_agno, XFS_FSB_TO_AGNO(mp, target));  	error = xfs_alloc_vextent_iterate_ags(args, minimum_agno, start_agno, -			XFS_FSB_TO_AGBNO(mp, target), 0); +			XFS_FSB_TO_AGBNO(mp, target), alloc_flags);  	return xfs_alloc_vextent_finish(args, minimum_agno, error, true);  } @@ -3606,6 +3692,7 @@ xfs_alloc_vextent_near_bno(  	struct xfs_mount	*mp = args->mp;  	xfs_agnumber_t		minimum_agno;  	bool			needs_perag = args->pag == NULL; +	uint32_t		alloc_flags = 0;  	int			error;  	if (!needs_perag) @@ -3626,9 +3713,9 @@ xfs_alloc_vextent_near_bno(  	if (needs_perag)  		args->pag = xfs_perag_grab(mp, args->agno); -	error = xfs_alloc_vextent_prepare_ag(args, 0); +	error = xfs_alloc_vextent_prepare_ag(args, alloc_flags);  	if (!error && args->agbp) -		error = xfs_alloc_ag_vextent_near(args); +		error = xfs_alloc_ag_vextent_near(args, alloc_flags);  	return xfs_alloc_vextent_finish(args, minimum_agno, error, needs_perag);  } @@ -3756,15 +3843,11 @@ xfs_alloc_query_range(  	xfs_alloc_query_range_fn		fn,  	void					*priv)  { -	union xfs_btree_irec			low_brec; -	union xfs_btree_irec			high_brec; -	struct xfs_alloc_query_range_info	query; +	union xfs_btree_irec			low_brec = { .a = *low_rec }; +	union xfs_btree_irec			high_brec = { .a = *high_rec }; +	struct xfs_alloc_query_range_info	query = { .priv = priv, .fn = fn };  	ASSERT(cur->bc_btnum == XFS_BTNUM_BNO); -	low_brec.a = *low_rec; -	high_brec.a = *high_rec; -	query.priv = priv; -	query.fn = fn;  	return xfs_btree_query_range(cur, &low_brec, &high_brec,  			xfs_alloc_query_range_helper, &query);  } diff --git a/fs/xfs/libxfs/xfs_alloc.h b/fs/xfs/libxfs/xfs_alloc.h index 85ac470be0da..6bb8d295c321 100644 --- a/fs/xfs/libxfs/xfs_alloc.h +++ b/fs/xfs/libxfs/xfs_alloc.h @@ -19,11 +19,12 @@ unsigned int xfs_agfl_size(struct xfs_mount *mp);  /*   * Flags for xfs_alloc_fix_freelist.   */ -#define	XFS_ALLOC_FLAG_TRYLOCK	0x00000001  /* use trylock for buffer locking */ -#define	XFS_ALLOC_FLAG_FREEING	0x00000002  /* indicate caller is freeing extents*/ -#define	XFS_ALLOC_FLAG_NORMAP	0x00000004  /* don't modify the rmapbt */ -#define	XFS_ALLOC_FLAG_NOSHRINK	0x00000008  /* don't shrink the freelist */ -#define	XFS_ALLOC_FLAG_CHECK	0x00000010  /* test only, don't modify args */ +#define	XFS_ALLOC_FLAG_TRYLOCK	(1U << 0)  /* use trylock for buffer locking */ +#define	XFS_ALLOC_FLAG_FREEING	(1U << 1)  /* indicate caller is freeing extents*/ +#define	XFS_ALLOC_FLAG_NORMAP	(1U << 2)  /* don't modify the rmapbt */ +#define	XFS_ALLOC_FLAG_NOSHRINK	(1U << 3)  /* don't shrink the freelist */ +#define	XFS_ALLOC_FLAG_CHECK	(1U << 4)  /* test only, don't modify args */ +#define	XFS_ALLOC_FLAG_TRYFLUSH	(1U << 5)  /* don't wait in busy extent flush */  /*   * Argument structure for xfs_alloc routines. @@ -195,7 +196,7 @@ int xfs_alloc_read_agfl(struct xfs_perag *pag, struct xfs_trans *tp,  		struct xfs_buf **bpp);  int xfs_free_agfl_block(struct xfs_trans *, xfs_agnumber_t, xfs_agblock_t,  			struct xfs_buf *, struct xfs_owner_info *); -int xfs_alloc_fix_freelist(struct xfs_alloc_arg *args, int flags); +int xfs_alloc_fix_freelist(struct xfs_alloc_arg *args, uint32_t alloc_flags);  int xfs_free_extent_fix_freelist(struct xfs_trans *tp, struct xfs_perag *pag,  		struct xfs_buf **agbp); @@ -232,7 +233,7 @@ xfs_buf_to_agfl_bno(  int __xfs_free_extent_later(struct xfs_trans *tp, xfs_fsblock_t bno,  		xfs_filblks_t len, const struct xfs_owner_info *oinfo, -		bool skip_discard); +		enum xfs_ag_resv_type type, bool skip_discard);  /*   * List of extents to be free "later". @@ -245,6 +246,7 @@ struct xfs_extent_free_item {  	xfs_extlen_t		xefi_blockcount;/* number of blocks in extent */  	struct xfs_perag	*xefi_pag;  	unsigned int		xefi_flags; +	enum xfs_ag_resv_type	xefi_agresv;  };  void xfs_extent_free_get_group(struct xfs_mount *mp, @@ -259,9 +261,10 @@ xfs_free_extent_later(  	struct xfs_trans		*tp,  	xfs_fsblock_t			bno,  	xfs_filblks_t			len, -	const struct xfs_owner_info	*oinfo) +	const struct xfs_owner_info	*oinfo, +	enum xfs_ag_resv_type		type)  { -	return __xfs_free_extent_later(tp, bno, len, oinfo, false); +	return __xfs_free_extent_later(tp, bno, len, oinfo, type, false);  } @@ -270,4 +273,7 @@ extern struct kmem_cache	*xfs_extfree_item_cache;  int __init xfs_extfree_intent_init_cache(void);  void xfs_extfree_intent_destroy_cache(void); +xfs_failaddr_t xfs_validate_ag_length(struct xfs_buf *bp, uint32_t seqno, +		uint32_t length); +  #endif	/* __XFS_ALLOC_H__ */ diff --git a/fs/xfs/libxfs/xfs_attr_leaf.c b/fs/xfs/libxfs/xfs_attr_leaf.c index beee51ad75ce..2580ae47209a 100644 --- a/fs/xfs/libxfs/xfs_attr_leaf.c +++ b/fs/xfs/libxfs/xfs_attr_leaf.c @@ -2293,8 +2293,6 @@ xfs_attr3_leaf_unbalance(  	trace_xfs_attr_leaf_unbalance(state->args); -	drop_leaf = drop_blk->bp->b_addr; -	save_leaf = save_blk->bp->b_addr;  	xfs_attr3_leaf_hdr_from_disk(state->args->geo, &drophdr, drop_leaf);  	xfs_attr3_leaf_hdr_from_disk(state->args->geo, &savehdr, save_leaf);  	entry = xfs_attr3_leaf_entryp(drop_leaf); diff --git a/fs/xfs/libxfs/xfs_bmap.c b/fs/xfs/libxfs/xfs_bmap.c index fef35696adb7..30c931b38853 100644 --- a/fs/xfs/libxfs/xfs_bmap.c +++ b/fs/xfs/libxfs/xfs_bmap.c @@ -574,7 +574,8 @@ xfs_bmap_btree_to_extents(  		return error;  	xfs_rmap_ino_bmbt_owner(&oinfo, ip->i_ino, whichfork); -	error = xfs_free_extent_later(cur->bc_tp, cbno, 1, &oinfo); +	error = xfs_free_extent_later(cur->bc_tp, cbno, 1, &oinfo, +			XFS_AG_RESV_NONE);  	if (error)  		return error; @@ -5236,8 +5237,9 @@ xfs_bmap_del_extent_real(  		} else {  			error = __xfs_free_extent_later(tp, del->br_startblock,  					del->br_blockcount, NULL, -					(bflags & XFS_BMAPI_NODISCARD) || -					del->br_state == XFS_EXT_UNWRITTEN); +					XFS_AG_RESV_NONE, +					((bflags & XFS_BMAPI_NODISCARD) || +					del->br_state == XFS_EXT_UNWRITTEN));  			if (error)  				goto done;  		} diff --git a/fs/xfs/libxfs/xfs_bmap_btree.c b/fs/xfs/libxfs/xfs_bmap_btree.c index 36564ae3084f..bf3f1b36fdd2 100644 --- a/fs/xfs/libxfs/xfs_bmap_btree.c +++ b/fs/xfs/libxfs/xfs_bmap_btree.c @@ -271,7 +271,8 @@ xfs_bmbt_free_block(  	int			error;  	xfs_rmap_ino_bmbt_owner(&oinfo, ip->i_ino, cur->bc_ino.whichfork); -	error = xfs_free_extent_later(cur->bc_tp, fsbno, 1, &oinfo); +	error = xfs_free_extent_later(cur->bc_tp, fsbno, 1, &oinfo, +			XFS_AG_RESV_NONE);  	if (error)  		return error; diff --git a/fs/xfs/libxfs/xfs_da_format.h b/fs/xfs/libxfs/xfs_da_format.h index 25e2841084e1..f9015f88eca7 100644 --- a/fs/xfs/libxfs/xfs_da_format.h +++ b/fs/xfs/libxfs/xfs_da_format.h @@ -591,7 +591,7 @@ struct xfs_attr_shortform {  		uint8_t valuelen;	/* actual length of value (no NULL) */  		uint8_t flags;	/* flags bits (see xfs_attr_leaf.h) */  		uint8_t nameval[];	/* name & value bytes concatenated */ -	} list[1];			/* variable sized array */ +	} list[];			/* variable sized array */  };  typedef struct xfs_attr_leaf_map {	/* RLE map of free bytes */ @@ -620,19 +620,29 @@ typedef struct xfs_attr_leaf_entry {	/* sorted on key, not name */  typedef struct xfs_attr_leaf_name_local {  	__be16	valuelen;		/* number of bytes in value */  	__u8	namelen;		/* length of name bytes */ -	__u8	nameval[1];		/* name/value bytes */ +	/* +	 * In Linux 6.5 this flex array was converted from nameval[1] to +	 * nameval[].  Be very careful here about extra padding at the end; +	 * see xfs_attr_leaf_entsize_local() for details. +	 */ +	__u8	nameval[];		/* name/value bytes */  } xfs_attr_leaf_name_local_t;  typedef struct xfs_attr_leaf_name_remote {  	__be32	valueblk;		/* block number of value bytes */  	__be32	valuelen;		/* number of bytes in value */  	__u8	namelen;		/* length of name bytes */ -	__u8	name[1];		/* name bytes */ +	/* +	 * In Linux 6.5 this flex array was converted from name[1] to name[]. +	 * Be very careful here about extra padding at the end; see +	 * xfs_attr_leaf_entsize_remote() for details. +	 */ +	__u8	name[];			/* name bytes */  } xfs_attr_leaf_name_remote_t;  typedef struct xfs_attr_leafblock {  	xfs_attr_leaf_hdr_t	hdr;	/* constant-structure header block */ -	xfs_attr_leaf_entry_t	entries[1];	/* sorted on key, not name */ +	xfs_attr_leaf_entry_t	entries[];	/* sorted on key, not name */  	/*  	 * The rest of the block contains the following structures after the  	 * leaf entries, growing from the bottom up. The variables are never @@ -664,7 +674,7 @@ struct xfs_attr3_leaf_hdr {  struct xfs_attr3_leafblock {  	struct xfs_attr3_leaf_hdr	hdr; -	struct xfs_attr_leaf_entry	entries[1]; +	struct xfs_attr_leaf_entry	entries[];  	/*  	 * The rest of the block contains the following structures after the @@ -747,14 +757,61 @@ xfs_attr3_leaf_name_local(xfs_attr_leafblock_t *leafp, int idx)   */  static inline int xfs_attr_leaf_entsize_remote(int nlen)  { -	return round_up(sizeof(struct xfs_attr_leaf_name_remote) - 1 + -			nlen, XFS_ATTR_LEAF_NAME_ALIGN); +	/* +	 * Prior to Linux 6.5, struct xfs_attr_leaf_name_remote ended with +	 * name[1], which was used as a flexarray.  The layout of this struct +	 * is 9 bytes of fixed-length fields followed by a __u8 flex array at +	 * offset 9. +	 * +	 * On most architectures, struct xfs_attr_leaf_name_remote had two +	 * bytes of implicit padding at the end of the struct to make the +	 * struct length 12.  After converting name[1] to name[], there are +	 * three implicit padding bytes and the struct size remains 12. +	 * However, there are compiler configurations that do not add implicit +	 * padding at all (m68k) and have been broken for years. +	 * +	 * This entsize computation historically added (the xattr name length) +	 * to (the padded struct length - 1) and rounded that sum up to the +	 * nearest multiple of 4 (NAME_ALIGN).  IOWs, round_up(11 + nlen, 4). +	 * This is encoded in the ondisk format, so we cannot change this. +	 * +	 * Compute the entsize from offsetof of the flexarray and manually +	 * adding bytes for the implicit padding. +	 */ +	const size_t remotesize = +			offsetof(struct xfs_attr_leaf_name_remote, name) + 2; + +	return round_up(remotesize + nlen, XFS_ATTR_LEAF_NAME_ALIGN);  }  static inline int xfs_attr_leaf_entsize_local(int nlen, int vlen)  { -	return round_up(sizeof(struct xfs_attr_leaf_name_local) - 1 + -			nlen + vlen, XFS_ATTR_LEAF_NAME_ALIGN); +	/* +	 * Prior to Linux 6.5, struct xfs_attr_leaf_name_local ended with +	 * nameval[1], which was used as a flexarray.  The layout of this +	 * struct is 3 bytes of fixed-length fields followed by a __u8 flex +	 * array at offset 3. +	 * +	 * struct xfs_attr_leaf_name_local had zero bytes of implicit padding +	 * at the end of the struct to make the struct length 4.  On most +	 * architectures, after converting nameval[1] to nameval[], there is +	 * one implicit padding byte and the struct size remains 4.  However, +	 * there are compiler configurations that do not add implicit padding +	 * at all (m68k) and would break. +	 * +	 * This entsize computation historically added (the xattr name and +	 * value length) to (the padded struct length - 1) and rounded that sum +	 * up to the nearest multiple of 4 (NAME_ALIGN).  IOWs, the formula is +	 * round_up(3 + nlen + vlen, 4).  This is encoded in the ondisk format, +	 * so we cannot change this. +	 * +	 * Compute the entsize from offsetof of the flexarray and manually +	 * adding bytes for the implicit padding. +	 */ +	const size_t localsize = +			offsetof(struct xfs_attr_leaf_name_local, nameval); + +	return round_up(localsize + nlen + vlen, XFS_ATTR_LEAF_NAME_ALIGN);  }  static inline int xfs_attr_leaf_entsize_local_max(int bsize) diff --git a/fs/xfs/libxfs/xfs_fs.h b/fs/xfs/libxfs/xfs_fs.h index 9c60ebb328b4..2cbf9ea39b8c 100644 --- a/fs/xfs/libxfs/xfs_fs.h +++ b/fs/xfs/libxfs/xfs_fs.h @@ -592,12 +592,12 @@ typedef struct xfs_attrlist_cursor {  struct xfs_attrlist {  	__s32	al_count;	/* number of entries in attrlist */  	__s32	al_more;	/* T/F: more attrs (do call again) */ -	__s32	al_offset[1];	/* byte offsets of attrs [var-sized] */ +	__s32	al_offset[];	/* byte offsets of attrs [var-sized] */  };  struct xfs_attrlist_ent {	/* data from attr_list() */  	__u32	a_valuelen;	/* number bytes in value of attr */ -	char	a_name[1];	/* attr name (NULL terminated) */ +	char	a_name[];	/* attr name (NULL terminated) */  };  typedef struct xfs_fsop_attrlist_handlereq { diff --git a/fs/xfs/libxfs/xfs_ialloc.c b/fs/xfs/libxfs/xfs_ialloc.c index 34600f94c2f4..b83e54c70906 100644 --- a/fs/xfs/libxfs/xfs_ialloc.c +++ b/fs/xfs/libxfs/xfs_ialloc.c @@ -1853,8 +1853,8 @@ xfs_difree_inode_chunk(  		/* not sparse, calculate extent info directly */  		return xfs_free_extent_later(tp,  				XFS_AGB_TO_FSB(mp, agno, sagbno), -				M_IGEO(mp)->ialloc_blks, -				&XFS_RMAP_OINFO_INODES); +				M_IGEO(mp)->ialloc_blks, &XFS_RMAP_OINFO_INODES, +				XFS_AG_RESV_NONE);  	}  	/* holemask is only 16-bits (fits in an unsigned long) */ @@ -1899,8 +1899,8 @@ xfs_difree_inode_chunk(  		ASSERT(agbno % mp->m_sb.sb_spino_align == 0);  		ASSERT(contigblk % mp->m_sb.sb_spino_align == 0);  		error = xfs_free_extent_later(tp, -				XFS_AGB_TO_FSB(mp, agno, agbno), -				contigblk, &XFS_RMAP_OINFO_INODES); +				XFS_AGB_TO_FSB(mp, agno, agbno), contigblk, +				&XFS_RMAP_OINFO_INODES, XFS_AG_RESV_NONE);  		if (error)  			return error; @@ -2486,11 +2486,14 @@ xfs_ialloc_log_agi(  static xfs_failaddr_t  xfs_agi_verify( -	struct xfs_buf	*bp) +	struct xfs_buf		*bp)  { -	struct xfs_mount *mp = bp->b_mount; -	struct xfs_agi	*agi = bp->b_addr; -	int		i; +	struct xfs_mount	*mp = bp->b_mount; +	struct xfs_agi		*agi = bp->b_addr; +	xfs_failaddr_t		fa; +	uint32_t		agi_seqno = be32_to_cpu(agi->agi_seqno); +	uint32_t		agi_length = be32_to_cpu(agi->agi_length); +	int			i;  	if (xfs_has_crc(mp)) {  		if (!uuid_equal(&agi->agi_uuid, &mp->m_sb.sb_meta_uuid)) @@ -2507,6 +2510,10 @@ xfs_agi_verify(  	if (!XFS_AGI_GOOD_VERSION(be32_to_cpu(agi->agi_versionnum)))  		return __this_address; +	fa = xfs_validate_ag_length(bp, agi_seqno, agi_length); +	if (fa) +		return fa; +  	if (be32_to_cpu(agi->agi_level) < 1 ||  	    be32_to_cpu(agi->agi_level) > M_IGEO(mp)->inobt_maxlevels)  		return __this_address; @@ -2516,15 +2523,6 @@ xfs_agi_verify(  	     be32_to_cpu(agi->agi_free_level) > M_IGEO(mp)->inobt_maxlevels))  		return __this_address; -	/* -	 * during growfs operations, the perag is not fully initialised, -	 * so we can't use it for any useful checking. growfs ensures we can't -	 * use it by using uncached buffers that don't have the perag attached -	 * so we can detect and avoid this problem. -	 */ -	if (bp->b_pag && be32_to_cpu(agi->agi_seqno) != bp->b_pag->pag_agno) -		return __this_address; -  	for (i = 0; i < XFS_AGI_UNLINKED_BUCKETS; i++) {  		if (agi->agi_unlinked[i] == cpu_to_be32(NULLAGINO))  			continue; diff --git a/fs/xfs/libxfs/xfs_ialloc_btree.c b/fs/xfs/libxfs/xfs_ialloc_btree.c index 5a945ae21b5d..9258f01c0015 100644 --- a/fs/xfs/libxfs/xfs_ialloc_btree.c +++ b/fs/xfs/libxfs/xfs_ialloc_btree.c @@ -160,8 +160,7 @@ __xfs_inobt_free_block(  	xfs_inobt_mod_blockcount(cur, -1);  	fsbno = XFS_DADDR_TO_FSB(cur->bc_mp, xfs_buf_daddr(bp)); -	return xfs_free_extent(cur->bc_tp, cur->bc_ag.pag, -			XFS_FSB_TO_AGBNO(cur->bc_mp, fsbno), 1, +	return xfs_free_extent_later(cur->bc_tp, fsbno, 1,  			&XFS_RMAP_OINFO_INOBT, resv);  } diff --git a/fs/xfs/libxfs/xfs_refcount.c b/fs/xfs/libxfs/xfs_refcount.c index b6e21433925c..646b3fa362ad 100644 --- a/fs/xfs/libxfs/xfs_refcount.c +++ b/fs/xfs/libxfs/xfs_refcount.c @@ -1152,7 +1152,8 @@ xfs_refcount_adjust_extents(  						cur->bc_ag.pag->pag_agno,  						tmp.rc_startblock);  				error = xfs_free_extent_later(cur->bc_tp, fsbno, -						  tmp.rc_blockcount, NULL); +						  tmp.rc_blockcount, NULL, +						  XFS_AG_RESV_NONE);  				if (error)  					goto out_error;  			} @@ -1213,7 +1214,8 @@ xfs_refcount_adjust_extents(  					cur->bc_ag.pag->pag_agno,  					ext.rc_startblock);  			error = xfs_free_extent_later(cur->bc_tp, fsbno, -					ext.rc_blockcount, NULL); +					ext.rc_blockcount, NULL, +					XFS_AG_RESV_NONE);  			if (error)  				goto out_error;  		} @@ -1919,8 +1921,13 @@ xfs_refcount_recover_cow_leftovers(  	struct xfs_buf			*agbp;  	struct xfs_refcount_recovery	*rr, *n;  	struct list_head		debris; -	union xfs_btree_irec		low; -	union xfs_btree_irec		high; +	union xfs_btree_irec		low = { +		.rc.rc_domain		= XFS_REFC_DOMAIN_COW, +	}; +	union xfs_btree_irec		high = { +		.rc.rc_domain		= XFS_REFC_DOMAIN_COW, +		.rc.rc_startblock	= -1U, +	};  	xfs_fsblock_t			fsb;  	int				error; @@ -1951,10 +1958,6 @@ xfs_refcount_recover_cow_leftovers(  	cur = xfs_refcountbt_init_cursor(mp, tp, agbp, pag);  	/* Find all the leftover CoW staging extents. */ -	memset(&low, 0, sizeof(low)); -	memset(&high, 0, sizeof(high)); -	low.rc.rc_domain = high.rc.rc_domain = XFS_REFC_DOMAIN_COW; -	high.rc.rc_startblock = -1U;  	error = xfs_btree_query_range(cur, &low, &high,  			xfs_refcount_recover_extent, &debris);  	xfs_btree_del_cursor(cur, error); @@ -1981,7 +1984,8 @@ xfs_refcount_recover_cow_leftovers(  		/* Free the block. */  		error = xfs_free_extent_later(tp, fsb, -				rr->rr_rrec.rc_blockcount, NULL); +				rr->rr_rrec.rc_blockcount, NULL, +				XFS_AG_RESV_NONE);  		if (error)  			goto out_trans; diff --git a/fs/xfs/libxfs/xfs_refcount_btree.c b/fs/xfs/libxfs/xfs_refcount_btree.c index d4afc5f4e6a5..5c3987d8dc24 100644 --- a/fs/xfs/libxfs/xfs_refcount_btree.c +++ b/fs/xfs/libxfs/xfs_refcount_btree.c @@ -106,19 +106,13 @@ xfs_refcountbt_free_block(  	struct xfs_buf		*agbp = cur->bc_ag.agbp;  	struct xfs_agf		*agf = agbp->b_addr;  	xfs_fsblock_t		fsbno = XFS_DADDR_TO_FSB(mp, xfs_buf_daddr(bp)); -	int			error;  	trace_xfs_refcountbt_free_block(cur->bc_mp, cur->bc_ag.pag->pag_agno,  			XFS_FSB_TO_AGBNO(cur->bc_mp, fsbno), 1);  	be32_add_cpu(&agf->agf_refcount_blocks, -1);  	xfs_alloc_log_agf(cur->bc_tp, agbp, XFS_AGF_REFCOUNT_BLOCKS); -	error = xfs_free_extent(cur->bc_tp, cur->bc_ag.pag, -			XFS_FSB_TO_AGBNO(cur->bc_mp, fsbno), 1, +	return xfs_free_extent_later(cur->bc_tp, fsbno, 1,  			&XFS_RMAP_OINFO_REFC, XFS_AG_RESV_METADATA); -	if (error) -		return error; - -	return error;  }  STATIC int diff --git a/fs/xfs/libxfs/xfs_rmap.c b/fs/xfs/libxfs/xfs_rmap.c index f4dc23b3b837..fbb0b2637463 100644 --- a/fs/xfs/libxfs/xfs_rmap.c +++ b/fs/xfs/libxfs/xfs_rmap.c @@ -2389,14 +2389,10 @@ xfs_rmap_query_range(  	xfs_rmap_query_range_fn			fn,  	void					*priv)  { -	union xfs_btree_irec			low_brec; -	union xfs_btree_irec			high_brec; -	struct xfs_rmap_query_range_info	query; +	union xfs_btree_irec			low_brec = { .r = *low_rec }; +	union xfs_btree_irec			high_brec = { .r = *high_rec }; +	struct xfs_rmap_query_range_info	query = { .priv = priv, .fn = fn }; -	low_brec.r = *low_rec; -	high_brec.r = *high_rec; -	query.priv = priv; -	query.fn = fn;  	return xfs_btree_query_range(cur, &low_brec, &high_brec,  			xfs_rmap_query_range_helper, &query);  } diff --git a/fs/xfs/libxfs/xfs_sb.c b/fs/xfs/libxfs/xfs_sb.c index ba0f17bc1dc0..5e174685a77c 100644 --- a/fs/xfs/libxfs/xfs_sb.c +++ b/fs/xfs/libxfs/xfs_sb.c @@ -412,7 +412,6 @@ xfs_validate_sb_common(  	    sbp->sb_inodelog < XFS_DINODE_MIN_LOG			||  	    sbp->sb_inodelog > XFS_DINODE_MAX_LOG			||  	    sbp->sb_inodesize != (1 << sbp->sb_inodelog)		|| -	    sbp->sb_logsunit > XLOG_MAX_RECORD_BSIZE			||  	    sbp->sb_inopblock != howmany(sbp->sb_blocksize,sbp->sb_inodesize) ||  	    XFS_FSB_TO_B(mp, sbp->sb_agblocks) < XFS_MIN_AG_BYTES	||  	    XFS_FSB_TO_B(mp, sbp->sb_agblocks) > XFS_MAX_AG_BYTES	|| @@ -430,6 +429,61 @@ xfs_validate_sb_common(  		return -EFSCORRUPTED;  	} +	/* +	 * Logs that are too large are not supported at all. Reject them +	 * outright. Logs that are too small are tolerated on v4 filesystems, +	 * but we can only check that when mounting the log. Hence we skip +	 * those checks here. +	 */ +	if (sbp->sb_logblocks > XFS_MAX_LOG_BLOCKS) { +		xfs_notice(mp, +		"Log size 0x%x blocks too large, maximum size is 0x%llx blocks", +			 sbp->sb_logblocks, XFS_MAX_LOG_BLOCKS); +		return -EFSCORRUPTED; +	} + +	if (XFS_FSB_TO_B(mp, sbp->sb_logblocks) > XFS_MAX_LOG_BYTES) { +		xfs_warn(mp, +		"log size 0x%llx bytes too large, maximum size is 0x%llx bytes", +			 XFS_FSB_TO_B(mp, sbp->sb_logblocks), +			 XFS_MAX_LOG_BYTES); +		return -EFSCORRUPTED; +	} + +	/* +	 * Do not allow filesystems with corrupted log sector or stripe units to +	 * be mounted. We cannot safely size the iclogs or write to the log if +	 * the log stripe unit is not valid. +	 */ +	if (sbp->sb_versionnum & XFS_SB_VERSION_SECTORBIT) { +		if (sbp->sb_logsectsize != (1U << sbp->sb_logsectlog)) { +			xfs_notice(mp, +			"log sector size in bytes/log2 (0x%x/0x%x) must match", +				sbp->sb_logsectsize, 1U << sbp->sb_logsectlog); +			return -EFSCORRUPTED; +		} +	} else if (sbp->sb_logsectsize || sbp->sb_logsectlog) { +		xfs_notice(mp, +		"log sector size in bytes/log2 (0x%x/0x%x) are not zero", +			sbp->sb_logsectsize, sbp->sb_logsectlog); +		return -EFSCORRUPTED; +	} + +	if (sbp->sb_logsunit > 1) { +		if (sbp->sb_logsunit % sbp->sb_blocksize) { +			xfs_notice(mp, +		"log stripe unit 0x%x bytes must be a multiple of block size", +				sbp->sb_logsunit); +			return -EFSCORRUPTED; +		} +		if (sbp->sb_logsunit > XLOG_MAX_RECORD_BSIZE) { +			xfs_notice(mp, +		"log stripe unit 0x%x bytes over maximum size (0x%x bytes)", +				sbp->sb_logsunit, XLOG_MAX_RECORD_BSIZE); +			return -EFSCORRUPTED; +		} +	} +  	/* Validate the realtime geometry; stolen from xfs_repair */  	if (sbp->sb_rextsize * sbp->sb_blocksize > XFS_MAX_RTEXTSIZE ||  	    sbp->sb_rextsize * sbp->sb_blocksize < XFS_MIN_RTEXTSIZE) { | 
