diff options
Diffstat (limited to 'fs/xfs/libxfs/xfs_ialloc.c')
| -rw-r--r-- | fs/xfs/libxfs/xfs_ialloc.c | 245 | 
1 files changed, 163 insertions, 82 deletions
diff --git a/fs/xfs/libxfs/xfs_ialloc.c b/fs/xfs/libxfs/xfs_ialloc.c index fe9898875097..04377ab75863 100644 --- a/fs/xfs/libxfs/xfs_ialloc.c +++ b/fs/xfs/libxfs/xfs_ialloc.c @@ -12,17 +12,14 @@  #include "xfs_bit.h"  #include "xfs_sb.h"  #include "xfs_mount.h" -#include "xfs_defer.h"  #include "xfs_inode.h"  #include "xfs_btree.h"  #include "xfs_ialloc.h"  #include "xfs_ialloc_btree.h"  #include "xfs_alloc.h" -#include "xfs_rtalloc.h"  #include "xfs_errortag.h"  #include "xfs_error.h"  #include "xfs_bmap.h" -#include "xfs_cksum.h"  #include "xfs_trans.h"  #include "xfs_buf_item.h"  #include "xfs_icreate_item.h" @@ -31,20 +28,6 @@  #include "xfs_log.h"  #include "xfs_rmap.h" - -/* - * Allocation group level functions. - */ -int -xfs_ialloc_cluster_alignment( -	struct xfs_mount	*mp) -{ -	if (xfs_sb_version_hasalign(&mp->m_sb) && -	    mp->m_sb.sb_inoalignmt >= xfs_icluster_size_fsb(mp)) -		return mp->m_sb.sb_inoalignmt; -	return 1; -} -  /*   * Lookup a record by ino in the btree given by cur.   */ @@ -299,7 +282,7 @@ xfs_ialloc_inode_init(  	 * sizes, manipulate the inodes in buffers  which are multiples of the  	 * blocks size.  	 */ -	nbufs = length / mp->m_blocks_per_cluster; +	nbufs = length / M_IGEO(mp)->blocks_per_cluster;  	/*  	 * Figure out what version number to use in the inodes we create.  If @@ -343,9 +326,10 @@ xfs_ialloc_inode_init(  		 * Get the block.  		 */  		d = XFS_AGB_TO_DADDR(mp, agno, agbno + -				(j * mp->m_blocks_per_cluster)); +				(j * M_IGEO(mp)->blocks_per_cluster));  		fbuf = xfs_trans_get_buf(tp, mp->m_ddev_targp, d, -					 mp->m_bsize * mp->m_blocks_per_cluster, +					 mp->m_bsize * +					 M_IGEO(mp)->blocks_per_cluster,  					 XBF_UNMAPPED);  		if (!fbuf)  			return -ENOMEM; @@ -353,7 +337,7 @@ xfs_ialloc_inode_init(  		/* Initialize the inode buffers and log them appropriately. */  		fbuf->b_ops = &xfs_inode_buf_ops;  		xfs_buf_zero(fbuf, 0, BBTOB(fbuf->b_length)); -		for (i = 0; i < mp->m_inodes_per_cluster; i++) { +		for (i = 0; i < M_IGEO(mp)->inodes_per_cluster; i++) {  			int	ioffset = i << mp->m_sb.sb_inodelog;  			uint	isize = xfs_dinode_size(version); @@ -616,24 +600,26 @@ error:   * Allocate new inodes in the allocation group specified by agbp.   * Return 0 for success, else error code.   */ -STATIC int				/* error code or 0 */ +STATIC int  xfs_ialloc_ag_alloc( -	xfs_trans_t	*tp,		/* transaction pointer */ -	xfs_buf_t	*agbp,		/* alloc group buffer */ -	int		*alloc) +	struct xfs_trans	*tp, +	struct xfs_buf		*agbp, +	int			*alloc)  { -	xfs_agi_t	*agi;		/* allocation group header */ -	xfs_alloc_arg_t	args;		/* allocation argument structure */ -	xfs_agnumber_t	agno; -	int		error; -	xfs_agino_t	newino;		/* new first inode's number */ -	xfs_agino_t	newlen;		/* new number of inodes */ -	int		isaligned = 0;	/* inode allocation at stripe unit */ -					/* boundary */ -	uint16_t	allocmask = (uint16_t) -1; /* init. to full chunk */ +	struct xfs_agi		*agi; +	struct xfs_alloc_arg	args; +	xfs_agnumber_t		agno; +	int			error; +	xfs_agino_t		newino;		/* new first inode's number */ +	xfs_agino_t		newlen;		/* new number of inodes */ +	int			isaligned = 0;	/* inode allocation at stripe */ +						/* unit boundary */ +	/* init. to full chunk */ +	uint16_t		allocmask = (uint16_t) -1;  	struct xfs_inobt_rec_incore rec; -	struct xfs_perag *pag; -	int		do_sparse = 0; +	struct xfs_perag	*pag; +	struct xfs_ino_geometry	*igeo = M_IGEO(tp->t_mountp); +	int			do_sparse = 0;  	memset(&args, 0, sizeof(args));  	args.tp = tp; @@ -644,7 +630,7 @@ xfs_ialloc_ag_alloc(  #ifdef DEBUG  	/* randomly do sparse inode allocations */  	if (xfs_sb_version_hassparseinodes(&tp->t_mountp->m_sb) && -	    args.mp->m_ialloc_min_blks < args.mp->m_ialloc_blks) +	    igeo->ialloc_min_blks < igeo->ialloc_blks)  		do_sparse = prandom_u32() & 1;  #endif @@ -652,12 +638,12 @@ xfs_ialloc_ag_alloc(  	 * Locking will ensure that we don't have two callers in here  	 * at one time.  	 */ -	newlen = args.mp->m_ialloc_inos; -	if (args.mp->m_maxicount && +	newlen = igeo->ialloc_inos; +	if (igeo->maxicount &&  	    percpu_counter_read_positive(&args.mp->m_icount) + newlen > -							args.mp->m_maxicount) +							igeo->maxicount)  		return -ENOSPC; -	args.minlen = args.maxlen = args.mp->m_ialloc_blks; +	args.minlen = args.maxlen = igeo->ialloc_blks;  	/*  	 * First try to allocate inodes contiguous with the last-allocated  	 * chunk of inodes.  If the filesystem is striped, this will fill @@ -667,7 +653,7 @@ xfs_ialloc_ag_alloc(  	newino = be32_to_cpu(agi->agi_newino);  	agno = be32_to_cpu(agi->agi_seqno);  	args.agbno = XFS_AGINO_TO_AGBNO(args.mp, newino) + -		     args.mp->m_ialloc_blks; +		     igeo->ialloc_blks;  	if (do_sparse)  		goto sparse_alloc;  	if (likely(newino != NULLAGINO && @@ -690,10 +676,10 @@ xfs_ialloc_ag_alloc(  		 * but not to use them in the actual exact allocation.  		 */  		args.alignment = 1; -		args.minalignslop = args.mp->m_cluster_align - 1; +		args.minalignslop = igeo->cluster_align - 1;  		/* Allow space for the inode btree to split. */ -		args.minleft = args.mp->m_in_maxlevels - 1; +		args.minleft = igeo->inobt_maxlevels - 1;  		if ((error = xfs_alloc_vextent(&args)))  			return error; @@ -720,12 +706,12 @@ xfs_ialloc_ag_alloc(  		 * pieces, so don't need alignment anyway.  		 */  		isaligned = 0; -		if (args.mp->m_sinoalign) { +		if (igeo->ialloc_align) {  			ASSERT(!(args.mp->m_flags & XFS_MOUNT_NOALIGN));  			args.alignment = args.mp->m_dalign;  			isaligned = 1;  		} else -			args.alignment = args.mp->m_cluster_align; +			args.alignment = igeo->cluster_align;  		/*  		 * Need to figure out where to allocate the inode blocks.  		 * Ideally they should be spaced out through the a.g. @@ -741,7 +727,7 @@ xfs_ialloc_ag_alloc(  		/*  		 * Allow space for the inode btree to split.  		 */ -		args.minleft = args.mp->m_in_maxlevels - 1; +		args.minleft = igeo->inobt_maxlevels - 1;  		if ((error = xfs_alloc_vextent(&args)))  			return error;  	} @@ -754,7 +740,7 @@ xfs_ialloc_ag_alloc(  		args.type = XFS_ALLOCTYPE_NEAR_BNO;  		args.agbno = be32_to_cpu(agi->agi_root);  		args.fsbno = XFS_AGB_TO_FSB(args.mp, agno, args.agbno); -		args.alignment = args.mp->m_cluster_align; +		args.alignment = igeo->cluster_align;  		if ((error = xfs_alloc_vextent(&args)))  			return error;  	} @@ -764,7 +750,7 @@ xfs_ialloc_ag_alloc(  	 * the sparse allocation length is smaller than a full chunk.  	 */  	if (xfs_sb_version_hassparseinodes(&args.mp->m_sb) && -	    args.mp->m_ialloc_min_blks < args.mp->m_ialloc_blks && +	    igeo->ialloc_min_blks < igeo->ialloc_blks &&  	    args.fsbno == NULLFSBLOCK) {  sparse_alloc:  		args.type = XFS_ALLOCTYPE_NEAR_BNO; @@ -773,7 +759,7 @@ sparse_alloc:  		args.alignment = args.mp->m_sb.sb_spino_align;  		args.prod = 1; -		args.minlen = args.mp->m_ialloc_min_blks; +		args.minlen = igeo->ialloc_min_blks;  		args.maxlen = args.minlen;  		/* @@ -789,7 +775,7 @@ sparse_alloc:  		args.min_agbno = args.mp->m_sb.sb_inoalignmt;  		args.max_agbno = round_down(args.mp->m_sb.sb_agblocks,  					    args.mp->m_sb.sb_inoalignmt) - -				 args.mp->m_ialloc_blks; +				 igeo->ialloc_blks;  		error = xfs_alloc_vextent(&args);  		if (error) @@ -1006,7 +992,7 @@ xfs_ialloc_ag_select(  		 * space needed for alignment of inode chunks when checking the  		 * longest contiguous free space in the AG - this prevents us  		 * from getting ENOSPC because we have free space larger than -		 * m_ialloc_blks but alignment constraints prevent us from using +		 * ialloc_blks but alignment constraints prevent us from using  		 * it.  		 *  		 * If we can't find an AG with space for full alignment slack to @@ -1015,9 +1001,9 @@ xfs_ialloc_ag_select(  		 * if we fail allocation due to alignment issues then it is most  		 * likely a real ENOSPC condition.  		 */ -		ineed = mp->m_ialloc_min_blks; +		ineed = M_IGEO(mp)->ialloc_min_blks;  		if (flags && ineed > 1) -			ineed += mp->m_cluster_align; +			ineed += M_IGEO(mp)->cluster_align;  		longest = pag->pagf_longest;  		if (!longest)  			longest = pag->pagf_flcount > 0; @@ -1703,6 +1689,7 @@ xfs_dialloc(  	int			noroom = 0;  	xfs_agnumber_t		start_agno;  	struct xfs_perag	*pag; +	struct xfs_ino_geometry	*igeo = M_IGEO(mp);  	int			okalloc = 1;  	if (*IO_agbp) { @@ -1733,9 +1720,9 @@ xfs_dialloc(  	 * Read rough value of mp->m_icount by percpu_counter_read_positive,  	 * which will sacrifice the preciseness but improve the performance.  	 */ -	if (mp->m_maxicount && -	    percpu_counter_read_positive(&mp->m_icount) + mp->m_ialloc_inos -							> mp->m_maxicount) { +	if (igeo->maxicount && +	    percpu_counter_read_positive(&mp->m_icount) + igeo->ialloc_inos +							> igeo->maxicount) {  		noroom = 1;  		okalloc = 0;  	} @@ -1852,7 +1839,8 @@ xfs_difree_inode_chunk(  	if (!xfs_inobt_issparse(rec->ir_holemask)) {  		/* not sparse, calculate extent info directly */  		xfs_bmap_add_free(tp, XFS_AGB_TO_FSB(mp, agno, sagbno), -				  mp->m_ialloc_blks, &XFS_RMAP_OINFO_INODES); +				  M_IGEO(mp)->ialloc_blks, +				  &XFS_RMAP_OINFO_INODES);  		return;  	} @@ -2261,7 +2249,7 @@ xfs_imap_lookup(  	/* check that the returned record contains the required inode */  	if (rec.ir_startino > agino || -	    rec.ir_startino + mp->m_ialloc_inos <= agino) +	    rec.ir_startino + M_IGEO(mp)->ialloc_inos <= agino)  		return -EINVAL;  	/* for untrusted inodes check it is allocated first */ @@ -2352,7 +2340,7 @@ xfs_imap(  	 * If the inode cluster size is the same as the blocksize or  	 * smaller we get to the buffer by simple arithmetics.  	 */ -	if (mp->m_blocks_per_cluster == 1) { +	if (M_IGEO(mp)->blocks_per_cluster == 1) {  		offset = XFS_INO_TO_OFFSET(mp, ino);  		ASSERT(offset < mp->m_sb.sb_inopblock); @@ -2368,8 +2356,8 @@ xfs_imap(  	 * find the location. Otherwise we have to do a btree  	 * lookup to find the location.  	 */ -	if (mp->m_inoalign_mask) { -		offset_agbno = agbno & mp->m_inoalign_mask; +	if (M_IGEO(mp)->inoalign_mask) { +		offset_agbno = agbno & M_IGEO(mp)->inoalign_mask;  		chunk_agbno = agbno - offset_agbno;  	} else {  		error = xfs_imap_lookup(mp, tp, agno, agino, agbno, @@ -2381,13 +2369,13 @@ xfs_imap(  out_map:  	ASSERT(agbno >= chunk_agbno);  	cluster_agbno = chunk_agbno + -		((offset_agbno / mp->m_blocks_per_cluster) * -		 mp->m_blocks_per_cluster); +		((offset_agbno / M_IGEO(mp)->blocks_per_cluster) * +		 M_IGEO(mp)->blocks_per_cluster);  	offset = ((agbno - cluster_agbno) * mp->m_sb.sb_inopblock) +  		XFS_INO_TO_OFFSET(mp, ino);  	imap->im_blkno = XFS_AGB_TO_DADDR(mp, agno, cluster_agbno); -	imap->im_len = XFS_FSB_TO_BB(mp, mp->m_blocks_per_cluster); +	imap->im_len = XFS_FSB_TO_BB(mp, M_IGEO(mp)->blocks_per_cluster);  	imap->im_boffset = (unsigned short)(offset << mp->m_sb.sb_inodelog);  	/* @@ -2409,20 +2397,6 @@ out_map:  }  /* - * Compute and fill in value of m_in_maxlevels. - */ -void -xfs_ialloc_compute_maxlevels( -	xfs_mount_t	*mp)		/* file system mount structure */ -{ -	uint		inodes; - -	inodes = (1LL << XFS_INO_AGINO_BITS(mp)) >> XFS_INODES_PER_CHUNK_LOG; -	mp->m_in_maxlevels = xfs_btree_compute_maxlevels(mp->m_inobt_mnr, -							 inodes); -} - -/*   * Log specified fields for the ag hdr (inode section). The growth of the agi   * structure over time requires that we interpret the buffer as two logical   * regions delineated by the end of the unlinked list. This is due to the size @@ -2493,7 +2467,7 @@ static xfs_failaddr_t  xfs_agi_verify(  	struct xfs_buf	*bp)  { -	struct xfs_mount *mp = bp->b_target->bt_mount; +	struct xfs_mount *mp = bp->b_mount;  	struct xfs_agi	*agi = XFS_BUF_TO_AGI(bp);  	int		i; @@ -2545,7 +2519,7 @@ static void  xfs_agi_read_verify(  	struct xfs_buf	*bp)  { -	struct xfs_mount *mp = bp->b_target->bt_mount; +	struct xfs_mount *mp = bp->b_mount;  	xfs_failaddr_t	fa;  	if (xfs_sb_version_hascrc(&mp->m_sb) && @@ -2562,7 +2536,7 @@ static void  xfs_agi_write_verify(  	struct xfs_buf	*bp)  { -	struct xfs_mount	*mp = bp->b_target->bt_mount; +	struct xfs_mount	*mp = bp->b_mount;  	struct xfs_buf_log_item	*bip = bp->b_log_item;  	xfs_failaddr_t		fa; @@ -2768,3 +2742,110 @@ xfs_ialloc_count_inodes(  	*freecount = ci.freecount;  	return 0;  } + +/* + * Initialize inode-related geometry information. + * + * Compute the inode btree min and max levels and set maxicount. + * + * Set the inode cluster size.  This may still be overridden by the file + * system block size if it is larger than the chosen cluster size. + * + * For v5 filesystems, scale the cluster size with the inode size to keep a + * constant ratio of inode per cluster buffer, but only if mkfs has set the + * inode alignment value appropriately for larger cluster sizes. + * + * Then compute the inode cluster alignment information. + */ +void +xfs_ialloc_setup_geometry( +	struct xfs_mount	*mp) +{ +	struct xfs_sb		*sbp = &mp->m_sb; +	struct xfs_ino_geometry	*igeo = M_IGEO(mp); +	uint64_t		icount; +	uint			inodes; + +	/* Compute inode btree geometry. */ +	igeo->agino_log = sbp->sb_inopblog + sbp->sb_agblklog; +	igeo->inobt_mxr[0] = xfs_inobt_maxrecs(mp, sbp->sb_blocksize, 1); +	igeo->inobt_mxr[1] = xfs_inobt_maxrecs(mp, sbp->sb_blocksize, 0); +	igeo->inobt_mnr[0] = igeo->inobt_mxr[0] / 2; +	igeo->inobt_mnr[1] = igeo->inobt_mxr[1] / 2; + +	igeo->ialloc_inos = max_t(uint16_t, XFS_INODES_PER_CHUNK, +			sbp->sb_inopblock); +	igeo->ialloc_blks = igeo->ialloc_inos >> sbp->sb_inopblog; + +	if (sbp->sb_spino_align) +		igeo->ialloc_min_blks = sbp->sb_spino_align; +	else +		igeo->ialloc_min_blks = igeo->ialloc_blks; + +	/* Compute and fill in value of m_ino_geo.inobt_maxlevels. */ +	inodes = (1LL << XFS_INO_AGINO_BITS(mp)) >> XFS_INODES_PER_CHUNK_LOG; +	igeo->inobt_maxlevels = xfs_btree_compute_maxlevels(igeo->inobt_mnr, +			inodes); + +	/* Set the maximum inode count for this filesystem. */ +	if (sbp->sb_imax_pct) { +		/* +		 * Make sure the maximum inode count is a multiple +		 * of the units we allocate inodes in. +		 */ +		icount = sbp->sb_dblocks * sbp->sb_imax_pct; +		do_div(icount, 100); +		do_div(icount, igeo->ialloc_blks); +		igeo->maxicount = XFS_FSB_TO_INO(mp, +				icount * igeo->ialloc_blks); +	} else { +		igeo->maxicount = 0; +	} + +	/* +	 * Compute the desired size of an inode cluster buffer size, which +	 * starts at 8K and (on v5 filesystems) scales up with larger inode +	 * sizes. +	 * +	 * Preserve the desired inode cluster size because the sparse inodes +	 * feature uses that desired size (not the actual size) to compute the +	 * sparse inode alignment.  The mount code validates this value, so we +	 * cannot change the behavior. +	 */ +	igeo->inode_cluster_size_raw = XFS_INODE_BIG_CLUSTER_SIZE; +	if (xfs_sb_version_hascrc(&mp->m_sb)) { +		int	new_size = igeo->inode_cluster_size_raw; + +		new_size *= mp->m_sb.sb_inodesize / XFS_DINODE_MIN_SIZE; +		if (mp->m_sb.sb_inoalignmt >= XFS_B_TO_FSBT(mp, new_size)) +			igeo->inode_cluster_size_raw = new_size; +	} + +	/* Calculate inode cluster ratios. */ +	if (igeo->inode_cluster_size_raw > mp->m_sb.sb_blocksize) +		igeo->blocks_per_cluster = XFS_B_TO_FSBT(mp, +				igeo->inode_cluster_size_raw); +	else +		igeo->blocks_per_cluster = 1; +	igeo->inode_cluster_size = XFS_FSB_TO_B(mp, igeo->blocks_per_cluster); +	igeo->inodes_per_cluster = XFS_FSB_TO_INO(mp, igeo->blocks_per_cluster); + +	/* Calculate inode cluster alignment. */ +	if (xfs_sb_version_hasalign(&mp->m_sb) && +	    mp->m_sb.sb_inoalignmt >= igeo->blocks_per_cluster) +		igeo->cluster_align = mp->m_sb.sb_inoalignmt; +	else +		igeo->cluster_align = 1; +	igeo->inoalign_mask = igeo->cluster_align - 1; +	igeo->cluster_align_inodes = XFS_FSB_TO_INO(mp, igeo->cluster_align); + +	/* +	 * If we are using stripe alignment, check whether +	 * the stripe unit is a multiple of the inode alignment +	 */ +	if (mp->m_dalign && igeo->inoalign_mask && +	    !(mp->m_dalign & igeo->inoalign_mask)) +		igeo->ialloc_align = mp->m_dalign; +	else +		igeo->ialloc_align = 0; +}  | 
