18c2ecf20Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0
28c2ecf20Sopenharmony_ci/*
38c2ecf20Sopenharmony_ci * Copyright (c) 2000-2005 Silicon Graphics, Inc.
48c2ecf20Sopenharmony_ci * Copyright (c) 2013 Red Hat, Inc.
58c2ecf20Sopenharmony_ci * All Rights Reserved.
68c2ecf20Sopenharmony_ci */
78c2ecf20Sopenharmony_ci#include "xfs.h"
88c2ecf20Sopenharmony_ci#include "xfs_fs.h"
98c2ecf20Sopenharmony_ci#include "xfs_shared.h"
108c2ecf20Sopenharmony_ci#include "xfs_format.h"
118c2ecf20Sopenharmony_ci#include "xfs_log_format.h"
128c2ecf20Sopenharmony_ci#include "xfs_trans_resv.h"
138c2ecf20Sopenharmony_ci#include "xfs_bit.h"
148c2ecf20Sopenharmony_ci#include "xfs_mount.h"
158c2ecf20Sopenharmony_ci#include "xfs_inode.h"
168c2ecf20Sopenharmony_ci#include "xfs_dir2.h"
178c2ecf20Sopenharmony_ci#include "xfs_dir2_priv.h"
188c2ecf20Sopenharmony_ci#include "xfs_trans.h"
198c2ecf20Sopenharmony_ci#include "xfs_bmap.h"
208c2ecf20Sopenharmony_ci#include "xfs_attr_leaf.h"
218c2ecf20Sopenharmony_ci#include "xfs_error.h"
228c2ecf20Sopenharmony_ci#include "xfs_trace.h"
238c2ecf20Sopenharmony_ci#include "xfs_buf_item.h"
248c2ecf20Sopenharmony_ci#include "xfs_log.h"
258c2ecf20Sopenharmony_ci
268c2ecf20Sopenharmony_ci/*
278c2ecf20Sopenharmony_ci * xfs_da_btree.c
288c2ecf20Sopenharmony_ci *
298c2ecf20Sopenharmony_ci * Routines to implement directories as Btrees of hashed names.
308c2ecf20Sopenharmony_ci */
318c2ecf20Sopenharmony_ci
328c2ecf20Sopenharmony_ci/*========================================================================
338c2ecf20Sopenharmony_ci * Function prototypes for the kernel.
348c2ecf20Sopenharmony_ci *========================================================================*/
358c2ecf20Sopenharmony_ci
368c2ecf20Sopenharmony_ci/*
378c2ecf20Sopenharmony_ci * Routines used for growing the Btree.
388c2ecf20Sopenharmony_ci */
398c2ecf20Sopenharmony_ciSTATIC int xfs_da3_root_split(xfs_da_state_t *state,
408c2ecf20Sopenharmony_ci					    xfs_da_state_blk_t *existing_root,
418c2ecf20Sopenharmony_ci					    xfs_da_state_blk_t *new_child);
428c2ecf20Sopenharmony_ciSTATIC int xfs_da3_node_split(xfs_da_state_t *state,
438c2ecf20Sopenharmony_ci					    xfs_da_state_blk_t *existing_blk,
448c2ecf20Sopenharmony_ci					    xfs_da_state_blk_t *split_blk,
458c2ecf20Sopenharmony_ci					    xfs_da_state_blk_t *blk_to_add,
468c2ecf20Sopenharmony_ci					    int treelevel,
478c2ecf20Sopenharmony_ci					    int *result);
488c2ecf20Sopenharmony_ciSTATIC void xfs_da3_node_rebalance(xfs_da_state_t *state,
498c2ecf20Sopenharmony_ci					 xfs_da_state_blk_t *node_blk_1,
508c2ecf20Sopenharmony_ci					 xfs_da_state_blk_t *node_blk_2);
518c2ecf20Sopenharmony_ciSTATIC void xfs_da3_node_add(xfs_da_state_t *state,
528c2ecf20Sopenharmony_ci				   xfs_da_state_blk_t *old_node_blk,
538c2ecf20Sopenharmony_ci				   xfs_da_state_blk_t *new_node_blk);
548c2ecf20Sopenharmony_ci
558c2ecf20Sopenharmony_ci/*
568c2ecf20Sopenharmony_ci * Routines used for shrinking the Btree.
578c2ecf20Sopenharmony_ci */
588c2ecf20Sopenharmony_ciSTATIC int xfs_da3_root_join(xfs_da_state_t *state,
598c2ecf20Sopenharmony_ci					   xfs_da_state_blk_t *root_blk);
608c2ecf20Sopenharmony_ciSTATIC int xfs_da3_node_toosmall(xfs_da_state_t *state, int *retval);
618c2ecf20Sopenharmony_ciSTATIC void xfs_da3_node_remove(xfs_da_state_t *state,
628c2ecf20Sopenharmony_ci					      xfs_da_state_blk_t *drop_blk);
638c2ecf20Sopenharmony_ciSTATIC void xfs_da3_node_unbalance(xfs_da_state_t *state,
648c2ecf20Sopenharmony_ci					 xfs_da_state_blk_t *src_node_blk,
658c2ecf20Sopenharmony_ci					 xfs_da_state_blk_t *dst_node_blk);
668c2ecf20Sopenharmony_ci
678c2ecf20Sopenharmony_ci/*
688c2ecf20Sopenharmony_ci * Utility routines.
698c2ecf20Sopenharmony_ci */
708c2ecf20Sopenharmony_ciSTATIC int	xfs_da3_blk_unlink(xfs_da_state_t *state,
718c2ecf20Sopenharmony_ci				  xfs_da_state_blk_t *drop_blk,
728c2ecf20Sopenharmony_ci				  xfs_da_state_blk_t *save_blk);
738c2ecf20Sopenharmony_ci
748c2ecf20Sopenharmony_ci
758c2ecf20Sopenharmony_cikmem_zone_t *xfs_da_state_zone;	/* anchor for state struct zone */
768c2ecf20Sopenharmony_ci
778c2ecf20Sopenharmony_ci/*
788c2ecf20Sopenharmony_ci * Allocate a dir-state structure.
798c2ecf20Sopenharmony_ci * We don't put them on the stack since they're large.
808c2ecf20Sopenharmony_ci */
818c2ecf20Sopenharmony_cistruct xfs_da_state *
828c2ecf20Sopenharmony_cixfs_da_state_alloc(
838c2ecf20Sopenharmony_ci	struct xfs_da_args	*args)
848c2ecf20Sopenharmony_ci{
858c2ecf20Sopenharmony_ci	struct xfs_da_state	*state;
868c2ecf20Sopenharmony_ci
878c2ecf20Sopenharmony_ci	state = kmem_cache_zalloc(xfs_da_state_zone, GFP_NOFS | __GFP_NOFAIL);
888c2ecf20Sopenharmony_ci	state->args = args;
898c2ecf20Sopenharmony_ci	state->mp = args->dp->i_mount;
908c2ecf20Sopenharmony_ci	return state;
918c2ecf20Sopenharmony_ci}
928c2ecf20Sopenharmony_ci
938c2ecf20Sopenharmony_ci/*
948c2ecf20Sopenharmony_ci * Kill the altpath contents of a da-state structure.
958c2ecf20Sopenharmony_ci */
968c2ecf20Sopenharmony_ciSTATIC void
978c2ecf20Sopenharmony_cixfs_da_state_kill_altpath(xfs_da_state_t *state)
988c2ecf20Sopenharmony_ci{
998c2ecf20Sopenharmony_ci	int	i;
1008c2ecf20Sopenharmony_ci
1018c2ecf20Sopenharmony_ci	for (i = 0; i < state->altpath.active; i++)
1028c2ecf20Sopenharmony_ci		state->altpath.blk[i].bp = NULL;
1038c2ecf20Sopenharmony_ci	state->altpath.active = 0;
1048c2ecf20Sopenharmony_ci}
1058c2ecf20Sopenharmony_ci
1068c2ecf20Sopenharmony_ci/*
1078c2ecf20Sopenharmony_ci * Free a da-state structure.
1088c2ecf20Sopenharmony_ci */
1098c2ecf20Sopenharmony_civoid
1108c2ecf20Sopenharmony_cixfs_da_state_free(xfs_da_state_t *state)
1118c2ecf20Sopenharmony_ci{
1128c2ecf20Sopenharmony_ci	xfs_da_state_kill_altpath(state);
1138c2ecf20Sopenharmony_ci#ifdef DEBUG
1148c2ecf20Sopenharmony_ci	memset((char *)state, 0, sizeof(*state));
1158c2ecf20Sopenharmony_ci#endif /* DEBUG */
1168c2ecf20Sopenharmony_ci	kmem_cache_free(xfs_da_state_zone, state);
1178c2ecf20Sopenharmony_ci}
1188c2ecf20Sopenharmony_ci
1198c2ecf20Sopenharmony_cistatic inline int xfs_dabuf_nfsb(struct xfs_mount *mp, int whichfork)
1208c2ecf20Sopenharmony_ci{
1218c2ecf20Sopenharmony_ci	if (whichfork == XFS_DATA_FORK)
1228c2ecf20Sopenharmony_ci		return mp->m_dir_geo->fsbcount;
1238c2ecf20Sopenharmony_ci	return mp->m_attr_geo->fsbcount;
1248c2ecf20Sopenharmony_ci}
1258c2ecf20Sopenharmony_ci
1268c2ecf20Sopenharmony_civoid
1278c2ecf20Sopenharmony_cixfs_da3_node_hdr_from_disk(
1288c2ecf20Sopenharmony_ci	struct xfs_mount		*mp,
1298c2ecf20Sopenharmony_ci	struct xfs_da3_icnode_hdr	*to,
1308c2ecf20Sopenharmony_ci	struct xfs_da_intnode		*from)
1318c2ecf20Sopenharmony_ci{
1328c2ecf20Sopenharmony_ci	if (xfs_sb_version_hascrc(&mp->m_sb)) {
1338c2ecf20Sopenharmony_ci		struct xfs_da3_intnode	*from3 = (struct xfs_da3_intnode *)from;
1348c2ecf20Sopenharmony_ci
1358c2ecf20Sopenharmony_ci		to->forw = be32_to_cpu(from3->hdr.info.hdr.forw);
1368c2ecf20Sopenharmony_ci		to->back = be32_to_cpu(from3->hdr.info.hdr.back);
1378c2ecf20Sopenharmony_ci		to->magic = be16_to_cpu(from3->hdr.info.hdr.magic);
1388c2ecf20Sopenharmony_ci		to->count = be16_to_cpu(from3->hdr.__count);
1398c2ecf20Sopenharmony_ci		to->level = be16_to_cpu(from3->hdr.__level);
1408c2ecf20Sopenharmony_ci		to->btree = from3->__btree;
1418c2ecf20Sopenharmony_ci		ASSERT(to->magic == XFS_DA3_NODE_MAGIC);
1428c2ecf20Sopenharmony_ci	} else {
1438c2ecf20Sopenharmony_ci		to->forw = be32_to_cpu(from->hdr.info.forw);
1448c2ecf20Sopenharmony_ci		to->back = be32_to_cpu(from->hdr.info.back);
1458c2ecf20Sopenharmony_ci		to->magic = be16_to_cpu(from->hdr.info.magic);
1468c2ecf20Sopenharmony_ci		to->count = be16_to_cpu(from->hdr.__count);
1478c2ecf20Sopenharmony_ci		to->level = be16_to_cpu(from->hdr.__level);
1488c2ecf20Sopenharmony_ci		to->btree = from->__btree;
1498c2ecf20Sopenharmony_ci		ASSERT(to->magic == XFS_DA_NODE_MAGIC);
1508c2ecf20Sopenharmony_ci	}
1518c2ecf20Sopenharmony_ci}
1528c2ecf20Sopenharmony_ci
1538c2ecf20Sopenharmony_civoid
1548c2ecf20Sopenharmony_cixfs_da3_node_hdr_to_disk(
1558c2ecf20Sopenharmony_ci	struct xfs_mount		*mp,
1568c2ecf20Sopenharmony_ci	struct xfs_da_intnode		*to,
1578c2ecf20Sopenharmony_ci	struct xfs_da3_icnode_hdr	*from)
1588c2ecf20Sopenharmony_ci{
1598c2ecf20Sopenharmony_ci	if (xfs_sb_version_hascrc(&mp->m_sb)) {
1608c2ecf20Sopenharmony_ci		struct xfs_da3_intnode	*to3 = (struct xfs_da3_intnode *)to;
1618c2ecf20Sopenharmony_ci
1628c2ecf20Sopenharmony_ci		ASSERT(from->magic == XFS_DA3_NODE_MAGIC);
1638c2ecf20Sopenharmony_ci		to3->hdr.info.hdr.forw = cpu_to_be32(from->forw);
1648c2ecf20Sopenharmony_ci		to3->hdr.info.hdr.back = cpu_to_be32(from->back);
1658c2ecf20Sopenharmony_ci		to3->hdr.info.hdr.magic = cpu_to_be16(from->magic);
1668c2ecf20Sopenharmony_ci		to3->hdr.__count = cpu_to_be16(from->count);
1678c2ecf20Sopenharmony_ci		to3->hdr.__level = cpu_to_be16(from->level);
1688c2ecf20Sopenharmony_ci	} else {
1698c2ecf20Sopenharmony_ci		ASSERT(from->magic == XFS_DA_NODE_MAGIC);
1708c2ecf20Sopenharmony_ci		to->hdr.info.forw = cpu_to_be32(from->forw);
1718c2ecf20Sopenharmony_ci		to->hdr.info.back = cpu_to_be32(from->back);
1728c2ecf20Sopenharmony_ci		to->hdr.info.magic = cpu_to_be16(from->magic);
1738c2ecf20Sopenharmony_ci		to->hdr.__count = cpu_to_be16(from->count);
1748c2ecf20Sopenharmony_ci		to->hdr.__level = cpu_to_be16(from->level);
1758c2ecf20Sopenharmony_ci	}
1768c2ecf20Sopenharmony_ci}
1778c2ecf20Sopenharmony_ci
1788c2ecf20Sopenharmony_ci/*
1798c2ecf20Sopenharmony_ci * Verify an xfs_da3_blkinfo structure. Note that the da3 fields are only
1808c2ecf20Sopenharmony_ci * accessible on v5 filesystems. This header format is common across da node,
1818c2ecf20Sopenharmony_ci * attr leaf and dir leaf blocks.
1828c2ecf20Sopenharmony_ci */
1838c2ecf20Sopenharmony_cixfs_failaddr_t
1848c2ecf20Sopenharmony_cixfs_da3_blkinfo_verify(
1858c2ecf20Sopenharmony_ci	struct xfs_buf		*bp,
1868c2ecf20Sopenharmony_ci	struct xfs_da3_blkinfo	*hdr3)
1878c2ecf20Sopenharmony_ci{
1888c2ecf20Sopenharmony_ci	struct xfs_mount	*mp = bp->b_mount;
1898c2ecf20Sopenharmony_ci	struct xfs_da_blkinfo	*hdr = &hdr3->hdr;
1908c2ecf20Sopenharmony_ci
1918c2ecf20Sopenharmony_ci	if (!xfs_verify_magic16(bp, hdr->magic))
1928c2ecf20Sopenharmony_ci		return __this_address;
1938c2ecf20Sopenharmony_ci
1948c2ecf20Sopenharmony_ci	if (xfs_sb_version_hascrc(&mp->m_sb)) {
1958c2ecf20Sopenharmony_ci		if (!uuid_equal(&hdr3->uuid, &mp->m_sb.sb_meta_uuid))
1968c2ecf20Sopenharmony_ci			return __this_address;
1978c2ecf20Sopenharmony_ci		if (be64_to_cpu(hdr3->blkno) != bp->b_bn)
1988c2ecf20Sopenharmony_ci			return __this_address;
1998c2ecf20Sopenharmony_ci		if (!xfs_log_check_lsn(mp, be64_to_cpu(hdr3->lsn)))
2008c2ecf20Sopenharmony_ci			return __this_address;
2018c2ecf20Sopenharmony_ci	}
2028c2ecf20Sopenharmony_ci
2038c2ecf20Sopenharmony_ci	return NULL;
2048c2ecf20Sopenharmony_ci}
2058c2ecf20Sopenharmony_ci
2068c2ecf20Sopenharmony_cistatic xfs_failaddr_t
2078c2ecf20Sopenharmony_cixfs_da3_node_verify(
2088c2ecf20Sopenharmony_ci	struct xfs_buf		*bp)
2098c2ecf20Sopenharmony_ci{
2108c2ecf20Sopenharmony_ci	struct xfs_mount	*mp = bp->b_mount;
2118c2ecf20Sopenharmony_ci	struct xfs_da_intnode	*hdr = bp->b_addr;
2128c2ecf20Sopenharmony_ci	struct xfs_da3_icnode_hdr ichdr;
2138c2ecf20Sopenharmony_ci	xfs_failaddr_t		fa;
2148c2ecf20Sopenharmony_ci
2158c2ecf20Sopenharmony_ci	xfs_da3_node_hdr_from_disk(mp, &ichdr, hdr);
2168c2ecf20Sopenharmony_ci
2178c2ecf20Sopenharmony_ci	fa = xfs_da3_blkinfo_verify(bp, bp->b_addr);
2188c2ecf20Sopenharmony_ci	if (fa)
2198c2ecf20Sopenharmony_ci		return fa;
2208c2ecf20Sopenharmony_ci
2218c2ecf20Sopenharmony_ci	if (ichdr.level == 0)
2228c2ecf20Sopenharmony_ci		return __this_address;
2238c2ecf20Sopenharmony_ci	if (ichdr.level > XFS_DA_NODE_MAXDEPTH)
2248c2ecf20Sopenharmony_ci		return __this_address;
2258c2ecf20Sopenharmony_ci	if (ichdr.count == 0)
2268c2ecf20Sopenharmony_ci		return __this_address;
2278c2ecf20Sopenharmony_ci
2288c2ecf20Sopenharmony_ci	/*
2298c2ecf20Sopenharmony_ci	 * we don't know if the node is for and attribute or directory tree,
2308c2ecf20Sopenharmony_ci	 * so only fail if the count is outside both bounds
2318c2ecf20Sopenharmony_ci	 */
2328c2ecf20Sopenharmony_ci	if (ichdr.count > mp->m_dir_geo->node_ents &&
2338c2ecf20Sopenharmony_ci	    ichdr.count > mp->m_attr_geo->node_ents)
2348c2ecf20Sopenharmony_ci		return __this_address;
2358c2ecf20Sopenharmony_ci
2368c2ecf20Sopenharmony_ci	/* XXX: hash order check? */
2378c2ecf20Sopenharmony_ci
2388c2ecf20Sopenharmony_ci	return NULL;
2398c2ecf20Sopenharmony_ci}
2408c2ecf20Sopenharmony_ci
2418c2ecf20Sopenharmony_cistatic void
2428c2ecf20Sopenharmony_cixfs_da3_node_write_verify(
2438c2ecf20Sopenharmony_ci	struct xfs_buf	*bp)
2448c2ecf20Sopenharmony_ci{
2458c2ecf20Sopenharmony_ci	struct xfs_mount	*mp = bp->b_mount;
2468c2ecf20Sopenharmony_ci	struct xfs_buf_log_item	*bip = bp->b_log_item;
2478c2ecf20Sopenharmony_ci	struct xfs_da3_node_hdr *hdr3 = bp->b_addr;
2488c2ecf20Sopenharmony_ci	xfs_failaddr_t		fa;
2498c2ecf20Sopenharmony_ci
2508c2ecf20Sopenharmony_ci	fa = xfs_da3_node_verify(bp);
2518c2ecf20Sopenharmony_ci	if (fa) {
2528c2ecf20Sopenharmony_ci		xfs_verifier_error(bp, -EFSCORRUPTED, fa);
2538c2ecf20Sopenharmony_ci		return;
2548c2ecf20Sopenharmony_ci	}
2558c2ecf20Sopenharmony_ci
2568c2ecf20Sopenharmony_ci	if (!xfs_sb_version_hascrc(&mp->m_sb))
2578c2ecf20Sopenharmony_ci		return;
2588c2ecf20Sopenharmony_ci
2598c2ecf20Sopenharmony_ci	if (bip)
2608c2ecf20Sopenharmony_ci		hdr3->info.lsn = cpu_to_be64(bip->bli_item.li_lsn);
2618c2ecf20Sopenharmony_ci
2628c2ecf20Sopenharmony_ci	xfs_buf_update_cksum(bp, XFS_DA3_NODE_CRC_OFF);
2638c2ecf20Sopenharmony_ci}
2648c2ecf20Sopenharmony_ci
2658c2ecf20Sopenharmony_ci/*
2668c2ecf20Sopenharmony_ci * leaf/node format detection on trees is sketchy, so a node read can be done on
2678c2ecf20Sopenharmony_ci * leaf level blocks when detection identifies the tree as a node format tree
2688c2ecf20Sopenharmony_ci * incorrectly. In this case, we need to swap the verifier to match the correct
2698c2ecf20Sopenharmony_ci * format of the block being read.
2708c2ecf20Sopenharmony_ci */
2718c2ecf20Sopenharmony_cistatic void
2728c2ecf20Sopenharmony_cixfs_da3_node_read_verify(
2738c2ecf20Sopenharmony_ci	struct xfs_buf		*bp)
2748c2ecf20Sopenharmony_ci{
2758c2ecf20Sopenharmony_ci	struct xfs_da_blkinfo	*info = bp->b_addr;
2768c2ecf20Sopenharmony_ci	xfs_failaddr_t		fa;
2778c2ecf20Sopenharmony_ci
2788c2ecf20Sopenharmony_ci	switch (be16_to_cpu(info->magic)) {
2798c2ecf20Sopenharmony_ci		case XFS_DA3_NODE_MAGIC:
2808c2ecf20Sopenharmony_ci			if (!xfs_buf_verify_cksum(bp, XFS_DA3_NODE_CRC_OFF)) {
2818c2ecf20Sopenharmony_ci				xfs_verifier_error(bp, -EFSBADCRC,
2828c2ecf20Sopenharmony_ci						__this_address);
2838c2ecf20Sopenharmony_ci				break;
2848c2ecf20Sopenharmony_ci			}
2858c2ecf20Sopenharmony_ci			/* fall through */
2868c2ecf20Sopenharmony_ci		case XFS_DA_NODE_MAGIC:
2878c2ecf20Sopenharmony_ci			fa = xfs_da3_node_verify(bp);
2888c2ecf20Sopenharmony_ci			if (fa)
2898c2ecf20Sopenharmony_ci				xfs_verifier_error(bp, -EFSCORRUPTED, fa);
2908c2ecf20Sopenharmony_ci			return;
2918c2ecf20Sopenharmony_ci		case XFS_ATTR_LEAF_MAGIC:
2928c2ecf20Sopenharmony_ci		case XFS_ATTR3_LEAF_MAGIC:
2938c2ecf20Sopenharmony_ci			bp->b_ops = &xfs_attr3_leaf_buf_ops;
2948c2ecf20Sopenharmony_ci			bp->b_ops->verify_read(bp);
2958c2ecf20Sopenharmony_ci			return;
2968c2ecf20Sopenharmony_ci		case XFS_DIR2_LEAFN_MAGIC:
2978c2ecf20Sopenharmony_ci		case XFS_DIR3_LEAFN_MAGIC:
2988c2ecf20Sopenharmony_ci			bp->b_ops = &xfs_dir3_leafn_buf_ops;
2998c2ecf20Sopenharmony_ci			bp->b_ops->verify_read(bp);
3008c2ecf20Sopenharmony_ci			return;
3018c2ecf20Sopenharmony_ci		default:
3028c2ecf20Sopenharmony_ci			xfs_verifier_error(bp, -EFSCORRUPTED, __this_address);
3038c2ecf20Sopenharmony_ci			break;
3048c2ecf20Sopenharmony_ci	}
3058c2ecf20Sopenharmony_ci}
3068c2ecf20Sopenharmony_ci
3078c2ecf20Sopenharmony_ci/* Verify the structure of a da3 block. */
3088c2ecf20Sopenharmony_cistatic xfs_failaddr_t
3098c2ecf20Sopenharmony_cixfs_da3_node_verify_struct(
3108c2ecf20Sopenharmony_ci	struct xfs_buf		*bp)
3118c2ecf20Sopenharmony_ci{
3128c2ecf20Sopenharmony_ci	struct xfs_da_blkinfo	*info = bp->b_addr;
3138c2ecf20Sopenharmony_ci
3148c2ecf20Sopenharmony_ci	switch (be16_to_cpu(info->magic)) {
3158c2ecf20Sopenharmony_ci	case XFS_DA3_NODE_MAGIC:
3168c2ecf20Sopenharmony_ci	case XFS_DA_NODE_MAGIC:
3178c2ecf20Sopenharmony_ci		return xfs_da3_node_verify(bp);
3188c2ecf20Sopenharmony_ci	case XFS_ATTR_LEAF_MAGIC:
3198c2ecf20Sopenharmony_ci	case XFS_ATTR3_LEAF_MAGIC:
3208c2ecf20Sopenharmony_ci		bp->b_ops = &xfs_attr3_leaf_buf_ops;
3218c2ecf20Sopenharmony_ci		return bp->b_ops->verify_struct(bp);
3228c2ecf20Sopenharmony_ci	case XFS_DIR2_LEAFN_MAGIC:
3238c2ecf20Sopenharmony_ci	case XFS_DIR3_LEAFN_MAGIC:
3248c2ecf20Sopenharmony_ci		bp->b_ops = &xfs_dir3_leafn_buf_ops;
3258c2ecf20Sopenharmony_ci		return bp->b_ops->verify_struct(bp);
3268c2ecf20Sopenharmony_ci	default:
3278c2ecf20Sopenharmony_ci		return __this_address;
3288c2ecf20Sopenharmony_ci	}
3298c2ecf20Sopenharmony_ci}
3308c2ecf20Sopenharmony_ci
3318c2ecf20Sopenharmony_ciconst struct xfs_buf_ops xfs_da3_node_buf_ops = {
3328c2ecf20Sopenharmony_ci	.name = "xfs_da3_node",
3338c2ecf20Sopenharmony_ci	.magic16 = { cpu_to_be16(XFS_DA_NODE_MAGIC),
3348c2ecf20Sopenharmony_ci		     cpu_to_be16(XFS_DA3_NODE_MAGIC) },
3358c2ecf20Sopenharmony_ci	.verify_read = xfs_da3_node_read_verify,
3368c2ecf20Sopenharmony_ci	.verify_write = xfs_da3_node_write_verify,
3378c2ecf20Sopenharmony_ci	.verify_struct = xfs_da3_node_verify_struct,
3388c2ecf20Sopenharmony_ci};
3398c2ecf20Sopenharmony_ci
3408c2ecf20Sopenharmony_cistatic int
3418c2ecf20Sopenharmony_cixfs_da3_node_set_type(
3428c2ecf20Sopenharmony_ci	struct xfs_trans	*tp,
3438c2ecf20Sopenharmony_ci	struct xfs_buf		*bp)
3448c2ecf20Sopenharmony_ci{
3458c2ecf20Sopenharmony_ci	struct xfs_da_blkinfo	*info = bp->b_addr;
3468c2ecf20Sopenharmony_ci
3478c2ecf20Sopenharmony_ci	switch (be16_to_cpu(info->magic)) {
3488c2ecf20Sopenharmony_ci	case XFS_DA_NODE_MAGIC:
3498c2ecf20Sopenharmony_ci	case XFS_DA3_NODE_MAGIC:
3508c2ecf20Sopenharmony_ci		xfs_trans_buf_set_type(tp, bp, XFS_BLFT_DA_NODE_BUF);
3518c2ecf20Sopenharmony_ci		return 0;
3528c2ecf20Sopenharmony_ci	case XFS_ATTR_LEAF_MAGIC:
3538c2ecf20Sopenharmony_ci	case XFS_ATTR3_LEAF_MAGIC:
3548c2ecf20Sopenharmony_ci		xfs_trans_buf_set_type(tp, bp, XFS_BLFT_ATTR_LEAF_BUF);
3558c2ecf20Sopenharmony_ci		return 0;
3568c2ecf20Sopenharmony_ci	case XFS_DIR2_LEAFN_MAGIC:
3578c2ecf20Sopenharmony_ci	case XFS_DIR3_LEAFN_MAGIC:
3588c2ecf20Sopenharmony_ci		xfs_trans_buf_set_type(tp, bp, XFS_BLFT_DIR_LEAFN_BUF);
3598c2ecf20Sopenharmony_ci		return 0;
3608c2ecf20Sopenharmony_ci	default:
3618c2ecf20Sopenharmony_ci		XFS_CORRUPTION_ERROR(__func__, XFS_ERRLEVEL_LOW, tp->t_mountp,
3628c2ecf20Sopenharmony_ci				info, sizeof(*info));
3638c2ecf20Sopenharmony_ci		xfs_trans_brelse(tp, bp);
3648c2ecf20Sopenharmony_ci		return -EFSCORRUPTED;
3658c2ecf20Sopenharmony_ci	}
3668c2ecf20Sopenharmony_ci}
3678c2ecf20Sopenharmony_ci
3688c2ecf20Sopenharmony_ciint
3698c2ecf20Sopenharmony_cixfs_da3_node_read(
3708c2ecf20Sopenharmony_ci	struct xfs_trans	*tp,
3718c2ecf20Sopenharmony_ci	struct xfs_inode	*dp,
3728c2ecf20Sopenharmony_ci	xfs_dablk_t		bno,
3738c2ecf20Sopenharmony_ci	struct xfs_buf		**bpp,
3748c2ecf20Sopenharmony_ci	int			whichfork)
3758c2ecf20Sopenharmony_ci{
3768c2ecf20Sopenharmony_ci	int			error;
3778c2ecf20Sopenharmony_ci
3788c2ecf20Sopenharmony_ci	error = xfs_da_read_buf(tp, dp, bno, 0, bpp, whichfork,
3798c2ecf20Sopenharmony_ci			&xfs_da3_node_buf_ops);
3808c2ecf20Sopenharmony_ci	if (error || !*bpp || !tp)
3818c2ecf20Sopenharmony_ci		return error;
3828c2ecf20Sopenharmony_ci	return xfs_da3_node_set_type(tp, *bpp);
3838c2ecf20Sopenharmony_ci}
3848c2ecf20Sopenharmony_ci
3858c2ecf20Sopenharmony_ciint
3868c2ecf20Sopenharmony_cixfs_da3_node_read_mapped(
3878c2ecf20Sopenharmony_ci	struct xfs_trans	*tp,
3888c2ecf20Sopenharmony_ci	struct xfs_inode	*dp,
3898c2ecf20Sopenharmony_ci	xfs_daddr_t		mappedbno,
3908c2ecf20Sopenharmony_ci	struct xfs_buf		**bpp,
3918c2ecf20Sopenharmony_ci	int			whichfork)
3928c2ecf20Sopenharmony_ci{
3938c2ecf20Sopenharmony_ci	struct xfs_mount	*mp = dp->i_mount;
3948c2ecf20Sopenharmony_ci	int			error;
3958c2ecf20Sopenharmony_ci
3968c2ecf20Sopenharmony_ci	error = xfs_trans_read_buf(mp, tp, mp->m_ddev_targp, mappedbno,
3978c2ecf20Sopenharmony_ci			XFS_FSB_TO_BB(mp, xfs_dabuf_nfsb(mp, whichfork)), 0,
3988c2ecf20Sopenharmony_ci			bpp, &xfs_da3_node_buf_ops);
3998c2ecf20Sopenharmony_ci	if (error || !*bpp)
4008c2ecf20Sopenharmony_ci		return error;
4018c2ecf20Sopenharmony_ci
4028c2ecf20Sopenharmony_ci	if (whichfork == XFS_ATTR_FORK)
4038c2ecf20Sopenharmony_ci		xfs_buf_set_ref(*bpp, XFS_ATTR_BTREE_REF);
4048c2ecf20Sopenharmony_ci	else
4058c2ecf20Sopenharmony_ci		xfs_buf_set_ref(*bpp, XFS_DIR_BTREE_REF);
4068c2ecf20Sopenharmony_ci
4078c2ecf20Sopenharmony_ci	if (!tp)
4088c2ecf20Sopenharmony_ci		return 0;
4098c2ecf20Sopenharmony_ci	return xfs_da3_node_set_type(tp, *bpp);
4108c2ecf20Sopenharmony_ci}
4118c2ecf20Sopenharmony_ci
4128c2ecf20Sopenharmony_ci/*========================================================================
4138c2ecf20Sopenharmony_ci * Routines used for growing the Btree.
4148c2ecf20Sopenharmony_ci *========================================================================*/
4158c2ecf20Sopenharmony_ci
4168c2ecf20Sopenharmony_ci/*
4178c2ecf20Sopenharmony_ci * Create the initial contents of an intermediate node.
4188c2ecf20Sopenharmony_ci */
4198c2ecf20Sopenharmony_ciint
4208c2ecf20Sopenharmony_cixfs_da3_node_create(
4218c2ecf20Sopenharmony_ci	struct xfs_da_args	*args,
4228c2ecf20Sopenharmony_ci	xfs_dablk_t		blkno,
4238c2ecf20Sopenharmony_ci	int			level,
4248c2ecf20Sopenharmony_ci	struct xfs_buf		**bpp,
4258c2ecf20Sopenharmony_ci	int			whichfork)
4268c2ecf20Sopenharmony_ci{
4278c2ecf20Sopenharmony_ci	struct xfs_da_intnode	*node;
4288c2ecf20Sopenharmony_ci	struct xfs_trans	*tp = args->trans;
4298c2ecf20Sopenharmony_ci	struct xfs_mount	*mp = tp->t_mountp;
4308c2ecf20Sopenharmony_ci	struct xfs_da3_icnode_hdr ichdr = {0};
4318c2ecf20Sopenharmony_ci	struct xfs_buf		*bp;
4328c2ecf20Sopenharmony_ci	int			error;
4338c2ecf20Sopenharmony_ci	struct xfs_inode	*dp = args->dp;
4348c2ecf20Sopenharmony_ci
4358c2ecf20Sopenharmony_ci	trace_xfs_da_node_create(args);
4368c2ecf20Sopenharmony_ci	ASSERT(level <= XFS_DA_NODE_MAXDEPTH);
4378c2ecf20Sopenharmony_ci
4388c2ecf20Sopenharmony_ci	error = xfs_da_get_buf(tp, dp, blkno, &bp, whichfork);
4398c2ecf20Sopenharmony_ci	if (error)
4408c2ecf20Sopenharmony_ci		return error;
4418c2ecf20Sopenharmony_ci	bp->b_ops = &xfs_da3_node_buf_ops;
4428c2ecf20Sopenharmony_ci	xfs_trans_buf_set_type(tp, bp, XFS_BLFT_DA_NODE_BUF);
4438c2ecf20Sopenharmony_ci	node = bp->b_addr;
4448c2ecf20Sopenharmony_ci
4458c2ecf20Sopenharmony_ci	if (xfs_sb_version_hascrc(&mp->m_sb)) {
4468c2ecf20Sopenharmony_ci		struct xfs_da3_node_hdr *hdr3 = bp->b_addr;
4478c2ecf20Sopenharmony_ci
4488c2ecf20Sopenharmony_ci		memset(hdr3, 0, sizeof(struct xfs_da3_node_hdr));
4498c2ecf20Sopenharmony_ci		ichdr.magic = XFS_DA3_NODE_MAGIC;
4508c2ecf20Sopenharmony_ci		hdr3->info.blkno = cpu_to_be64(bp->b_bn);
4518c2ecf20Sopenharmony_ci		hdr3->info.owner = cpu_to_be64(args->dp->i_ino);
4528c2ecf20Sopenharmony_ci		uuid_copy(&hdr3->info.uuid, &mp->m_sb.sb_meta_uuid);
4538c2ecf20Sopenharmony_ci	} else {
4548c2ecf20Sopenharmony_ci		ichdr.magic = XFS_DA_NODE_MAGIC;
4558c2ecf20Sopenharmony_ci	}
4568c2ecf20Sopenharmony_ci	ichdr.level = level;
4578c2ecf20Sopenharmony_ci
4588c2ecf20Sopenharmony_ci	xfs_da3_node_hdr_to_disk(dp->i_mount, node, &ichdr);
4598c2ecf20Sopenharmony_ci	xfs_trans_log_buf(tp, bp,
4608c2ecf20Sopenharmony_ci		XFS_DA_LOGRANGE(node, &node->hdr, args->geo->node_hdr_size));
4618c2ecf20Sopenharmony_ci
4628c2ecf20Sopenharmony_ci	*bpp = bp;
4638c2ecf20Sopenharmony_ci	return 0;
4648c2ecf20Sopenharmony_ci}
4658c2ecf20Sopenharmony_ci
4668c2ecf20Sopenharmony_ci/*
4678c2ecf20Sopenharmony_ci * Split a leaf node, rebalance, then possibly split
4688c2ecf20Sopenharmony_ci * intermediate nodes, rebalance, etc.
4698c2ecf20Sopenharmony_ci */
4708c2ecf20Sopenharmony_ciint							/* error */
4718c2ecf20Sopenharmony_cixfs_da3_split(
4728c2ecf20Sopenharmony_ci	struct xfs_da_state	*state)
4738c2ecf20Sopenharmony_ci{
4748c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*oldblk;
4758c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*newblk;
4768c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*addblk;
4778c2ecf20Sopenharmony_ci	struct xfs_da_intnode	*node;
4788c2ecf20Sopenharmony_ci	int			max;
4798c2ecf20Sopenharmony_ci	int			action = 0;
4808c2ecf20Sopenharmony_ci	int			error;
4818c2ecf20Sopenharmony_ci	int			i;
4828c2ecf20Sopenharmony_ci
4838c2ecf20Sopenharmony_ci	trace_xfs_da_split(state->args);
4848c2ecf20Sopenharmony_ci
4858c2ecf20Sopenharmony_ci	/*
4868c2ecf20Sopenharmony_ci	 * Walk back up the tree splitting/inserting/adjusting as necessary.
4878c2ecf20Sopenharmony_ci	 * If we need to insert and there isn't room, split the node, then
4888c2ecf20Sopenharmony_ci	 * decide which fragment to insert the new block from below into.
4898c2ecf20Sopenharmony_ci	 * Note that we may split the root this way, but we need more fixup.
4908c2ecf20Sopenharmony_ci	 */
4918c2ecf20Sopenharmony_ci	max = state->path.active - 1;
4928c2ecf20Sopenharmony_ci	ASSERT((max >= 0) && (max < XFS_DA_NODE_MAXDEPTH));
4938c2ecf20Sopenharmony_ci	ASSERT(state->path.blk[max].magic == XFS_ATTR_LEAF_MAGIC ||
4948c2ecf20Sopenharmony_ci	       state->path.blk[max].magic == XFS_DIR2_LEAFN_MAGIC);
4958c2ecf20Sopenharmony_ci
4968c2ecf20Sopenharmony_ci	addblk = &state->path.blk[max];		/* initial dummy value */
4978c2ecf20Sopenharmony_ci	for (i = max; (i >= 0) && addblk; state->path.active--, i--) {
4988c2ecf20Sopenharmony_ci		oldblk = &state->path.blk[i];
4998c2ecf20Sopenharmony_ci		newblk = &state->altpath.blk[i];
5008c2ecf20Sopenharmony_ci
5018c2ecf20Sopenharmony_ci		/*
5028c2ecf20Sopenharmony_ci		 * If a leaf node then
5038c2ecf20Sopenharmony_ci		 *     Allocate a new leaf node, then rebalance across them.
5048c2ecf20Sopenharmony_ci		 * else if an intermediate node then
5058c2ecf20Sopenharmony_ci		 *     We split on the last layer, must we split the node?
5068c2ecf20Sopenharmony_ci		 */
5078c2ecf20Sopenharmony_ci		switch (oldblk->magic) {
5088c2ecf20Sopenharmony_ci		case XFS_ATTR_LEAF_MAGIC:
5098c2ecf20Sopenharmony_ci			error = xfs_attr3_leaf_split(state, oldblk, newblk);
5108c2ecf20Sopenharmony_ci			if ((error != 0) && (error != -ENOSPC)) {
5118c2ecf20Sopenharmony_ci				return error;	/* GROT: attr is inconsistent */
5128c2ecf20Sopenharmony_ci			}
5138c2ecf20Sopenharmony_ci			if (!error) {
5148c2ecf20Sopenharmony_ci				addblk = newblk;
5158c2ecf20Sopenharmony_ci				break;
5168c2ecf20Sopenharmony_ci			}
5178c2ecf20Sopenharmony_ci			/*
5188c2ecf20Sopenharmony_ci			 * Entry wouldn't fit, split the leaf again. The new
5198c2ecf20Sopenharmony_ci			 * extrablk will be consumed by xfs_da3_node_split if
5208c2ecf20Sopenharmony_ci			 * the node is split.
5218c2ecf20Sopenharmony_ci			 */
5228c2ecf20Sopenharmony_ci			state->extravalid = 1;
5238c2ecf20Sopenharmony_ci			if (state->inleaf) {
5248c2ecf20Sopenharmony_ci				state->extraafter = 0;	/* before newblk */
5258c2ecf20Sopenharmony_ci				trace_xfs_attr_leaf_split_before(state->args);
5268c2ecf20Sopenharmony_ci				error = xfs_attr3_leaf_split(state, oldblk,
5278c2ecf20Sopenharmony_ci							    &state->extrablk);
5288c2ecf20Sopenharmony_ci			} else {
5298c2ecf20Sopenharmony_ci				state->extraafter = 1;	/* after newblk */
5308c2ecf20Sopenharmony_ci				trace_xfs_attr_leaf_split_after(state->args);
5318c2ecf20Sopenharmony_ci				error = xfs_attr3_leaf_split(state, newblk,
5328c2ecf20Sopenharmony_ci							    &state->extrablk);
5338c2ecf20Sopenharmony_ci			}
5348c2ecf20Sopenharmony_ci			if (error)
5358c2ecf20Sopenharmony_ci				return error;	/* GROT: attr inconsistent */
5368c2ecf20Sopenharmony_ci			addblk = newblk;
5378c2ecf20Sopenharmony_ci			break;
5388c2ecf20Sopenharmony_ci		case XFS_DIR2_LEAFN_MAGIC:
5398c2ecf20Sopenharmony_ci			error = xfs_dir2_leafn_split(state, oldblk, newblk);
5408c2ecf20Sopenharmony_ci			if (error)
5418c2ecf20Sopenharmony_ci				return error;
5428c2ecf20Sopenharmony_ci			addblk = newblk;
5438c2ecf20Sopenharmony_ci			break;
5448c2ecf20Sopenharmony_ci		case XFS_DA_NODE_MAGIC:
5458c2ecf20Sopenharmony_ci			error = xfs_da3_node_split(state, oldblk, newblk, addblk,
5468c2ecf20Sopenharmony_ci							 max - i, &action);
5478c2ecf20Sopenharmony_ci			addblk->bp = NULL;
5488c2ecf20Sopenharmony_ci			if (error)
5498c2ecf20Sopenharmony_ci				return error;	/* GROT: dir is inconsistent */
5508c2ecf20Sopenharmony_ci			/*
5518c2ecf20Sopenharmony_ci			 * Record the newly split block for the next time thru?
5528c2ecf20Sopenharmony_ci			 */
5538c2ecf20Sopenharmony_ci			if (action)
5548c2ecf20Sopenharmony_ci				addblk = newblk;
5558c2ecf20Sopenharmony_ci			else
5568c2ecf20Sopenharmony_ci				addblk = NULL;
5578c2ecf20Sopenharmony_ci			break;
5588c2ecf20Sopenharmony_ci		}
5598c2ecf20Sopenharmony_ci
5608c2ecf20Sopenharmony_ci		/*
5618c2ecf20Sopenharmony_ci		 * Update the btree to show the new hashval for this child.
5628c2ecf20Sopenharmony_ci		 */
5638c2ecf20Sopenharmony_ci		xfs_da3_fixhashpath(state, &state->path);
5648c2ecf20Sopenharmony_ci	}
5658c2ecf20Sopenharmony_ci	if (!addblk)
5668c2ecf20Sopenharmony_ci		return 0;
5678c2ecf20Sopenharmony_ci
5688c2ecf20Sopenharmony_ci	/*
5698c2ecf20Sopenharmony_ci	 * xfs_da3_node_split() should have consumed any extra blocks we added
5708c2ecf20Sopenharmony_ci	 * during a double leaf split in the attr fork. This is guaranteed as
5718c2ecf20Sopenharmony_ci	 * we can't be here if the attr fork only has a single leaf block.
5728c2ecf20Sopenharmony_ci	 */
5738c2ecf20Sopenharmony_ci	ASSERT(state->extravalid == 0 ||
5748c2ecf20Sopenharmony_ci	       state->path.blk[max].magic == XFS_DIR2_LEAFN_MAGIC);
5758c2ecf20Sopenharmony_ci
5768c2ecf20Sopenharmony_ci	/*
5778c2ecf20Sopenharmony_ci	 * Split the root node.
5788c2ecf20Sopenharmony_ci	 */
5798c2ecf20Sopenharmony_ci	ASSERT(state->path.active == 0);
5808c2ecf20Sopenharmony_ci	oldblk = &state->path.blk[0];
5818c2ecf20Sopenharmony_ci	error = xfs_da3_root_split(state, oldblk, addblk);
5828c2ecf20Sopenharmony_ci	if (error)
5838c2ecf20Sopenharmony_ci		goto out;
5848c2ecf20Sopenharmony_ci
5858c2ecf20Sopenharmony_ci	/*
5868c2ecf20Sopenharmony_ci	 * Update pointers to the node which used to be block 0 and just got
5878c2ecf20Sopenharmony_ci	 * bumped because of the addition of a new root node.  Note that the
5888c2ecf20Sopenharmony_ci	 * original block 0 could be at any position in the list of blocks in
5898c2ecf20Sopenharmony_ci	 * the tree.
5908c2ecf20Sopenharmony_ci	 *
5918c2ecf20Sopenharmony_ci	 * Note: the magic numbers and sibling pointers are in the same physical
5928c2ecf20Sopenharmony_ci	 * place for both v2 and v3 headers (by design). Hence it doesn't matter
5938c2ecf20Sopenharmony_ci	 * which version of the xfs_da_intnode structure we use here as the
5948c2ecf20Sopenharmony_ci	 * result will be the same using either structure.
5958c2ecf20Sopenharmony_ci	 */
5968c2ecf20Sopenharmony_ci	node = oldblk->bp->b_addr;
5978c2ecf20Sopenharmony_ci	if (node->hdr.info.forw) {
5988c2ecf20Sopenharmony_ci		if (be32_to_cpu(node->hdr.info.forw) != addblk->blkno) {
5998c2ecf20Sopenharmony_ci			xfs_buf_mark_corrupt(oldblk->bp);
6008c2ecf20Sopenharmony_ci			error = -EFSCORRUPTED;
6018c2ecf20Sopenharmony_ci			goto out;
6028c2ecf20Sopenharmony_ci		}
6038c2ecf20Sopenharmony_ci		node = addblk->bp->b_addr;
6048c2ecf20Sopenharmony_ci		node->hdr.info.back = cpu_to_be32(oldblk->blkno);
6058c2ecf20Sopenharmony_ci		xfs_trans_log_buf(state->args->trans, addblk->bp,
6068c2ecf20Sopenharmony_ci				  XFS_DA_LOGRANGE(node, &node->hdr.info,
6078c2ecf20Sopenharmony_ci				  sizeof(node->hdr.info)));
6088c2ecf20Sopenharmony_ci	}
6098c2ecf20Sopenharmony_ci	node = oldblk->bp->b_addr;
6108c2ecf20Sopenharmony_ci	if (node->hdr.info.back) {
6118c2ecf20Sopenharmony_ci		if (be32_to_cpu(node->hdr.info.back) != addblk->blkno) {
6128c2ecf20Sopenharmony_ci			xfs_buf_mark_corrupt(oldblk->bp);
6138c2ecf20Sopenharmony_ci			error = -EFSCORRUPTED;
6148c2ecf20Sopenharmony_ci			goto out;
6158c2ecf20Sopenharmony_ci		}
6168c2ecf20Sopenharmony_ci		node = addblk->bp->b_addr;
6178c2ecf20Sopenharmony_ci		node->hdr.info.forw = cpu_to_be32(oldblk->blkno);
6188c2ecf20Sopenharmony_ci		xfs_trans_log_buf(state->args->trans, addblk->bp,
6198c2ecf20Sopenharmony_ci				  XFS_DA_LOGRANGE(node, &node->hdr.info,
6208c2ecf20Sopenharmony_ci				  sizeof(node->hdr.info)));
6218c2ecf20Sopenharmony_ci	}
6228c2ecf20Sopenharmony_ciout:
6238c2ecf20Sopenharmony_ci	addblk->bp = NULL;
6248c2ecf20Sopenharmony_ci	return error;
6258c2ecf20Sopenharmony_ci}
6268c2ecf20Sopenharmony_ci
6278c2ecf20Sopenharmony_ci/*
6288c2ecf20Sopenharmony_ci * Split the root.  We have to create a new root and point to the two
6298c2ecf20Sopenharmony_ci * parts (the split old root) that we just created.  Copy block zero to
6308c2ecf20Sopenharmony_ci * the EOF, extending the inode in process.
6318c2ecf20Sopenharmony_ci */
6328c2ecf20Sopenharmony_ciSTATIC int						/* error */
6338c2ecf20Sopenharmony_cixfs_da3_root_split(
6348c2ecf20Sopenharmony_ci	struct xfs_da_state	*state,
6358c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*blk1,
6368c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*blk2)
6378c2ecf20Sopenharmony_ci{
6388c2ecf20Sopenharmony_ci	struct xfs_da_intnode	*node;
6398c2ecf20Sopenharmony_ci	struct xfs_da_intnode	*oldroot;
6408c2ecf20Sopenharmony_ci	struct xfs_da_node_entry *btree;
6418c2ecf20Sopenharmony_ci	struct xfs_da3_icnode_hdr nodehdr;
6428c2ecf20Sopenharmony_ci	struct xfs_da_args	*args;
6438c2ecf20Sopenharmony_ci	struct xfs_buf		*bp;
6448c2ecf20Sopenharmony_ci	struct xfs_inode	*dp;
6458c2ecf20Sopenharmony_ci	struct xfs_trans	*tp;
6468c2ecf20Sopenharmony_ci	struct xfs_dir2_leaf	*leaf;
6478c2ecf20Sopenharmony_ci	xfs_dablk_t		blkno;
6488c2ecf20Sopenharmony_ci	int			level;
6498c2ecf20Sopenharmony_ci	int			error;
6508c2ecf20Sopenharmony_ci	int			size;
6518c2ecf20Sopenharmony_ci
6528c2ecf20Sopenharmony_ci	trace_xfs_da_root_split(state->args);
6538c2ecf20Sopenharmony_ci
6548c2ecf20Sopenharmony_ci	/*
6558c2ecf20Sopenharmony_ci	 * Copy the existing (incorrect) block from the root node position
6568c2ecf20Sopenharmony_ci	 * to a free space somewhere.
6578c2ecf20Sopenharmony_ci	 */
6588c2ecf20Sopenharmony_ci	args = state->args;
6598c2ecf20Sopenharmony_ci	error = xfs_da_grow_inode(args, &blkno);
6608c2ecf20Sopenharmony_ci	if (error)
6618c2ecf20Sopenharmony_ci		return error;
6628c2ecf20Sopenharmony_ci
6638c2ecf20Sopenharmony_ci	dp = args->dp;
6648c2ecf20Sopenharmony_ci	tp = args->trans;
6658c2ecf20Sopenharmony_ci	error = xfs_da_get_buf(tp, dp, blkno, &bp, args->whichfork);
6668c2ecf20Sopenharmony_ci	if (error)
6678c2ecf20Sopenharmony_ci		return error;
6688c2ecf20Sopenharmony_ci	node = bp->b_addr;
6698c2ecf20Sopenharmony_ci	oldroot = blk1->bp->b_addr;
6708c2ecf20Sopenharmony_ci	if (oldroot->hdr.info.magic == cpu_to_be16(XFS_DA_NODE_MAGIC) ||
6718c2ecf20Sopenharmony_ci	    oldroot->hdr.info.magic == cpu_to_be16(XFS_DA3_NODE_MAGIC)) {
6728c2ecf20Sopenharmony_ci		struct xfs_da3_icnode_hdr icnodehdr;
6738c2ecf20Sopenharmony_ci
6748c2ecf20Sopenharmony_ci		xfs_da3_node_hdr_from_disk(dp->i_mount, &icnodehdr, oldroot);
6758c2ecf20Sopenharmony_ci		btree = icnodehdr.btree;
6768c2ecf20Sopenharmony_ci		size = (int)((char *)&btree[icnodehdr.count] - (char *)oldroot);
6778c2ecf20Sopenharmony_ci		level = icnodehdr.level;
6788c2ecf20Sopenharmony_ci
6798c2ecf20Sopenharmony_ci		/*
6808c2ecf20Sopenharmony_ci		 * we are about to copy oldroot to bp, so set up the type
6818c2ecf20Sopenharmony_ci		 * of bp while we know exactly what it will be.
6828c2ecf20Sopenharmony_ci		 */
6838c2ecf20Sopenharmony_ci		xfs_trans_buf_set_type(tp, bp, XFS_BLFT_DA_NODE_BUF);
6848c2ecf20Sopenharmony_ci	} else {
6858c2ecf20Sopenharmony_ci		struct xfs_dir3_icleaf_hdr leafhdr;
6868c2ecf20Sopenharmony_ci
6878c2ecf20Sopenharmony_ci		leaf = (xfs_dir2_leaf_t *)oldroot;
6888c2ecf20Sopenharmony_ci		xfs_dir2_leaf_hdr_from_disk(dp->i_mount, &leafhdr, leaf);
6898c2ecf20Sopenharmony_ci
6908c2ecf20Sopenharmony_ci		ASSERT(leafhdr.magic == XFS_DIR2_LEAFN_MAGIC ||
6918c2ecf20Sopenharmony_ci		       leafhdr.magic == XFS_DIR3_LEAFN_MAGIC);
6928c2ecf20Sopenharmony_ci		size = (int)((char *)&leafhdr.ents[leafhdr.count] -
6938c2ecf20Sopenharmony_ci			(char *)leaf);
6948c2ecf20Sopenharmony_ci		level = 0;
6958c2ecf20Sopenharmony_ci
6968c2ecf20Sopenharmony_ci		/*
6978c2ecf20Sopenharmony_ci		 * we are about to copy oldroot to bp, so set up the type
6988c2ecf20Sopenharmony_ci		 * of bp while we know exactly what it will be.
6998c2ecf20Sopenharmony_ci		 */
7008c2ecf20Sopenharmony_ci		xfs_trans_buf_set_type(tp, bp, XFS_BLFT_DIR_LEAFN_BUF);
7018c2ecf20Sopenharmony_ci	}
7028c2ecf20Sopenharmony_ci
7038c2ecf20Sopenharmony_ci	/*
7048c2ecf20Sopenharmony_ci	 * we can copy most of the information in the node from one block to
7058c2ecf20Sopenharmony_ci	 * another, but for CRC enabled headers we have to make sure that the
7068c2ecf20Sopenharmony_ci	 * block specific identifiers are kept intact. We update the buffer
7078c2ecf20Sopenharmony_ci	 * directly for this.
7088c2ecf20Sopenharmony_ci	 */
7098c2ecf20Sopenharmony_ci	memcpy(node, oldroot, size);
7108c2ecf20Sopenharmony_ci	if (oldroot->hdr.info.magic == cpu_to_be16(XFS_DA3_NODE_MAGIC) ||
7118c2ecf20Sopenharmony_ci	    oldroot->hdr.info.magic == cpu_to_be16(XFS_DIR3_LEAFN_MAGIC)) {
7128c2ecf20Sopenharmony_ci		struct xfs_da3_intnode *node3 = (struct xfs_da3_intnode *)node;
7138c2ecf20Sopenharmony_ci
7148c2ecf20Sopenharmony_ci		node3->hdr.info.blkno = cpu_to_be64(bp->b_bn);
7158c2ecf20Sopenharmony_ci	}
7168c2ecf20Sopenharmony_ci	xfs_trans_log_buf(tp, bp, 0, size - 1);
7178c2ecf20Sopenharmony_ci
7188c2ecf20Sopenharmony_ci	bp->b_ops = blk1->bp->b_ops;
7198c2ecf20Sopenharmony_ci	xfs_trans_buf_copy_type(bp, blk1->bp);
7208c2ecf20Sopenharmony_ci	blk1->bp = bp;
7218c2ecf20Sopenharmony_ci	blk1->blkno = blkno;
7228c2ecf20Sopenharmony_ci
7238c2ecf20Sopenharmony_ci	/*
7248c2ecf20Sopenharmony_ci	 * Set up the new root node.
7258c2ecf20Sopenharmony_ci	 */
7268c2ecf20Sopenharmony_ci	error = xfs_da3_node_create(args,
7278c2ecf20Sopenharmony_ci		(args->whichfork == XFS_DATA_FORK) ? args->geo->leafblk : 0,
7288c2ecf20Sopenharmony_ci		level + 1, &bp, args->whichfork);
7298c2ecf20Sopenharmony_ci	if (error)
7308c2ecf20Sopenharmony_ci		return error;
7318c2ecf20Sopenharmony_ci
7328c2ecf20Sopenharmony_ci	node = bp->b_addr;
7338c2ecf20Sopenharmony_ci	xfs_da3_node_hdr_from_disk(dp->i_mount, &nodehdr, node);
7348c2ecf20Sopenharmony_ci	btree = nodehdr.btree;
7358c2ecf20Sopenharmony_ci	btree[0].hashval = cpu_to_be32(blk1->hashval);
7368c2ecf20Sopenharmony_ci	btree[0].before = cpu_to_be32(blk1->blkno);
7378c2ecf20Sopenharmony_ci	btree[1].hashval = cpu_to_be32(blk2->hashval);
7388c2ecf20Sopenharmony_ci	btree[1].before = cpu_to_be32(blk2->blkno);
7398c2ecf20Sopenharmony_ci	nodehdr.count = 2;
7408c2ecf20Sopenharmony_ci	xfs_da3_node_hdr_to_disk(dp->i_mount, node, &nodehdr);
7418c2ecf20Sopenharmony_ci
7428c2ecf20Sopenharmony_ci#ifdef DEBUG
7438c2ecf20Sopenharmony_ci	if (oldroot->hdr.info.magic == cpu_to_be16(XFS_DIR2_LEAFN_MAGIC) ||
7448c2ecf20Sopenharmony_ci	    oldroot->hdr.info.magic == cpu_to_be16(XFS_DIR3_LEAFN_MAGIC)) {
7458c2ecf20Sopenharmony_ci		ASSERT(blk1->blkno >= args->geo->leafblk &&
7468c2ecf20Sopenharmony_ci		       blk1->blkno < args->geo->freeblk);
7478c2ecf20Sopenharmony_ci		ASSERT(blk2->blkno >= args->geo->leafblk &&
7488c2ecf20Sopenharmony_ci		       blk2->blkno < args->geo->freeblk);
7498c2ecf20Sopenharmony_ci	}
7508c2ecf20Sopenharmony_ci#endif
7518c2ecf20Sopenharmony_ci
7528c2ecf20Sopenharmony_ci	/* Header is already logged by xfs_da_node_create */
7538c2ecf20Sopenharmony_ci	xfs_trans_log_buf(tp, bp,
7548c2ecf20Sopenharmony_ci		XFS_DA_LOGRANGE(node, btree, sizeof(xfs_da_node_entry_t) * 2));
7558c2ecf20Sopenharmony_ci
7568c2ecf20Sopenharmony_ci	return 0;
7578c2ecf20Sopenharmony_ci}
7588c2ecf20Sopenharmony_ci
7598c2ecf20Sopenharmony_ci/*
7608c2ecf20Sopenharmony_ci * Split the node, rebalance, then add the new entry.
7618c2ecf20Sopenharmony_ci */
7628c2ecf20Sopenharmony_ciSTATIC int						/* error */
7638c2ecf20Sopenharmony_cixfs_da3_node_split(
7648c2ecf20Sopenharmony_ci	struct xfs_da_state	*state,
7658c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*oldblk,
7668c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*newblk,
7678c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*addblk,
7688c2ecf20Sopenharmony_ci	int			treelevel,
7698c2ecf20Sopenharmony_ci	int			*result)
7708c2ecf20Sopenharmony_ci{
7718c2ecf20Sopenharmony_ci	struct xfs_da_intnode	*node;
7728c2ecf20Sopenharmony_ci	struct xfs_da3_icnode_hdr nodehdr;
7738c2ecf20Sopenharmony_ci	xfs_dablk_t		blkno;
7748c2ecf20Sopenharmony_ci	int			newcount;
7758c2ecf20Sopenharmony_ci	int			error;
7768c2ecf20Sopenharmony_ci	int			useextra;
7778c2ecf20Sopenharmony_ci	struct xfs_inode	*dp = state->args->dp;
7788c2ecf20Sopenharmony_ci
7798c2ecf20Sopenharmony_ci	trace_xfs_da_node_split(state->args);
7808c2ecf20Sopenharmony_ci
7818c2ecf20Sopenharmony_ci	node = oldblk->bp->b_addr;
7828c2ecf20Sopenharmony_ci	xfs_da3_node_hdr_from_disk(dp->i_mount, &nodehdr, node);
7838c2ecf20Sopenharmony_ci
7848c2ecf20Sopenharmony_ci	/*
7858c2ecf20Sopenharmony_ci	 * With V2 dirs the extra block is data or freespace.
7868c2ecf20Sopenharmony_ci	 */
7878c2ecf20Sopenharmony_ci	useextra = state->extravalid && state->args->whichfork == XFS_ATTR_FORK;
7888c2ecf20Sopenharmony_ci	newcount = 1 + useextra;
7898c2ecf20Sopenharmony_ci	/*
7908c2ecf20Sopenharmony_ci	 * Do we have to split the node?
7918c2ecf20Sopenharmony_ci	 */
7928c2ecf20Sopenharmony_ci	if (nodehdr.count + newcount > state->args->geo->node_ents) {
7938c2ecf20Sopenharmony_ci		/*
7948c2ecf20Sopenharmony_ci		 * Allocate a new node, add to the doubly linked chain of
7958c2ecf20Sopenharmony_ci		 * nodes, then move some of our excess entries into it.
7968c2ecf20Sopenharmony_ci		 */
7978c2ecf20Sopenharmony_ci		error = xfs_da_grow_inode(state->args, &blkno);
7988c2ecf20Sopenharmony_ci		if (error)
7998c2ecf20Sopenharmony_ci			return error;	/* GROT: dir is inconsistent */
8008c2ecf20Sopenharmony_ci
8018c2ecf20Sopenharmony_ci		error = xfs_da3_node_create(state->args, blkno, treelevel,
8028c2ecf20Sopenharmony_ci					   &newblk->bp, state->args->whichfork);
8038c2ecf20Sopenharmony_ci		if (error)
8048c2ecf20Sopenharmony_ci			return error;	/* GROT: dir is inconsistent */
8058c2ecf20Sopenharmony_ci		newblk->blkno = blkno;
8068c2ecf20Sopenharmony_ci		newblk->magic = XFS_DA_NODE_MAGIC;
8078c2ecf20Sopenharmony_ci		xfs_da3_node_rebalance(state, oldblk, newblk);
8088c2ecf20Sopenharmony_ci		error = xfs_da3_blk_link(state, oldblk, newblk);
8098c2ecf20Sopenharmony_ci		if (error)
8108c2ecf20Sopenharmony_ci			return error;
8118c2ecf20Sopenharmony_ci		*result = 1;
8128c2ecf20Sopenharmony_ci	} else {
8138c2ecf20Sopenharmony_ci		*result = 0;
8148c2ecf20Sopenharmony_ci	}
8158c2ecf20Sopenharmony_ci
8168c2ecf20Sopenharmony_ci	/*
8178c2ecf20Sopenharmony_ci	 * Insert the new entry(s) into the correct block
8188c2ecf20Sopenharmony_ci	 * (updating last hashval in the process).
8198c2ecf20Sopenharmony_ci	 *
8208c2ecf20Sopenharmony_ci	 * xfs_da3_node_add() inserts BEFORE the given index,
8218c2ecf20Sopenharmony_ci	 * and as a result of using node_lookup_int() we always
8228c2ecf20Sopenharmony_ci	 * point to a valid entry (not after one), but a split
8238c2ecf20Sopenharmony_ci	 * operation always results in a new block whose hashvals
8248c2ecf20Sopenharmony_ci	 * FOLLOW the current block.
8258c2ecf20Sopenharmony_ci	 *
8268c2ecf20Sopenharmony_ci	 * If we had double-split op below us, then add the extra block too.
8278c2ecf20Sopenharmony_ci	 */
8288c2ecf20Sopenharmony_ci	node = oldblk->bp->b_addr;
8298c2ecf20Sopenharmony_ci	xfs_da3_node_hdr_from_disk(dp->i_mount, &nodehdr, node);
8308c2ecf20Sopenharmony_ci	if (oldblk->index <= nodehdr.count) {
8318c2ecf20Sopenharmony_ci		oldblk->index++;
8328c2ecf20Sopenharmony_ci		xfs_da3_node_add(state, oldblk, addblk);
8338c2ecf20Sopenharmony_ci		if (useextra) {
8348c2ecf20Sopenharmony_ci			if (state->extraafter)
8358c2ecf20Sopenharmony_ci				oldblk->index++;
8368c2ecf20Sopenharmony_ci			xfs_da3_node_add(state, oldblk, &state->extrablk);
8378c2ecf20Sopenharmony_ci			state->extravalid = 0;
8388c2ecf20Sopenharmony_ci		}
8398c2ecf20Sopenharmony_ci	} else {
8408c2ecf20Sopenharmony_ci		newblk->index++;
8418c2ecf20Sopenharmony_ci		xfs_da3_node_add(state, newblk, addblk);
8428c2ecf20Sopenharmony_ci		if (useextra) {
8438c2ecf20Sopenharmony_ci			if (state->extraafter)
8448c2ecf20Sopenharmony_ci				newblk->index++;
8458c2ecf20Sopenharmony_ci			xfs_da3_node_add(state, newblk, &state->extrablk);
8468c2ecf20Sopenharmony_ci			state->extravalid = 0;
8478c2ecf20Sopenharmony_ci		}
8488c2ecf20Sopenharmony_ci	}
8498c2ecf20Sopenharmony_ci
8508c2ecf20Sopenharmony_ci	return 0;
8518c2ecf20Sopenharmony_ci}
8528c2ecf20Sopenharmony_ci
8538c2ecf20Sopenharmony_ci/*
8548c2ecf20Sopenharmony_ci * Balance the btree elements between two intermediate nodes,
8558c2ecf20Sopenharmony_ci * usually one full and one empty.
8568c2ecf20Sopenharmony_ci *
8578c2ecf20Sopenharmony_ci * NOTE: if blk2 is empty, then it will get the upper half of blk1.
8588c2ecf20Sopenharmony_ci */
8598c2ecf20Sopenharmony_ciSTATIC void
8608c2ecf20Sopenharmony_cixfs_da3_node_rebalance(
8618c2ecf20Sopenharmony_ci	struct xfs_da_state	*state,
8628c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*blk1,
8638c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*blk2)
8648c2ecf20Sopenharmony_ci{
8658c2ecf20Sopenharmony_ci	struct xfs_da_intnode	*node1;
8668c2ecf20Sopenharmony_ci	struct xfs_da_intnode	*node2;
8678c2ecf20Sopenharmony_ci	struct xfs_da_intnode	*tmpnode;
8688c2ecf20Sopenharmony_ci	struct xfs_da_node_entry *btree1;
8698c2ecf20Sopenharmony_ci	struct xfs_da_node_entry *btree2;
8708c2ecf20Sopenharmony_ci	struct xfs_da_node_entry *btree_s;
8718c2ecf20Sopenharmony_ci	struct xfs_da_node_entry *btree_d;
8728c2ecf20Sopenharmony_ci	struct xfs_da3_icnode_hdr nodehdr1;
8738c2ecf20Sopenharmony_ci	struct xfs_da3_icnode_hdr nodehdr2;
8748c2ecf20Sopenharmony_ci	struct xfs_trans	*tp;
8758c2ecf20Sopenharmony_ci	int			count;
8768c2ecf20Sopenharmony_ci	int			tmp;
8778c2ecf20Sopenharmony_ci	int			swap = 0;
8788c2ecf20Sopenharmony_ci	struct xfs_inode	*dp = state->args->dp;
8798c2ecf20Sopenharmony_ci
8808c2ecf20Sopenharmony_ci	trace_xfs_da_node_rebalance(state->args);
8818c2ecf20Sopenharmony_ci
8828c2ecf20Sopenharmony_ci	node1 = blk1->bp->b_addr;
8838c2ecf20Sopenharmony_ci	node2 = blk2->bp->b_addr;
8848c2ecf20Sopenharmony_ci	xfs_da3_node_hdr_from_disk(dp->i_mount, &nodehdr1, node1);
8858c2ecf20Sopenharmony_ci	xfs_da3_node_hdr_from_disk(dp->i_mount, &nodehdr2, node2);
8868c2ecf20Sopenharmony_ci	btree1 = nodehdr1.btree;
8878c2ecf20Sopenharmony_ci	btree2 = nodehdr2.btree;
8888c2ecf20Sopenharmony_ci
8898c2ecf20Sopenharmony_ci	/*
8908c2ecf20Sopenharmony_ci	 * Figure out how many entries need to move, and in which direction.
8918c2ecf20Sopenharmony_ci	 * Swap the nodes around if that makes it simpler.
8928c2ecf20Sopenharmony_ci	 */
8938c2ecf20Sopenharmony_ci	if (nodehdr1.count > 0 && nodehdr2.count > 0 &&
8948c2ecf20Sopenharmony_ci	    ((be32_to_cpu(btree2[0].hashval) < be32_to_cpu(btree1[0].hashval)) ||
8958c2ecf20Sopenharmony_ci	     (be32_to_cpu(btree2[nodehdr2.count - 1].hashval) <
8968c2ecf20Sopenharmony_ci			be32_to_cpu(btree1[nodehdr1.count - 1].hashval)))) {
8978c2ecf20Sopenharmony_ci		tmpnode = node1;
8988c2ecf20Sopenharmony_ci		node1 = node2;
8998c2ecf20Sopenharmony_ci		node2 = tmpnode;
9008c2ecf20Sopenharmony_ci		xfs_da3_node_hdr_from_disk(dp->i_mount, &nodehdr1, node1);
9018c2ecf20Sopenharmony_ci		xfs_da3_node_hdr_from_disk(dp->i_mount, &nodehdr2, node2);
9028c2ecf20Sopenharmony_ci		btree1 = nodehdr1.btree;
9038c2ecf20Sopenharmony_ci		btree2 = nodehdr2.btree;
9048c2ecf20Sopenharmony_ci		swap = 1;
9058c2ecf20Sopenharmony_ci	}
9068c2ecf20Sopenharmony_ci
9078c2ecf20Sopenharmony_ci	count = (nodehdr1.count - nodehdr2.count) / 2;
9088c2ecf20Sopenharmony_ci	if (count == 0)
9098c2ecf20Sopenharmony_ci		return;
9108c2ecf20Sopenharmony_ci	tp = state->args->trans;
9118c2ecf20Sopenharmony_ci	/*
9128c2ecf20Sopenharmony_ci	 * Two cases: high-to-low and low-to-high.
9138c2ecf20Sopenharmony_ci	 */
9148c2ecf20Sopenharmony_ci	if (count > 0) {
9158c2ecf20Sopenharmony_ci		/*
9168c2ecf20Sopenharmony_ci		 * Move elements in node2 up to make a hole.
9178c2ecf20Sopenharmony_ci		 */
9188c2ecf20Sopenharmony_ci		tmp = nodehdr2.count;
9198c2ecf20Sopenharmony_ci		if (tmp > 0) {
9208c2ecf20Sopenharmony_ci			tmp *= (uint)sizeof(xfs_da_node_entry_t);
9218c2ecf20Sopenharmony_ci			btree_s = &btree2[0];
9228c2ecf20Sopenharmony_ci			btree_d = &btree2[count];
9238c2ecf20Sopenharmony_ci			memmove(btree_d, btree_s, tmp);
9248c2ecf20Sopenharmony_ci		}
9258c2ecf20Sopenharmony_ci
9268c2ecf20Sopenharmony_ci		/*
9278c2ecf20Sopenharmony_ci		 * Move the req'd B-tree elements from high in node1 to
9288c2ecf20Sopenharmony_ci		 * low in node2.
9298c2ecf20Sopenharmony_ci		 */
9308c2ecf20Sopenharmony_ci		nodehdr2.count += count;
9318c2ecf20Sopenharmony_ci		tmp = count * (uint)sizeof(xfs_da_node_entry_t);
9328c2ecf20Sopenharmony_ci		btree_s = &btree1[nodehdr1.count - count];
9338c2ecf20Sopenharmony_ci		btree_d = &btree2[0];
9348c2ecf20Sopenharmony_ci		memcpy(btree_d, btree_s, tmp);
9358c2ecf20Sopenharmony_ci		nodehdr1.count -= count;
9368c2ecf20Sopenharmony_ci	} else {
9378c2ecf20Sopenharmony_ci		/*
9388c2ecf20Sopenharmony_ci		 * Move the req'd B-tree elements from low in node2 to
9398c2ecf20Sopenharmony_ci		 * high in node1.
9408c2ecf20Sopenharmony_ci		 */
9418c2ecf20Sopenharmony_ci		count = -count;
9428c2ecf20Sopenharmony_ci		tmp = count * (uint)sizeof(xfs_da_node_entry_t);
9438c2ecf20Sopenharmony_ci		btree_s = &btree2[0];
9448c2ecf20Sopenharmony_ci		btree_d = &btree1[nodehdr1.count];
9458c2ecf20Sopenharmony_ci		memcpy(btree_d, btree_s, tmp);
9468c2ecf20Sopenharmony_ci		nodehdr1.count += count;
9478c2ecf20Sopenharmony_ci
9488c2ecf20Sopenharmony_ci		xfs_trans_log_buf(tp, blk1->bp,
9498c2ecf20Sopenharmony_ci			XFS_DA_LOGRANGE(node1, btree_d, tmp));
9508c2ecf20Sopenharmony_ci
9518c2ecf20Sopenharmony_ci		/*
9528c2ecf20Sopenharmony_ci		 * Move elements in node2 down to fill the hole.
9538c2ecf20Sopenharmony_ci		 */
9548c2ecf20Sopenharmony_ci		tmp  = nodehdr2.count - count;
9558c2ecf20Sopenharmony_ci		tmp *= (uint)sizeof(xfs_da_node_entry_t);
9568c2ecf20Sopenharmony_ci		btree_s = &btree2[count];
9578c2ecf20Sopenharmony_ci		btree_d = &btree2[0];
9588c2ecf20Sopenharmony_ci		memmove(btree_d, btree_s, tmp);
9598c2ecf20Sopenharmony_ci		nodehdr2.count -= count;
9608c2ecf20Sopenharmony_ci	}
9618c2ecf20Sopenharmony_ci
9628c2ecf20Sopenharmony_ci	/*
9638c2ecf20Sopenharmony_ci	 * Log header of node 1 and all current bits of node 2.
9648c2ecf20Sopenharmony_ci	 */
9658c2ecf20Sopenharmony_ci	xfs_da3_node_hdr_to_disk(dp->i_mount, node1, &nodehdr1);
9668c2ecf20Sopenharmony_ci	xfs_trans_log_buf(tp, blk1->bp,
9678c2ecf20Sopenharmony_ci		XFS_DA_LOGRANGE(node1, &node1->hdr,
9688c2ecf20Sopenharmony_ci				state->args->geo->node_hdr_size));
9698c2ecf20Sopenharmony_ci
9708c2ecf20Sopenharmony_ci	xfs_da3_node_hdr_to_disk(dp->i_mount, node2, &nodehdr2);
9718c2ecf20Sopenharmony_ci	xfs_trans_log_buf(tp, blk2->bp,
9728c2ecf20Sopenharmony_ci		XFS_DA_LOGRANGE(node2, &node2->hdr,
9738c2ecf20Sopenharmony_ci				state->args->geo->node_hdr_size +
9748c2ecf20Sopenharmony_ci				(sizeof(btree2[0]) * nodehdr2.count)));
9758c2ecf20Sopenharmony_ci
9768c2ecf20Sopenharmony_ci	/*
9778c2ecf20Sopenharmony_ci	 * Record the last hashval from each block for upward propagation.
9788c2ecf20Sopenharmony_ci	 * (note: don't use the swapped node pointers)
9798c2ecf20Sopenharmony_ci	 */
9808c2ecf20Sopenharmony_ci	if (swap) {
9818c2ecf20Sopenharmony_ci		node1 = blk1->bp->b_addr;
9828c2ecf20Sopenharmony_ci		node2 = blk2->bp->b_addr;
9838c2ecf20Sopenharmony_ci		xfs_da3_node_hdr_from_disk(dp->i_mount, &nodehdr1, node1);
9848c2ecf20Sopenharmony_ci		xfs_da3_node_hdr_from_disk(dp->i_mount, &nodehdr2, node2);
9858c2ecf20Sopenharmony_ci		btree1 = nodehdr1.btree;
9868c2ecf20Sopenharmony_ci		btree2 = nodehdr2.btree;
9878c2ecf20Sopenharmony_ci	}
9888c2ecf20Sopenharmony_ci	blk1->hashval = be32_to_cpu(btree1[nodehdr1.count - 1].hashval);
9898c2ecf20Sopenharmony_ci	blk2->hashval = be32_to_cpu(btree2[nodehdr2.count - 1].hashval);
9908c2ecf20Sopenharmony_ci
9918c2ecf20Sopenharmony_ci	/*
9928c2ecf20Sopenharmony_ci	 * Adjust the expected index for insertion.
9938c2ecf20Sopenharmony_ci	 */
9948c2ecf20Sopenharmony_ci	if (blk1->index >= nodehdr1.count) {
9958c2ecf20Sopenharmony_ci		blk2->index = blk1->index - nodehdr1.count;
9968c2ecf20Sopenharmony_ci		blk1->index = nodehdr1.count + 1;	/* make it invalid */
9978c2ecf20Sopenharmony_ci	}
9988c2ecf20Sopenharmony_ci}
9998c2ecf20Sopenharmony_ci
10008c2ecf20Sopenharmony_ci/*
10018c2ecf20Sopenharmony_ci * Add a new entry to an intermediate node.
10028c2ecf20Sopenharmony_ci */
10038c2ecf20Sopenharmony_ciSTATIC void
10048c2ecf20Sopenharmony_cixfs_da3_node_add(
10058c2ecf20Sopenharmony_ci	struct xfs_da_state	*state,
10068c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*oldblk,
10078c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*newblk)
10088c2ecf20Sopenharmony_ci{
10098c2ecf20Sopenharmony_ci	struct xfs_da_intnode	*node;
10108c2ecf20Sopenharmony_ci	struct xfs_da3_icnode_hdr nodehdr;
10118c2ecf20Sopenharmony_ci	struct xfs_da_node_entry *btree;
10128c2ecf20Sopenharmony_ci	int			tmp;
10138c2ecf20Sopenharmony_ci	struct xfs_inode	*dp = state->args->dp;
10148c2ecf20Sopenharmony_ci
10158c2ecf20Sopenharmony_ci	trace_xfs_da_node_add(state->args);
10168c2ecf20Sopenharmony_ci
10178c2ecf20Sopenharmony_ci	node = oldblk->bp->b_addr;
10188c2ecf20Sopenharmony_ci	xfs_da3_node_hdr_from_disk(dp->i_mount, &nodehdr, node);
10198c2ecf20Sopenharmony_ci	btree = nodehdr.btree;
10208c2ecf20Sopenharmony_ci
10218c2ecf20Sopenharmony_ci	ASSERT(oldblk->index >= 0 && oldblk->index <= nodehdr.count);
10228c2ecf20Sopenharmony_ci	ASSERT(newblk->blkno != 0);
10238c2ecf20Sopenharmony_ci	if (state->args->whichfork == XFS_DATA_FORK)
10248c2ecf20Sopenharmony_ci		ASSERT(newblk->blkno >= state->args->geo->leafblk &&
10258c2ecf20Sopenharmony_ci		       newblk->blkno < state->args->geo->freeblk);
10268c2ecf20Sopenharmony_ci
10278c2ecf20Sopenharmony_ci	/*
10288c2ecf20Sopenharmony_ci	 * We may need to make some room before we insert the new node.
10298c2ecf20Sopenharmony_ci	 */
10308c2ecf20Sopenharmony_ci	tmp = 0;
10318c2ecf20Sopenharmony_ci	if (oldblk->index < nodehdr.count) {
10328c2ecf20Sopenharmony_ci		tmp = (nodehdr.count - oldblk->index) * (uint)sizeof(*btree);
10338c2ecf20Sopenharmony_ci		memmove(&btree[oldblk->index + 1], &btree[oldblk->index], tmp);
10348c2ecf20Sopenharmony_ci	}
10358c2ecf20Sopenharmony_ci	btree[oldblk->index].hashval = cpu_to_be32(newblk->hashval);
10368c2ecf20Sopenharmony_ci	btree[oldblk->index].before = cpu_to_be32(newblk->blkno);
10378c2ecf20Sopenharmony_ci	xfs_trans_log_buf(state->args->trans, oldblk->bp,
10388c2ecf20Sopenharmony_ci		XFS_DA_LOGRANGE(node, &btree[oldblk->index],
10398c2ecf20Sopenharmony_ci				tmp + sizeof(*btree)));
10408c2ecf20Sopenharmony_ci
10418c2ecf20Sopenharmony_ci	nodehdr.count += 1;
10428c2ecf20Sopenharmony_ci	xfs_da3_node_hdr_to_disk(dp->i_mount, node, &nodehdr);
10438c2ecf20Sopenharmony_ci	xfs_trans_log_buf(state->args->trans, oldblk->bp,
10448c2ecf20Sopenharmony_ci		XFS_DA_LOGRANGE(node, &node->hdr,
10458c2ecf20Sopenharmony_ci				state->args->geo->node_hdr_size));
10468c2ecf20Sopenharmony_ci
10478c2ecf20Sopenharmony_ci	/*
10488c2ecf20Sopenharmony_ci	 * Copy the last hash value from the oldblk to propagate upwards.
10498c2ecf20Sopenharmony_ci	 */
10508c2ecf20Sopenharmony_ci	oldblk->hashval = be32_to_cpu(btree[nodehdr.count - 1].hashval);
10518c2ecf20Sopenharmony_ci}
10528c2ecf20Sopenharmony_ci
10538c2ecf20Sopenharmony_ci/*========================================================================
10548c2ecf20Sopenharmony_ci * Routines used for shrinking the Btree.
10558c2ecf20Sopenharmony_ci *========================================================================*/
10568c2ecf20Sopenharmony_ci
10578c2ecf20Sopenharmony_ci/*
10588c2ecf20Sopenharmony_ci * Deallocate an empty leaf node, remove it from its parent,
10598c2ecf20Sopenharmony_ci * possibly deallocating that block, etc...
10608c2ecf20Sopenharmony_ci */
10618c2ecf20Sopenharmony_ciint
10628c2ecf20Sopenharmony_cixfs_da3_join(
10638c2ecf20Sopenharmony_ci	struct xfs_da_state	*state)
10648c2ecf20Sopenharmony_ci{
10658c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*drop_blk;
10668c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*save_blk;
10678c2ecf20Sopenharmony_ci	int			action = 0;
10688c2ecf20Sopenharmony_ci	int			error;
10698c2ecf20Sopenharmony_ci
10708c2ecf20Sopenharmony_ci	trace_xfs_da_join(state->args);
10718c2ecf20Sopenharmony_ci
10728c2ecf20Sopenharmony_ci	drop_blk = &state->path.blk[ state->path.active-1 ];
10738c2ecf20Sopenharmony_ci	save_blk = &state->altpath.blk[ state->path.active-1 ];
10748c2ecf20Sopenharmony_ci	ASSERT(state->path.blk[0].magic == XFS_DA_NODE_MAGIC);
10758c2ecf20Sopenharmony_ci	ASSERT(drop_blk->magic == XFS_ATTR_LEAF_MAGIC ||
10768c2ecf20Sopenharmony_ci	       drop_blk->magic == XFS_DIR2_LEAFN_MAGIC);
10778c2ecf20Sopenharmony_ci
10788c2ecf20Sopenharmony_ci	/*
10798c2ecf20Sopenharmony_ci	 * Walk back up the tree joining/deallocating as necessary.
10808c2ecf20Sopenharmony_ci	 * When we stop dropping blocks, break out.
10818c2ecf20Sopenharmony_ci	 */
10828c2ecf20Sopenharmony_ci	for (  ; state->path.active >= 2; drop_blk--, save_blk--,
10838c2ecf20Sopenharmony_ci		 state->path.active--) {
10848c2ecf20Sopenharmony_ci		/*
10858c2ecf20Sopenharmony_ci		 * See if we can combine the block with a neighbor.
10868c2ecf20Sopenharmony_ci		 *   (action == 0) => no options, just leave
10878c2ecf20Sopenharmony_ci		 *   (action == 1) => coalesce, then unlink
10888c2ecf20Sopenharmony_ci		 *   (action == 2) => block empty, unlink it
10898c2ecf20Sopenharmony_ci		 */
10908c2ecf20Sopenharmony_ci		switch (drop_blk->magic) {
10918c2ecf20Sopenharmony_ci		case XFS_ATTR_LEAF_MAGIC:
10928c2ecf20Sopenharmony_ci			error = xfs_attr3_leaf_toosmall(state, &action);
10938c2ecf20Sopenharmony_ci			if (error)
10948c2ecf20Sopenharmony_ci				return error;
10958c2ecf20Sopenharmony_ci			if (action == 0)
10968c2ecf20Sopenharmony_ci				return 0;
10978c2ecf20Sopenharmony_ci			xfs_attr3_leaf_unbalance(state, drop_blk, save_blk);
10988c2ecf20Sopenharmony_ci			break;
10998c2ecf20Sopenharmony_ci		case XFS_DIR2_LEAFN_MAGIC:
11008c2ecf20Sopenharmony_ci			error = xfs_dir2_leafn_toosmall(state, &action);
11018c2ecf20Sopenharmony_ci			if (error)
11028c2ecf20Sopenharmony_ci				return error;
11038c2ecf20Sopenharmony_ci			if (action == 0)
11048c2ecf20Sopenharmony_ci				return 0;
11058c2ecf20Sopenharmony_ci			xfs_dir2_leafn_unbalance(state, drop_blk, save_blk);
11068c2ecf20Sopenharmony_ci			break;
11078c2ecf20Sopenharmony_ci		case XFS_DA_NODE_MAGIC:
11088c2ecf20Sopenharmony_ci			/*
11098c2ecf20Sopenharmony_ci			 * Remove the offending node, fixup hashvals,
11108c2ecf20Sopenharmony_ci			 * check for a toosmall neighbor.
11118c2ecf20Sopenharmony_ci			 */
11128c2ecf20Sopenharmony_ci			xfs_da3_node_remove(state, drop_blk);
11138c2ecf20Sopenharmony_ci			xfs_da3_fixhashpath(state, &state->path);
11148c2ecf20Sopenharmony_ci			error = xfs_da3_node_toosmall(state, &action);
11158c2ecf20Sopenharmony_ci			if (error)
11168c2ecf20Sopenharmony_ci				return error;
11178c2ecf20Sopenharmony_ci			if (action == 0)
11188c2ecf20Sopenharmony_ci				return 0;
11198c2ecf20Sopenharmony_ci			xfs_da3_node_unbalance(state, drop_blk, save_blk);
11208c2ecf20Sopenharmony_ci			break;
11218c2ecf20Sopenharmony_ci		}
11228c2ecf20Sopenharmony_ci		xfs_da3_fixhashpath(state, &state->altpath);
11238c2ecf20Sopenharmony_ci		error = xfs_da3_blk_unlink(state, drop_blk, save_blk);
11248c2ecf20Sopenharmony_ci		xfs_da_state_kill_altpath(state);
11258c2ecf20Sopenharmony_ci		if (error)
11268c2ecf20Sopenharmony_ci			return error;
11278c2ecf20Sopenharmony_ci		error = xfs_da_shrink_inode(state->args, drop_blk->blkno,
11288c2ecf20Sopenharmony_ci							 drop_blk->bp);
11298c2ecf20Sopenharmony_ci		drop_blk->bp = NULL;
11308c2ecf20Sopenharmony_ci		if (error)
11318c2ecf20Sopenharmony_ci			return error;
11328c2ecf20Sopenharmony_ci	}
11338c2ecf20Sopenharmony_ci	/*
11348c2ecf20Sopenharmony_ci	 * We joined all the way to the top.  If it turns out that
11358c2ecf20Sopenharmony_ci	 * we only have one entry in the root, make the child block
11368c2ecf20Sopenharmony_ci	 * the new root.
11378c2ecf20Sopenharmony_ci	 */
11388c2ecf20Sopenharmony_ci	xfs_da3_node_remove(state, drop_blk);
11398c2ecf20Sopenharmony_ci	xfs_da3_fixhashpath(state, &state->path);
11408c2ecf20Sopenharmony_ci	error = xfs_da3_root_join(state, &state->path.blk[0]);
11418c2ecf20Sopenharmony_ci	return error;
11428c2ecf20Sopenharmony_ci}
11438c2ecf20Sopenharmony_ci
11448c2ecf20Sopenharmony_ci#ifdef	DEBUG
11458c2ecf20Sopenharmony_cistatic void
11468c2ecf20Sopenharmony_cixfs_da_blkinfo_onlychild_validate(struct xfs_da_blkinfo *blkinfo, __u16 level)
11478c2ecf20Sopenharmony_ci{
11488c2ecf20Sopenharmony_ci	__be16	magic = blkinfo->magic;
11498c2ecf20Sopenharmony_ci
11508c2ecf20Sopenharmony_ci	if (level == 1) {
11518c2ecf20Sopenharmony_ci		ASSERT(magic == cpu_to_be16(XFS_DIR2_LEAFN_MAGIC) ||
11528c2ecf20Sopenharmony_ci		       magic == cpu_to_be16(XFS_DIR3_LEAFN_MAGIC) ||
11538c2ecf20Sopenharmony_ci		       magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC) ||
11548c2ecf20Sopenharmony_ci		       magic == cpu_to_be16(XFS_ATTR3_LEAF_MAGIC));
11558c2ecf20Sopenharmony_ci	} else {
11568c2ecf20Sopenharmony_ci		ASSERT(magic == cpu_to_be16(XFS_DA_NODE_MAGIC) ||
11578c2ecf20Sopenharmony_ci		       magic == cpu_to_be16(XFS_DA3_NODE_MAGIC));
11588c2ecf20Sopenharmony_ci	}
11598c2ecf20Sopenharmony_ci	ASSERT(!blkinfo->forw);
11608c2ecf20Sopenharmony_ci	ASSERT(!blkinfo->back);
11618c2ecf20Sopenharmony_ci}
11628c2ecf20Sopenharmony_ci#else	/* !DEBUG */
11638c2ecf20Sopenharmony_ci#define	xfs_da_blkinfo_onlychild_validate(blkinfo, level)
11648c2ecf20Sopenharmony_ci#endif	/* !DEBUG */
11658c2ecf20Sopenharmony_ci
11668c2ecf20Sopenharmony_ci/*
11678c2ecf20Sopenharmony_ci * We have only one entry in the root.  Copy the only remaining child of
11688c2ecf20Sopenharmony_ci * the old root to block 0 as the new root node.
11698c2ecf20Sopenharmony_ci */
11708c2ecf20Sopenharmony_ciSTATIC int
11718c2ecf20Sopenharmony_cixfs_da3_root_join(
11728c2ecf20Sopenharmony_ci	struct xfs_da_state	*state,
11738c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*root_blk)
11748c2ecf20Sopenharmony_ci{
11758c2ecf20Sopenharmony_ci	struct xfs_da_intnode	*oldroot;
11768c2ecf20Sopenharmony_ci	struct xfs_da_args	*args;
11778c2ecf20Sopenharmony_ci	xfs_dablk_t		child;
11788c2ecf20Sopenharmony_ci	struct xfs_buf		*bp;
11798c2ecf20Sopenharmony_ci	struct xfs_da3_icnode_hdr oldroothdr;
11808c2ecf20Sopenharmony_ci	int			error;
11818c2ecf20Sopenharmony_ci	struct xfs_inode	*dp = state->args->dp;
11828c2ecf20Sopenharmony_ci
11838c2ecf20Sopenharmony_ci	trace_xfs_da_root_join(state->args);
11848c2ecf20Sopenharmony_ci
11858c2ecf20Sopenharmony_ci	ASSERT(root_blk->magic == XFS_DA_NODE_MAGIC);
11868c2ecf20Sopenharmony_ci
11878c2ecf20Sopenharmony_ci	args = state->args;
11888c2ecf20Sopenharmony_ci	oldroot = root_blk->bp->b_addr;
11898c2ecf20Sopenharmony_ci	xfs_da3_node_hdr_from_disk(dp->i_mount, &oldroothdr, oldroot);
11908c2ecf20Sopenharmony_ci	ASSERT(oldroothdr.forw == 0);
11918c2ecf20Sopenharmony_ci	ASSERT(oldroothdr.back == 0);
11928c2ecf20Sopenharmony_ci
11938c2ecf20Sopenharmony_ci	/*
11948c2ecf20Sopenharmony_ci	 * If the root has more than one child, then don't do anything.
11958c2ecf20Sopenharmony_ci	 */
11968c2ecf20Sopenharmony_ci	if (oldroothdr.count > 1)
11978c2ecf20Sopenharmony_ci		return 0;
11988c2ecf20Sopenharmony_ci
11998c2ecf20Sopenharmony_ci	/*
12008c2ecf20Sopenharmony_ci	 * Read in the (only) child block, then copy those bytes into
12018c2ecf20Sopenharmony_ci	 * the root block's buffer and free the original child block.
12028c2ecf20Sopenharmony_ci	 */
12038c2ecf20Sopenharmony_ci	child = be32_to_cpu(oldroothdr.btree[0].before);
12048c2ecf20Sopenharmony_ci	ASSERT(child != 0);
12058c2ecf20Sopenharmony_ci	error = xfs_da3_node_read(args->trans, dp, child, &bp, args->whichfork);
12068c2ecf20Sopenharmony_ci	if (error)
12078c2ecf20Sopenharmony_ci		return error;
12088c2ecf20Sopenharmony_ci	xfs_da_blkinfo_onlychild_validate(bp->b_addr, oldroothdr.level);
12098c2ecf20Sopenharmony_ci
12108c2ecf20Sopenharmony_ci	/*
12118c2ecf20Sopenharmony_ci	 * This could be copying a leaf back into the root block in the case of
12128c2ecf20Sopenharmony_ci	 * there only being a single leaf block left in the tree. Hence we have
12138c2ecf20Sopenharmony_ci	 * to update the b_ops pointer as well to match the buffer type change
12148c2ecf20Sopenharmony_ci	 * that could occur. For dir3 blocks we also need to update the block
12158c2ecf20Sopenharmony_ci	 * number in the buffer header.
12168c2ecf20Sopenharmony_ci	 */
12178c2ecf20Sopenharmony_ci	memcpy(root_blk->bp->b_addr, bp->b_addr, args->geo->blksize);
12188c2ecf20Sopenharmony_ci	root_blk->bp->b_ops = bp->b_ops;
12198c2ecf20Sopenharmony_ci	xfs_trans_buf_copy_type(root_blk->bp, bp);
12208c2ecf20Sopenharmony_ci	if (oldroothdr.magic == XFS_DA3_NODE_MAGIC) {
12218c2ecf20Sopenharmony_ci		struct xfs_da3_blkinfo *da3 = root_blk->bp->b_addr;
12228c2ecf20Sopenharmony_ci		da3->blkno = cpu_to_be64(root_blk->bp->b_bn);
12238c2ecf20Sopenharmony_ci	}
12248c2ecf20Sopenharmony_ci	xfs_trans_log_buf(args->trans, root_blk->bp, 0,
12258c2ecf20Sopenharmony_ci			  args->geo->blksize - 1);
12268c2ecf20Sopenharmony_ci	error = xfs_da_shrink_inode(args, child, bp);
12278c2ecf20Sopenharmony_ci	return error;
12288c2ecf20Sopenharmony_ci}
12298c2ecf20Sopenharmony_ci
12308c2ecf20Sopenharmony_ci/*
12318c2ecf20Sopenharmony_ci * Check a node block and its neighbors to see if the block should be
12328c2ecf20Sopenharmony_ci * collapsed into one or the other neighbor.  Always keep the block
12338c2ecf20Sopenharmony_ci * with the smaller block number.
12348c2ecf20Sopenharmony_ci * If the current block is over 50% full, don't try to join it, return 0.
12358c2ecf20Sopenharmony_ci * If the block is empty, fill in the state structure and return 2.
12368c2ecf20Sopenharmony_ci * If it can be collapsed, fill in the state structure and return 1.
12378c2ecf20Sopenharmony_ci * If nothing can be done, return 0.
12388c2ecf20Sopenharmony_ci */
12398c2ecf20Sopenharmony_ciSTATIC int
12408c2ecf20Sopenharmony_cixfs_da3_node_toosmall(
12418c2ecf20Sopenharmony_ci	struct xfs_da_state	*state,
12428c2ecf20Sopenharmony_ci	int			*action)
12438c2ecf20Sopenharmony_ci{
12448c2ecf20Sopenharmony_ci	struct xfs_da_intnode	*node;
12458c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*blk;
12468c2ecf20Sopenharmony_ci	struct xfs_da_blkinfo	*info;
12478c2ecf20Sopenharmony_ci	xfs_dablk_t		blkno;
12488c2ecf20Sopenharmony_ci	struct xfs_buf		*bp;
12498c2ecf20Sopenharmony_ci	struct xfs_da3_icnode_hdr nodehdr;
12508c2ecf20Sopenharmony_ci	int			count;
12518c2ecf20Sopenharmony_ci	int			forward;
12528c2ecf20Sopenharmony_ci	int			error;
12538c2ecf20Sopenharmony_ci	int			retval;
12548c2ecf20Sopenharmony_ci	int			i;
12558c2ecf20Sopenharmony_ci	struct xfs_inode	*dp = state->args->dp;
12568c2ecf20Sopenharmony_ci
12578c2ecf20Sopenharmony_ci	trace_xfs_da_node_toosmall(state->args);
12588c2ecf20Sopenharmony_ci
12598c2ecf20Sopenharmony_ci	/*
12608c2ecf20Sopenharmony_ci	 * Check for the degenerate case of the block being over 50% full.
12618c2ecf20Sopenharmony_ci	 * If so, it's not worth even looking to see if we might be able
12628c2ecf20Sopenharmony_ci	 * to coalesce with a sibling.
12638c2ecf20Sopenharmony_ci	 */
12648c2ecf20Sopenharmony_ci	blk = &state->path.blk[ state->path.active-1 ];
12658c2ecf20Sopenharmony_ci	info = blk->bp->b_addr;
12668c2ecf20Sopenharmony_ci	node = (xfs_da_intnode_t *)info;
12678c2ecf20Sopenharmony_ci	xfs_da3_node_hdr_from_disk(dp->i_mount, &nodehdr, node);
12688c2ecf20Sopenharmony_ci	if (nodehdr.count > (state->args->geo->node_ents >> 1)) {
12698c2ecf20Sopenharmony_ci		*action = 0;	/* blk over 50%, don't try to join */
12708c2ecf20Sopenharmony_ci		return 0;	/* blk over 50%, don't try to join */
12718c2ecf20Sopenharmony_ci	}
12728c2ecf20Sopenharmony_ci
12738c2ecf20Sopenharmony_ci	/*
12748c2ecf20Sopenharmony_ci	 * Check for the degenerate case of the block being empty.
12758c2ecf20Sopenharmony_ci	 * If the block is empty, we'll simply delete it, no need to
12768c2ecf20Sopenharmony_ci	 * coalesce it with a sibling block.  We choose (arbitrarily)
12778c2ecf20Sopenharmony_ci	 * to merge with the forward block unless it is NULL.
12788c2ecf20Sopenharmony_ci	 */
12798c2ecf20Sopenharmony_ci	if (nodehdr.count == 0) {
12808c2ecf20Sopenharmony_ci		/*
12818c2ecf20Sopenharmony_ci		 * Make altpath point to the block we want to keep and
12828c2ecf20Sopenharmony_ci		 * path point to the block we want to drop (this one).
12838c2ecf20Sopenharmony_ci		 */
12848c2ecf20Sopenharmony_ci		forward = (info->forw != 0);
12858c2ecf20Sopenharmony_ci		memcpy(&state->altpath, &state->path, sizeof(state->path));
12868c2ecf20Sopenharmony_ci		error = xfs_da3_path_shift(state, &state->altpath, forward,
12878c2ecf20Sopenharmony_ci						 0, &retval);
12888c2ecf20Sopenharmony_ci		if (error)
12898c2ecf20Sopenharmony_ci			return error;
12908c2ecf20Sopenharmony_ci		if (retval) {
12918c2ecf20Sopenharmony_ci			*action = 0;
12928c2ecf20Sopenharmony_ci		} else {
12938c2ecf20Sopenharmony_ci			*action = 2;
12948c2ecf20Sopenharmony_ci		}
12958c2ecf20Sopenharmony_ci		return 0;
12968c2ecf20Sopenharmony_ci	}
12978c2ecf20Sopenharmony_ci
12988c2ecf20Sopenharmony_ci	/*
12998c2ecf20Sopenharmony_ci	 * Examine each sibling block to see if we can coalesce with
13008c2ecf20Sopenharmony_ci	 * at least 25% free space to spare.  We need to figure out
13018c2ecf20Sopenharmony_ci	 * whether to merge with the forward or the backward block.
13028c2ecf20Sopenharmony_ci	 * We prefer coalescing with the lower numbered sibling so as
13038c2ecf20Sopenharmony_ci	 * to shrink a directory over time.
13048c2ecf20Sopenharmony_ci	 */
13058c2ecf20Sopenharmony_ci	count  = state->args->geo->node_ents;
13068c2ecf20Sopenharmony_ci	count -= state->args->geo->node_ents >> 2;
13078c2ecf20Sopenharmony_ci	count -= nodehdr.count;
13088c2ecf20Sopenharmony_ci
13098c2ecf20Sopenharmony_ci	/* start with smaller blk num */
13108c2ecf20Sopenharmony_ci	forward = nodehdr.forw < nodehdr.back;
13118c2ecf20Sopenharmony_ci	for (i = 0; i < 2; forward = !forward, i++) {
13128c2ecf20Sopenharmony_ci		struct xfs_da3_icnode_hdr thdr;
13138c2ecf20Sopenharmony_ci		if (forward)
13148c2ecf20Sopenharmony_ci			blkno = nodehdr.forw;
13158c2ecf20Sopenharmony_ci		else
13168c2ecf20Sopenharmony_ci			blkno = nodehdr.back;
13178c2ecf20Sopenharmony_ci		if (blkno == 0)
13188c2ecf20Sopenharmony_ci			continue;
13198c2ecf20Sopenharmony_ci		error = xfs_da3_node_read(state->args->trans, dp, blkno, &bp,
13208c2ecf20Sopenharmony_ci				state->args->whichfork);
13218c2ecf20Sopenharmony_ci		if (error)
13228c2ecf20Sopenharmony_ci			return error;
13238c2ecf20Sopenharmony_ci
13248c2ecf20Sopenharmony_ci		node = bp->b_addr;
13258c2ecf20Sopenharmony_ci		xfs_da3_node_hdr_from_disk(dp->i_mount, &thdr, node);
13268c2ecf20Sopenharmony_ci		xfs_trans_brelse(state->args->trans, bp);
13278c2ecf20Sopenharmony_ci
13288c2ecf20Sopenharmony_ci		if (count - thdr.count >= 0)
13298c2ecf20Sopenharmony_ci			break;	/* fits with at least 25% to spare */
13308c2ecf20Sopenharmony_ci	}
13318c2ecf20Sopenharmony_ci	if (i >= 2) {
13328c2ecf20Sopenharmony_ci		*action = 0;
13338c2ecf20Sopenharmony_ci		return 0;
13348c2ecf20Sopenharmony_ci	}
13358c2ecf20Sopenharmony_ci
13368c2ecf20Sopenharmony_ci	/*
13378c2ecf20Sopenharmony_ci	 * Make altpath point to the block we want to keep (the lower
13388c2ecf20Sopenharmony_ci	 * numbered block) and path point to the block we want to drop.
13398c2ecf20Sopenharmony_ci	 */
13408c2ecf20Sopenharmony_ci	memcpy(&state->altpath, &state->path, sizeof(state->path));
13418c2ecf20Sopenharmony_ci	if (blkno < blk->blkno) {
13428c2ecf20Sopenharmony_ci		error = xfs_da3_path_shift(state, &state->altpath, forward,
13438c2ecf20Sopenharmony_ci						 0, &retval);
13448c2ecf20Sopenharmony_ci	} else {
13458c2ecf20Sopenharmony_ci		error = xfs_da3_path_shift(state, &state->path, forward,
13468c2ecf20Sopenharmony_ci						 0, &retval);
13478c2ecf20Sopenharmony_ci	}
13488c2ecf20Sopenharmony_ci	if (error)
13498c2ecf20Sopenharmony_ci		return error;
13508c2ecf20Sopenharmony_ci	if (retval) {
13518c2ecf20Sopenharmony_ci		*action = 0;
13528c2ecf20Sopenharmony_ci		return 0;
13538c2ecf20Sopenharmony_ci	}
13548c2ecf20Sopenharmony_ci	*action = 1;
13558c2ecf20Sopenharmony_ci	return 0;
13568c2ecf20Sopenharmony_ci}
13578c2ecf20Sopenharmony_ci
13588c2ecf20Sopenharmony_ci/*
13598c2ecf20Sopenharmony_ci * Pick up the last hashvalue from an intermediate node.
13608c2ecf20Sopenharmony_ci */
13618c2ecf20Sopenharmony_ciSTATIC uint
13628c2ecf20Sopenharmony_cixfs_da3_node_lasthash(
13638c2ecf20Sopenharmony_ci	struct xfs_inode	*dp,
13648c2ecf20Sopenharmony_ci	struct xfs_buf		*bp,
13658c2ecf20Sopenharmony_ci	int			*count)
13668c2ecf20Sopenharmony_ci{
13678c2ecf20Sopenharmony_ci	struct xfs_da3_icnode_hdr nodehdr;
13688c2ecf20Sopenharmony_ci
13698c2ecf20Sopenharmony_ci	xfs_da3_node_hdr_from_disk(dp->i_mount, &nodehdr, bp->b_addr);
13708c2ecf20Sopenharmony_ci	if (count)
13718c2ecf20Sopenharmony_ci		*count = nodehdr.count;
13728c2ecf20Sopenharmony_ci	if (!nodehdr.count)
13738c2ecf20Sopenharmony_ci		return 0;
13748c2ecf20Sopenharmony_ci	return be32_to_cpu(nodehdr.btree[nodehdr.count - 1].hashval);
13758c2ecf20Sopenharmony_ci}
13768c2ecf20Sopenharmony_ci
13778c2ecf20Sopenharmony_ci/*
13788c2ecf20Sopenharmony_ci * Walk back up the tree adjusting hash values as necessary,
13798c2ecf20Sopenharmony_ci * when we stop making changes, return.
13808c2ecf20Sopenharmony_ci */
13818c2ecf20Sopenharmony_civoid
13828c2ecf20Sopenharmony_cixfs_da3_fixhashpath(
13838c2ecf20Sopenharmony_ci	struct xfs_da_state	*state,
13848c2ecf20Sopenharmony_ci	struct xfs_da_state_path *path)
13858c2ecf20Sopenharmony_ci{
13868c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*blk;
13878c2ecf20Sopenharmony_ci	struct xfs_da_intnode	*node;
13888c2ecf20Sopenharmony_ci	struct xfs_da_node_entry *btree;
13898c2ecf20Sopenharmony_ci	xfs_dahash_t		lasthash=0;
13908c2ecf20Sopenharmony_ci	int			level;
13918c2ecf20Sopenharmony_ci	int			count;
13928c2ecf20Sopenharmony_ci	struct xfs_inode	*dp = state->args->dp;
13938c2ecf20Sopenharmony_ci
13948c2ecf20Sopenharmony_ci	trace_xfs_da_fixhashpath(state->args);
13958c2ecf20Sopenharmony_ci
13968c2ecf20Sopenharmony_ci	level = path->active-1;
13978c2ecf20Sopenharmony_ci	blk = &path->blk[ level ];
13988c2ecf20Sopenharmony_ci	switch (blk->magic) {
13998c2ecf20Sopenharmony_ci	case XFS_ATTR_LEAF_MAGIC:
14008c2ecf20Sopenharmony_ci		lasthash = xfs_attr_leaf_lasthash(blk->bp, &count);
14018c2ecf20Sopenharmony_ci		if (count == 0)
14028c2ecf20Sopenharmony_ci			return;
14038c2ecf20Sopenharmony_ci		break;
14048c2ecf20Sopenharmony_ci	case XFS_DIR2_LEAFN_MAGIC:
14058c2ecf20Sopenharmony_ci		lasthash = xfs_dir2_leaf_lasthash(dp, blk->bp, &count);
14068c2ecf20Sopenharmony_ci		if (count == 0)
14078c2ecf20Sopenharmony_ci			return;
14088c2ecf20Sopenharmony_ci		break;
14098c2ecf20Sopenharmony_ci	case XFS_DA_NODE_MAGIC:
14108c2ecf20Sopenharmony_ci		lasthash = xfs_da3_node_lasthash(dp, blk->bp, &count);
14118c2ecf20Sopenharmony_ci		if (count == 0)
14128c2ecf20Sopenharmony_ci			return;
14138c2ecf20Sopenharmony_ci		break;
14148c2ecf20Sopenharmony_ci	}
14158c2ecf20Sopenharmony_ci	for (blk--, level--; level >= 0; blk--, level--) {
14168c2ecf20Sopenharmony_ci		struct xfs_da3_icnode_hdr nodehdr;
14178c2ecf20Sopenharmony_ci
14188c2ecf20Sopenharmony_ci		node = blk->bp->b_addr;
14198c2ecf20Sopenharmony_ci		xfs_da3_node_hdr_from_disk(dp->i_mount, &nodehdr, node);
14208c2ecf20Sopenharmony_ci		btree = nodehdr.btree;
14218c2ecf20Sopenharmony_ci		if (be32_to_cpu(btree[blk->index].hashval) == lasthash)
14228c2ecf20Sopenharmony_ci			break;
14238c2ecf20Sopenharmony_ci		blk->hashval = lasthash;
14248c2ecf20Sopenharmony_ci		btree[blk->index].hashval = cpu_to_be32(lasthash);
14258c2ecf20Sopenharmony_ci		xfs_trans_log_buf(state->args->trans, blk->bp,
14268c2ecf20Sopenharmony_ci				  XFS_DA_LOGRANGE(node, &btree[blk->index],
14278c2ecf20Sopenharmony_ci						  sizeof(*btree)));
14288c2ecf20Sopenharmony_ci
14298c2ecf20Sopenharmony_ci		lasthash = be32_to_cpu(btree[nodehdr.count - 1].hashval);
14308c2ecf20Sopenharmony_ci	}
14318c2ecf20Sopenharmony_ci}
14328c2ecf20Sopenharmony_ci
14338c2ecf20Sopenharmony_ci/*
14348c2ecf20Sopenharmony_ci * Remove an entry from an intermediate node.
14358c2ecf20Sopenharmony_ci */
14368c2ecf20Sopenharmony_ciSTATIC void
14378c2ecf20Sopenharmony_cixfs_da3_node_remove(
14388c2ecf20Sopenharmony_ci	struct xfs_da_state	*state,
14398c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*drop_blk)
14408c2ecf20Sopenharmony_ci{
14418c2ecf20Sopenharmony_ci	struct xfs_da_intnode	*node;
14428c2ecf20Sopenharmony_ci	struct xfs_da3_icnode_hdr nodehdr;
14438c2ecf20Sopenharmony_ci	struct xfs_da_node_entry *btree;
14448c2ecf20Sopenharmony_ci	int			index;
14458c2ecf20Sopenharmony_ci	int			tmp;
14468c2ecf20Sopenharmony_ci	struct xfs_inode	*dp = state->args->dp;
14478c2ecf20Sopenharmony_ci
14488c2ecf20Sopenharmony_ci	trace_xfs_da_node_remove(state->args);
14498c2ecf20Sopenharmony_ci
14508c2ecf20Sopenharmony_ci	node = drop_blk->bp->b_addr;
14518c2ecf20Sopenharmony_ci	xfs_da3_node_hdr_from_disk(dp->i_mount, &nodehdr, node);
14528c2ecf20Sopenharmony_ci	ASSERT(drop_blk->index < nodehdr.count);
14538c2ecf20Sopenharmony_ci	ASSERT(drop_blk->index >= 0);
14548c2ecf20Sopenharmony_ci
14558c2ecf20Sopenharmony_ci	/*
14568c2ecf20Sopenharmony_ci	 * Copy over the offending entry, or just zero it out.
14578c2ecf20Sopenharmony_ci	 */
14588c2ecf20Sopenharmony_ci	index = drop_blk->index;
14598c2ecf20Sopenharmony_ci	btree = nodehdr.btree;
14608c2ecf20Sopenharmony_ci	if (index < nodehdr.count - 1) {
14618c2ecf20Sopenharmony_ci		tmp  = nodehdr.count - index - 1;
14628c2ecf20Sopenharmony_ci		tmp *= (uint)sizeof(xfs_da_node_entry_t);
14638c2ecf20Sopenharmony_ci		memmove(&btree[index], &btree[index + 1], tmp);
14648c2ecf20Sopenharmony_ci		xfs_trans_log_buf(state->args->trans, drop_blk->bp,
14658c2ecf20Sopenharmony_ci		    XFS_DA_LOGRANGE(node, &btree[index], tmp));
14668c2ecf20Sopenharmony_ci		index = nodehdr.count - 1;
14678c2ecf20Sopenharmony_ci	}
14688c2ecf20Sopenharmony_ci	memset(&btree[index], 0, sizeof(xfs_da_node_entry_t));
14698c2ecf20Sopenharmony_ci	xfs_trans_log_buf(state->args->trans, drop_blk->bp,
14708c2ecf20Sopenharmony_ci	    XFS_DA_LOGRANGE(node, &btree[index], sizeof(btree[index])));
14718c2ecf20Sopenharmony_ci	nodehdr.count -= 1;
14728c2ecf20Sopenharmony_ci	xfs_da3_node_hdr_to_disk(dp->i_mount, node, &nodehdr);
14738c2ecf20Sopenharmony_ci	xfs_trans_log_buf(state->args->trans, drop_blk->bp,
14748c2ecf20Sopenharmony_ci	    XFS_DA_LOGRANGE(node, &node->hdr, state->args->geo->node_hdr_size));
14758c2ecf20Sopenharmony_ci
14768c2ecf20Sopenharmony_ci	/*
14778c2ecf20Sopenharmony_ci	 * Copy the last hash value from the block to propagate upwards.
14788c2ecf20Sopenharmony_ci	 */
14798c2ecf20Sopenharmony_ci	drop_blk->hashval = be32_to_cpu(btree[index - 1].hashval);
14808c2ecf20Sopenharmony_ci}
14818c2ecf20Sopenharmony_ci
14828c2ecf20Sopenharmony_ci/*
14838c2ecf20Sopenharmony_ci * Unbalance the elements between two intermediate nodes,
14848c2ecf20Sopenharmony_ci * move all Btree elements from one node into another.
14858c2ecf20Sopenharmony_ci */
14868c2ecf20Sopenharmony_ciSTATIC void
14878c2ecf20Sopenharmony_cixfs_da3_node_unbalance(
14888c2ecf20Sopenharmony_ci	struct xfs_da_state	*state,
14898c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*drop_blk,
14908c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*save_blk)
14918c2ecf20Sopenharmony_ci{
14928c2ecf20Sopenharmony_ci	struct xfs_da_intnode	*drop_node;
14938c2ecf20Sopenharmony_ci	struct xfs_da_intnode	*save_node;
14948c2ecf20Sopenharmony_ci	struct xfs_da_node_entry *drop_btree;
14958c2ecf20Sopenharmony_ci	struct xfs_da_node_entry *save_btree;
14968c2ecf20Sopenharmony_ci	struct xfs_da3_icnode_hdr drop_hdr;
14978c2ecf20Sopenharmony_ci	struct xfs_da3_icnode_hdr save_hdr;
14988c2ecf20Sopenharmony_ci	struct xfs_trans	*tp;
14998c2ecf20Sopenharmony_ci	int			sindex;
15008c2ecf20Sopenharmony_ci	int			tmp;
15018c2ecf20Sopenharmony_ci	struct xfs_inode	*dp = state->args->dp;
15028c2ecf20Sopenharmony_ci
15038c2ecf20Sopenharmony_ci	trace_xfs_da_node_unbalance(state->args);
15048c2ecf20Sopenharmony_ci
15058c2ecf20Sopenharmony_ci	drop_node = drop_blk->bp->b_addr;
15068c2ecf20Sopenharmony_ci	save_node = save_blk->bp->b_addr;
15078c2ecf20Sopenharmony_ci	xfs_da3_node_hdr_from_disk(dp->i_mount, &drop_hdr, drop_node);
15088c2ecf20Sopenharmony_ci	xfs_da3_node_hdr_from_disk(dp->i_mount, &save_hdr, save_node);
15098c2ecf20Sopenharmony_ci	drop_btree = drop_hdr.btree;
15108c2ecf20Sopenharmony_ci	save_btree = save_hdr.btree;
15118c2ecf20Sopenharmony_ci	tp = state->args->trans;
15128c2ecf20Sopenharmony_ci
15138c2ecf20Sopenharmony_ci	/*
15148c2ecf20Sopenharmony_ci	 * If the dying block has lower hashvals, then move all the
15158c2ecf20Sopenharmony_ci	 * elements in the remaining block up to make a hole.
15168c2ecf20Sopenharmony_ci	 */
15178c2ecf20Sopenharmony_ci	if ((be32_to_cpu(drop_btree[0].hashval) <
15188c2ecf20Sopenharmony_ci			be32_to_cpu(save_btree[0].hashval)) ||
15198c2ecf20Sopenharmony_ci	    (be32_to_cpu(drop_btree[drop_hdr.count - 1].hashval) <
15208c2ecf20Sopenharmony_ci			be32_to_cpu(save_btree[save_hdr.count - 1].hashval))) {
15218c2ecf20Sopenharmony_ci		/* XXX: check this - is memmove dst correct? */
15228c2ecf20Sopenharmony_ci		tmp = save_hdr.count * sizeof(xfs_da_node_entry_t);
15238c2ecf20Sopenharmony_ci		memmove(&save_btree[drop_hdr.count], &save_btree[0], tmp);
15248c2ecf20Sopenharmony_ci
15258c2ecf20Sopenharmony_ci		sindex = 0;
15268c2ecf20Sopenharmony_ci		xfs_trans_log_buf(tp, save_blk->bp,
15278c2ecf20Sopenharmony_ci			XFS_DA_LOGRANGE(save_node, &save_btree[0],
15288c2ecf20Sopenharmony_ci				(save_hdr.count + drop_hdr.count) *
15298c2ecf20Sopenharmony_ci						sizeof(xfs_da_node_entry_t)));
15308c2ecf20Sopenharmony_ci	} else {
15318c2ecf20Sopenharmony_ci		sindex = save_hdr.count;
15328c2ecf20Sopenharmony_ci		xfs_trans_log_buf(tp, save_blk->bp,
15338c2ecf20Sopenharmony_ci			XFS_DA_LOGRANGE(save_node, &save_btree[sindex],
15348c2ecf20Sopenharmony_ci				drop_hdr.count * sizeof(xfs_da_node_entry_t)));
15358c2ecf20Sopenharmony_ci	}
15368c2ecf20Sopenharmony_ci
15378c2ecf20Sopenharmony_ci	/*
15388c2ecf20Sopenharmony_ci	 * Move all the B-tree elements from drop_blk to save_blk.
15398c2ecf20Sopenharmony_ci	 */
15408c2ecf20Sopenharmony_ci	tmp = drop_hdr.count * (uint)sizeof(xfs_da_node_entry_t);
15418c2ecf20Sopenharmony_ci	memcpy(&save_btree[sindex], &drop_btree[0], tmp);
15428c2ecf20Sopenharmony_ci	save_hdr.count += drop_hdr.count;
15438c2ecf20Sopenharmony_ci
15448c2ecf20Sopenharmony_ci	xfs_da3_node_hdr_to_disk(dp->i_mount, save_node, &save_hdr);
15458c2ecf20Sopenharmony_ci	xfs_trans_log_buf(tp, save_blk->bp,
15468c2ecf20Sopenharmony_ci		XFS_DA_LOGRANGE(save_node, &save_node->hdr,
15478c2ecf20Sopenharmony_ci				state->args->geo->node_hdr_size));
15488c2ecf20Sopenharmony_ci
15498c2ecf20Sopenharmony_ci	/*
15508c2ecf20Sopenharmony_ci	 * Save the last hashval in the remaining block for upward propagation.
15518c2ecf20Sopenharmony_ci	 */
15528c2ecf20Sopenharmony_ci	save_blk->hashval = be32_to_cpu(save_btree[save_hdr.count - 1].hashval);
15538c2ecf20Sopenharmony_ci}
15548c2ecf20Sopenharmony_ci
15558c2ecf20Sopenharmony_ci/*========================================================================
15568c2ecf20Sopenharmony_ci * Routines used for finding things in the Btree.
15578c2ecf20Sopenharmony_ci *========================================================================*/
15588c2ecf20Sopenharmony_ci
15598c2ecf20Sopenharmony_ci/*
15608c2ecf20Sopenharmony_ci * Walk down the Btree looking for a particular filename, filling
15618c2ecf20Sopenharmony_ci * in the state structure as we go.
15628c2ecf20Sopenharmony_ci *
15638c2ecf20Sopenharmony_ci * We will set the state structure to point to each of the elements
15648c2ecf20Sopenharmony_ci * in each of the nodes where either the hashval is or should be.
15658c2ecf20Sopenharmony_ci *
15668c2ecf20Sopenharmony_ci * We support duplicate hashval's so for each entry in the current
15678c2ecf20Sopenharmony_ci * node that could contain the desired hashval, descend.  This is a
15688c2ecf20Sopenharmony_ci * pruned depth-first tree search.
15698c2ecf20Sopenharmony_ci */
15708c2ecf20Sopenharmony_ciint							/* error */
15718c2ecf20Sopenharmony_cixfs_da3_node_lookup_int(
15728c2ecf20Sopenharmony_ci	struct xfs_da_state	*state,
15738c2ecf20Sopenharmony_ci	int			*result)
15748c2ecf20Sopenharmony_ci{
15758c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*blk;
15768c2ecf20Sopenharmony_ci	struct xfs_da_blkinfo	*curr;
15778c2ecf20Sopenharmony_ci	struct xfs_da_intnode	*node;
15788c2ecf20Sopenharmony_ci	struct xfs_da_node_entry *btree;
15798c2ecf20Sopenharmony_ci	struct xfs_da3_icnode_hdr nodehdr;
15808c2ecf20Sopenharmony_ci	struct xfs_da_args	*args;
15818c2ecf20Sopenharmony_ci	xfs_dablk_t		blkno;
15828c2ecf20Sopenharmony_ci	xfs_dahash_t		hashval;
15838c2ecf20Sopenharmony_ci	xfs_dahash_t		btreehashval;
15848c2ecf20Sopenharmony_ci	int			probe;
15858c2ecf20Sopenharmony_ci	int			span;
15868c2ecf20Sopenharmony_ci	int			max;
15878c2ecf20Sopenharmony_ci	int			error;
15888c2ecf20Sopenharmony_ci	int			retval;
15898c2ecf20Sopenharmony_ci	unsigned int		expected_level = 0;
15908c2ecf20Sopenharmony_ci	uint16_t		magic;
15918c2ecf20Sopenharmony_ci	struct xfs_inode	*dp = state->args->dp;
15928c2ecf20Sopenharmony_ci
15938c2ecf20Sopenharmony_ci	args = state->args;
15948c2ecf20Sopenharmony_ci
15958c2ecf20Sopenharmony_ci	/*
15968c2ecf20Sopenharmony_ci	 * Descend thru the B-tree searching each level for the right
15978c2ecf20Sopenharmony_ci	 * node to use, until the right hashval is found.
15988c2ecf20Sopenharmony_ci	 */
15998c2ecf20Sopenharmony_ci	blkno = args->geo->leafblk;
16008c2ecf20Sopenharmony_ci	for (blk = &state->path.blk[0], state->path.active = 1;
16018c2ecf20Sopenharmony_ci			 state->path.active <= XFS_DA_NODE_MAXDEPTH;
16028c2ecf20Sopenharmony_ci			 blk++, state->path.active++) {
16038c2ecf20Sopenharmony_ci		/*
16048c2ecf20Sopenharmony_ci		 * Read the next node down in the tree.
16058c2ecf20Sopenharmony_ci		 */
16068c2ecf20Sopenharmony_ci		blk->blkno = blkno;
16078c2ecf20Sopenharmony_ci		error = xfs_da3_node_read(args->trans, args->dp, blkno,
16088c2ecf20Sopenharmony_ci					&blk->bp, args->whichfork);
16098c2ecf20Sopenharmony_ci		if (error) {
16108c2ecf20Sopenharmony_ci			blk->blkno = 0;
16118c2ecf20Sopenharmony_ci			state->path.active--;
16128c2ecf20Sopenharmony_ci			return error;
16138c2ecf20Sopenharmony_ci		}
16148c2ecf20Sopenharmony_ci		curr = blk->bp->b_addr;
16158c2ecf20Sopenharmony_ci		magic = be16_to_cpu(curr->magic);
16168c2ecf20Sopenharmony_ci
16178c2ecf20Sopenharmony_ci		if (magic == XFS_ATTR_LEAF_MAGIC ||
16188c2ecf20Sopenharmony_ci		    magic == XFS_ATTR3_LEAF_MAGIC) {
16198c2ecf20Sopenharmony_ci			blk->magic = XFS_ATTR_LEAF_MAGIC;
16208c2ecf20Sopenharmony_ci			blk->hashval = xfs_attr_leaf_lasthash(blk->bp, NULL);
16218c2ecf20Sopenharmony_ci			break;
16228c2ecf20Sopenharmony_ci		}
16238c2ecf20Sopenharmony_ci
16248c2ecf20Sopenharmony_ci		if (magic == XFS_DIR2_LEAFN_MAGIC ||
16258c2ecf20Sopenharmony_ci		    magic == XFS_DIR3_LEAFN_MAGIC) {
16268c2ecf20Sopenharmony_ci			blk->magic = XFS_DIR2_LEAFN_MAGIC;
16278c2ecf20Sopenharmony_ci			blk->hashval = xfs_dir2_leaf_lasthash(args->dp,
16288c2ecf20Sopenharmony_ci							      blk->bp, NULL);
16298c2ecf20Sopenharmony_ci			break;
16308c2ecf20Sopenharmony_ci		}
16318c2ecf20Sopenharmony_ci
16328c2ecf20Sopenharmony_ci		if (magic != XFS_DA_NODE_MAGIC && magic != XFS_DA3_NODE_MAGIC) {
16338c2ecf20Sopenharmony_ci			xfs_buf_mark_corrupt(blk->bp);
16348c2ecf20Sopenharmony_ci			return -EFSCORRUPTED;
16358c2ecf20Sopenharmony_ci		}
16368c2ecf20Sopenharmony_ci
16378c2ecf20Sopenharmony_ci		blk->magic = XFS_DA_NODE_MAGIC;
16388c2ecf20Sopenharmony_ci
16398c2ecf20Sopenharmony_ci		/*
16408c2ecf20Sopenharmony_ci		 * Search an intermediate node for a match.
16418c2ecf20Sopenharmony_ci		 */
16428c2ecf20Sopenharmony_ci		node = blk->bp->b_addr;
16438c2ecf20Sopenharmony_ci		xfs_da3_node_hdr_from_disk(dp->i_mount, &nodehdr, node);
16448c2ecf20Sopenharmony_ci		btree = nodehdr.btree;
16458c2ecf20Sopenharmony_ci
16468c2ecf20Sopenharmony_ci		/* Tree taller than we can handle; bail out! */
16478c2ecf20Sopenharmony_ci		if (nodehdr.level >= XFS_DA_NODE_MAXDEPTH) {
16488c2ecf20Sopenharmony_ci			xfs_buf_mark_corrupt(blk->bp);
16498c2ecf20Sopenharmony_ci			return -EFSCORRUPTED;
16508c2ecf20Sopenharmony_ci		}
16518c2ecf20Sopenharmony_ci
16528c2ecf20Sopenharmony_ci		/* Check the level from the root. */
16538c2ecf20Sopenharmony_ci		if (blkno == args->geo->leafblk)
16548c2ecf20Sopenharmony_ci			expected_level = nodehdr.level - 1;
16558c2ecf20Sopenharmony_ci		else if (expected_level != nodehdr.level) {
16568c2ecf20Sopenharmony_ci			xfs_buf_mark_corrupt(blk->bp);
16578c2ecf20Sopenharmony_ci			return -EFSCORRUPTED;
16588c2ecf20Sopenharmony_ci		} else
16598c2ecf20Sopenharmony_ci			expected_level--;
16608c2ecf20Sopenharmony_ci
16618c2ecf20Sopenharmony_ci		max = nodehdr.count;
16628c2ecf20Sopenharmony_ci		blk->hashval = be32_to_cpu(btree[max - 1].hashval);
16638c2ecf20Sopenharmony_ci
16648c2ecf20Sopenharmony_ci		/*
16658c2ecf20Sopenharmony_ci		 * Binary search.  (note: small blocks will skip loop)
16668c2ecf20Sopenharmony_ci		 */
16678c2ecf20Sopenharmony_ci		probe = span = max / 2;
16688c2ecf20Sopenharmony_ci		hashval = args->hashval;
16698c2ecf20Sopenharmony_ci		while (span > 4) {
16708c2ecf20Sopenharmony_ci			span /= 2;
16718c2ecf20Sopenharmony_ci			btreehashval = be32_to_cpu(btree[probe].hashval);
16728c2ecf20Sopenharmony_ci			if (btreehashval < hashval)
16738c2ecf20Sopenharmony_ci				probe += span;
16748c2ecf20Sopenharmony_ci			else if (btreehashval > hashval)
16758c2ecf20Sopenharmony_ci				probe -= span;
16768c2ecf20Sopenharmony_ci			else
16778c2ecf20Sopenharmony_ci				break;
16788c2ecf20Sopenharmony_ci		}
16798c2ecf20Sopenharmony_ci		ASSERT((probe >= 0) && (probe < max));
16808c2ecf20Sopenharmony_ci		ASSERT((span <= 4) ||
16818c2ecf20Sopenharmony_ci			(be32_to_cpu(btree[probe].hashval) == hashval));
16828c2ecf20Sopenharmony_ci
16838c2ecf20Sopenharmony_ci		/*
16848c2ecf20Sopenharmony_ci		 * Since we may have duplicate hashval's, find the first
16858c2ecf20Sopenharmony_ci		 * matching hashval in the node.
16868c2ecf20Sopenharmony_ci		 */
16878c2ecf20Sopenharmony_ci		while (probe > 0 &&
16888c2ecf20Sopenharmony_ci		       be32_to_cpu(btree[probe].hashval) >= hashval) {
16898c2ecf20Sopenharmony_ci			probe--;
16908c2ecf20Sopenharmony_ci		}
16918c2ecf20Sopenharmony_ci		while (probe < max &&
16928c2ecf20Sopenharmony_ci		       be32_to_cpu(btree[probe].hashval) < hashval) {
16938c2ecf20Sopenharmony_ci			probe++;
16948c2ecf20Sopenharmony_ci		}
16958c2ecf20Sopenharmony_ci
16968c2ecf20Sopenharmony_ci		/*
16978c2ecf20Sopenharmony_ci		 * Pick the right block to descend on.
16988c2ecf20Sopenharmony_ci		 */
16998c2ecf20Sopenharmony_ci		if (probe == max) {
17008c2ecf20Sopenharmony_ci			blk->index = max - 1;
17018c2ecf20Sopenharmony_ci			blkno = be32_to_cpu(btree[max - 1].before);
17028c2ecf20Sopenharmony_ci		} else {
17038c2ecf20Sopenharmony_ci			blk->index = probe;
17048c2ecf20Sopenharmony_ci			blkno = be32_to_cpu(btree[probe].before);
17058c2ecf20Sopenharmony_ci		}
17068c2ecf20Sopenharmony_ci
17078c2ecf20Sopenharmony_ci		/* We can't point back to the root. */
17088c2ecf20Sopenharmony_ci		if (XFS_IS_CORRUPT(dp->i_mount, blkno == args->geo->leafblk))
17098c2ecf20Sopenharmony_ci			return -EFSCORRUPTED;
17108c2ecf20Sopenharmony_ci	}
17118c2ecf20Sopenharmony_ci
17128c2ecf20Sopenharmony_ci	if (XFS_IS_CORRUPT(dp->i_mount, expected_level != 0))
17138c2ecf20Sopenharmony_ci		return -EFSCORRUPTED;
17148c2ecf20Sopenharmony_ci
17158c2ecf20Sopenharmony_ci	/*
17168c2ecf20Sopenharmony_ci	 * A leaf block that ends in the hashval that we are interested in
17178c2ecf20Sopenharmony_ci	 * (final hashval == search hashval) means that the next block may
17188c2ecf20Sopenharmony_ci	 * contain more entries with the same hashval, shift upward to the
17198c2ecf20Sopenharmony_ci	 * next leaf and keep searching.
17208c2ecf20Sopenharmony_ci	 */
17218c2ecf20Sopenharmony_ci	for (;;) {
17228c2ecf20Sopenharmony_ci		if (blk->magic == XFS_DIR2_LEAFN_MAGIC) {
17238c2ecf20Sopenharmony_ci			retval = xfs_dir2_leafn_lookup_int(blk->bp, args,
17248c2ecf20Sopenharmony_ci							&blk->index, state);
17258c2ecf20Sopenharmony_ci		} else if (blk->magic == XFS_ATTR_LEAF_MAGIC) {
17268c2ecf20Sopenharmony_ci			retval = xfs_attr3_leaf_lookup_int(blk->bp, args);
17278c2ecf20Sopenharmony_ci			blk->index = args->index;
17288c2ecf20Sopenharmony_ci			args->blkno = blk->blkno;
17298c2ecf20Sopenharmony_ci		} else {
17308c2ecf20Sopenharmony_ci			ASSERT(0);
17318c2ecf20Sopenharmony_ci			return -EFSCORRUPTED;
17328c2ecf20Sopenharmony_ci		}
17338c2ecf20Sopenharmony_ci		if (((retval == -ENOENT) || (retval == -ENOATTR)) &&
17348c2ecf20Sopenharmony_ci		    (blk->hashval == args->hashval)) {
17358c2ecf20Sopenharmony_ci			error = xfs_da3_path_shift(state, &state->path, 1, 1,
17368c2ecf20Sopenharmony_ci							 &retval);
17378c2ecf20Sopenharmony_ci			if (error)
17388c2ecf20Sopenharmony_ci				return error;
17398c2ecf20Sopenharmony_ci			if (retval == 0) {
17408c2ecf20Sopenharmony_ci				continue;
17418c2ecf20Sopenharmony_ci			} else if (blk->magic == XFS_ATTR_LEAF_MAGIC) {
17428c2ecf20Sopenharmony_ci				/* path_shift() gives ENOENT */
17438c2ecf20Sopenharmony_ci				retval = -ENOATTR;
17448c2ecf20Sopenharmony_ci			}
17458c2ecf20Sopenharmony_ci		}
17468c2ecf20Sopenharmony_ci		break;
17478c2ecf20Sopenharmony_ci	}
17488c2ecf20Sopenharmony_ci	*result = retval;
17498c2ecf20Sopenharmony_ci	return 0;
17508c2ecf20Sopenharmony_ci}
17518c2ecf20Sopenharmony_ci
17528c2ecf20Sopenharmony_ci/*========================================================================
17538c2ecf20Sopenharmony_ci * Utility routines.
17548c2ecf20Sopenharmony_ci *========================================================================*/
17558c2ecf20Sopenharmony_ci
17568c2ecf20Sopenharmony_ci/*
17578c2ecf20Sopenharmony_ci * Compare two intermediate nodes for "order".
17588c2ecf20Sopenharmony_ci */
17598c2ecf20Sopenharmony_ciSTATIC int
17608c2ecf20Sopenharmony_cixfs_da3_node_order(
17618c2ecf20Sopenharmony_ci	struct xfs_inode *dp,
17628c2ecf20Sopenharmony_ci	struct xfs_buf	*node1_bp,
17638c2ecf20Sopenharmony_ci	struct xfs_buf	*node2_bp)
17648c2ecf20Sopenharmony_ci{
17658c2ecf20Sopenharmony_ci	struct xfs_da_intnode	*node1;
17668c2ecf20Sopenharmony_ci	struct xfs_da_intnode	*node2;
17678c2ecf20Sopenharmony_ci	struct xfs_da_node_entry *btree1;
17688c2ecf20Sopenharmony_ci	struct xfs_da_node_entry *btree2;
17698c2ecf20Sopenharmony_ci	struct xfs_da3_icnode_hdr node1hdr;
17708c2ecf20Sopenharmony_ci	struct xfs_da3_icnode_hdr node2hdr;
17718c2ecf20Sopenharmony_ci
17728c2ecf20Sopenharmony_ci	node1 = node1_bp->b_addr;
17738c2ecf20Sopenharmony_ci	node2 = node2_bp->b_addr;
17748c2ecf20Sopenharmony_ci	xfs_da3_node_hdr_from_disk(dp->i_mount, &node1hdr, node1);
17758c2ecf20Sopenharmony_ci	xfs_da3_node_hdr_from_disk(dp->i_mount, &node2hdr, node2);
17768c2ecf20Sopenharmony_ci	btree1 = node1hdr.btree;
17778c2ecf20Sopenharmony_ci	btree2 = node2hdr.btree;
17788c2ecf20Sopenharmony_ci
17798c2ecf20Sopenharmony_ci	if (node1hdr.count > 0 && node2hdr.count > 0 &&
17808c2ecf20Sopenharmony_ci	    ((be32_to_cpu(btree2[0].hashval) < be32_to_cpu(btree1[0].hashval)) ||
17818c2ecf20Sopenharmony_ci	     (be32_to_cpu(btree2[node2hdr.count - 1].hashval) <
17828c2ecf20Sopenharmony_ci	      be32_to_cpu(btree1[node1hdr.count - 1].hashval)))) {
17838c2ecf20Sopenharmony_ci		return 1;
17848c2ecf20Sopenharmony_ci	}
17858c2ecf20Sopenharmony_ci	return 0;
17868c2ecf20Sopenharmony_ci}
17878c2ecf20Sopenharmony_ci
17888c2ecf20Sopenharmony_ci/*
17898c2ecf20Sopenharmony_ci * Link a new block into a doubly linked list of blocks (of whatever type).
17908c2ecf20Sopenharmony_ci */
17918c2ecf20Sopenharmony_ciint							/* error */
17928c2ecf20Sopenharmony_cixfs_da3_blk_link(
17938c2ecf20Sopenharmony_ci	struct xfs_da_state	*state,
17948c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*old_blk,
17958c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*new_blk)
17968c2ecf20Sopenharmony_ci{
17978c2ecf20Sopenharmony_ci	struct xfs_da_blkinfo	*old_info;
17988c2ecf20Sopenharmony_ci	struct xfs_da_blkinfo	*new_info;
17998c2ecf20Sopenharmony_ci	struct xfs_da_blkinfo	*tmp_info;
18008c2ecf20Sopenharmony_ci	struct xfs_da_args	*args;
18018c2ecf20Sopenharmony_ci	struct xfs_buf		*bp;
18028c2ecf20Sopenharmony_ci	int			before = 0;
18038c2ecf20Sopenharmony_ci	int			error;
18048c2ecf20Sopenharmony_ci	struct xfs_inode	*dp = state->args->dp;
18058c2ecf20Sopenharmony_ci
18068c2ecf20Sopenharmony_ci	/*
18078c2ecf20Sopenharmony_ci	 * Set up environment.
18088c2ecf20Sopenharmony_ci	 */
18098c2ecf20Sopenharmony_ci	args = state->args;
18108c2ecf20Sopenharmony_ci	ASSERT(args != NULL);
18118c2ecf20Sopenharmony_ci	old_info = old_blk->bp->b_addr;
18128c2ecf20Sopenharmony_ci	new_info = new_blk->bp->b_addr;
18138c2ecf20Sopenharmony_ci	ASSERT(old_blk->magic == XFS_DA_NODE_MAGIC ||
18148c2ecf20Sopenharmony_ci	       old_blk->magic == XFS_DIR2_LEAFN_MAGIC ||
18158c2ecf20Sopenharmony_ci	       old_blk->magic == XFS_ATTR_LEAF_MAGIC);
18168c2ecf20Sopenharmony_ci
18178c2ecf20Sopenharmony_ci	switch (old_blk->magic) {
18188c2ecf20Sopenharmony_ci	case XFS_ATTR_LEAF_MAGIC:
18198c2ecf20Sopenharmony_ci		before = xfs_attr_leaf_order(old_blk->bp, new_blk->bp);
18208c2ecf20Sopenharmony_ci		break;
18218c2ecf20Sopenharmony_ci	case XFS_DIR2_LEAFN_MAGIC:
18228c2ecf20Sopenharmony_ci		before = xfs_dir2_leafn_order(dp, old_blk->bp, new_blk->bp);
18238c2ecf20Sopenharmony_ci		break;
18248c2ecf20Sopenharmony_ci	case XFS_DA_NODE_MAGIC:
18258c2ecf20Sopenharmony_ci		before = xfs_da3_node_order(dp, old_blk->bp, new_blk->bp);
18268c2ecf20Sopenharmony_ci		break;
18278c2ecf20Sopenharmony_ci	}
18288c2ecf20Sopenharmony_ci
18298c2ecf20Sopenharmony_ci	/*
18308c2ecf20Sopenharmony_ci	 * Link blocks in appropriate order.
18318c2ecf20Sopenharmony_ci	 */
18328c2ecf20Sopenharmony_ci	if (before) {
18338c2ecf20Sopenharmony_ci		/*
18348c2ecf20Sopenharmony_ci		 * Link new block in before existing block.
18358c2ecf20Sopenharmony_ci		 */
18368c2ecf20Sopenharmony_ci		trace_xfs_da_link_before(args);
18378c2ecf20Sopenharmony_ci		new_info->forw = cpu_to_be32(old_blk->blkno);
18388c2ecf20Sopenharmony_ci		new_info->back = old_info->back;
18398c2ecf20Sopenharmony_ci		if (old_info->back) {
18408c2ecf20Sopenharmony_ci			error = xfs_da3_node_read(args->trans, dp,
18418c2ecf20Sopenharmony_ci						be32_to_cpu(old_info->back),
18428c2ecf20Sopenharmony_ci						&bp, args->whichfork);
18438c2ecf20Sopenharmony_ci			if (error)
18448c2ecf20Sopenharmony_ci				return error;
18458c2ecf20Sopenharmony_ci			ASSERT(bp != NULL);
18468c2ecf20Sopenharmony_ci			tmp_info = bp->b_addr;
18478c2ecf20Sopenharmony_ci			ASSERT(tmp_info->magic == old_info->magic);
18488c2ecf20Sopenharmony_ci			ASSERT(be32_to_cpu(tmp_info->forw) == old_blk->blkno);
18498c2ecf20Sopenharmony_ci			tmp_info->forw = cpu_to_be32(new_blk->blkno);
18508c2ecf20Sopenharmony_ci			xfs_trans_log_buf(args->trans, bp, 0, sizeof(*tmp_info)-1);
18518c2ecf20Sopenharmony_ci		}
18528c2ecf20Sopenharmony_ci		old_info->back = cpu_to_be32(new_blk->blkno);
18538c2ecf20Sopenharmony_ci	} else {
18548c2ecf20Sopenharmony_ci		/*
18558c2ecf20Sopenharmony_ci		 * Link new block in after existing block.
18568c2ecf20Sopenharmony_ci		 */
18578c2ecf20Sopenharmony_ci		trace_xfs_da_link_after(args);
18588c2ecf20Sopenharmony_ci		new_info->forw = old_info->forw;
18598c2ecf20Sopenharmony_ci		new_info->back = cpu_to_be32(old_blk->blkno);
18608c2ecf20Sopenharmony_ci		if (old_info->forw) {
18618c2ecf20Sopenharmony_ci			error = xfs_da3_node_read(args->trans, dp,
18628c2ecf20Sopenharmony_ci						be32_to_cpu(old_info->forw),
18638c2ecf20Sopenharmony_ci						&bp, args->whichfork);
18648c2ecf20Sopenharmony_ci			if (error)
18658c2ecf20Sopenharmony_ci				return error;
18668c2ecf20Sopenharmony_ci			ASSERT(bp != NULL);
18678c2ecf20Sopenharmony_ci			tmp_info = bp->b_addr;
18688c2ecf20Sopenharmony_ci			ASSERT(tmp_info->magic == old_info->magic);
18698c2ecf20Sopenharmony_ci			ASSERT(be32_to_cpu(tmp_info->back) == old_blk->blkno);
18708c2ecf20Sopenharmony_ci			tmp_info->back = cpu_to_be32(new_blk->blkno);
18718c2ecf20Sopenharmony_ci			xfs_trans_log_buf(args->trans, bp, 0, sizeof(*tmp_info)-1);
18728c2ecf20Sopenharmony_ci		}
18738c2ecf20Sopenharmony_ci		old_info->forw = cpu_to_be32(new_blk->blkno);
18748c2ecf20Sopenharmony_ci	}
18758c2ecf20Sopenharmony_ci
18768c2ecf20Sopenharmony_ci	xfs_trans_log_buf(args->trans, old_blk->bp, 0, sizeof(*tmp_info) - 1);
18778c2ecf20Sopenharmony_ci	xfs_trans_log_buf(args->trans, new_blk->bp, 0, sizeof(*tmp_info) - 1);
18788c2ecf20Sopenharmony_ci	return 0;
18798c2ecf20Sopenharmony_ci}
18808c2ecf20Sopenharmony_ci
18818c2ecf20Sopenharmony_ci/*
18828c2ecf20Sopenharmony_ci * Unlink a block from a doubly linked list of blocks.
18838c2ecf20Sopenharmony_ci */
18848c2ecf20Sopenharmony_ciSTATIC int						/* error */
18858c2ecf20Sopenharmony_cixfs_da3_blk_unlink(
18868c2ecf20Sopenharmony_ci	struct xfs_da_state	*state,
18878c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*drop_blk,
18888c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*save_blk)
18898c2ecf20Sopenharmony_ci{
18908c2ecf20Sopenharmony_ci	struct xfs_da_blkinfo	*drop_info;
18918c2ecf20Sopenharmony_ci	struct xfs_da_blkinfo	*save_info;
18928c2ecf20Sopenharmony_ci	struct xfs_da_blkinfo	*tmp_info;
18938c2ecf20Sopenharmony_ci	struct xfs_da_args	*args;
18948c2ecf20Sopenharmony_ci	struct xfs_buf		*bp;
18958c2ecf20Sopenharmony_ci	int			error;
18968c2ecf20Sopenharmony_ci
18978c2ecf20Sopenharmony_ci	/*
18988c2ecf20Sopenharmony_ci	 * Set up environment.
18998c2ecf20Sopenharmony_ci	 */
19008c2ecf20Sopenharmony_ci	args = state->args;
19018c2ecf20Sopenharmony_ci	ASSERT(args != NULL);
19028c2ecf20Sopenharmony_ci	save_info = save_blk->bp->b_addr;
19038c2ecf20Sopenharmony_ci	drop_info = drop_blk->bp->b_addr;
19048c2ecf20Sopenharmony_ci	ASSERT(save_blk->magic == XFS_DA_NODE_MAGIC ||
19058c2ecf20Sopenharmony_ci	       save_blk->magic == XFS_DIR2_LEAFN_MAGIC ||
19068c2ecf20Sopenharmony_ci	       save_blk->magic == XFS_ATTR_LEAF_MAGIC);
19078c2ecf20Sopenharmony_ci	ASSERT(save_blk->magic == drop_blk->magic);
19088c2ecf20Sopenharmony_ci	ASSERT((be32_to_cpu(save_info->forw) == drop_blk->blkno) ||
19098c2ecf20Sopenharmony_ci	       (be32_to_cpu(save_info->back) == drop_blk->blkno));
19108c2ecf20Sopenharmony_ci	ASSERT((be32_to_cpu(drop_info->forw) == save_blk->blkno) ||
19118c2ecf20Sopenharmony_ci	       (be32_to_cpu(drop_info->back) == save_blk->blkno));
19128c2ecf20Sopenharmony_ci
19138c2ecf20Sopenharmony_ci	/*
19148c2ecf20Sopenharmony_ci	 * Unlink the leaf block from the doubly linked chain of leaves.
19158c2ecf20Sopenharmony_ci	 */
19168c2ecf20Sopenharmony_ci	if (be32_to_cpu(save_info->back) == drop_blk->blkno) {
19178c2ecf20Sopenharmony_ci		trace_xfs_da_unlink_back(args);
19188c2ecf20Sopenharmony_ci		save_info->back = drop_info->back;
19198c2ecf20Sopenharmony_ci		if (drop_info->back) {
19208c2ecf20Sopenharmony_ci			error = xfs_da3_node_read(args->trans, args->dp,
19218c2ecf20Sopenharmony_ci						be32_to_cpu(drop_info->back),
19228c2ecf20Sopenharmony_ci						&bp, args->whichfork);
19238c2ecf20Sopenharmony_ci			if (error)
19248c2ecf20Sopenharmony_ci				return error;
19258c2ecf20Sopenharmony_ci			ASSERT(bp != NULL);
19268c2ecf20Sopenharmony_ci			tmp_info = bp->b_addr;
19278c2ecf20Sopenharmony_ci			ASSERT(tmp_info->magic == save_info->magic);
19288c2ecf20Sopenharmony_ci			ASSERT(be32_to_cpu(tmp_info->forw) == drop_blk->blkno);
19298c2ecf20Sopenharmony_ci			tmp_info->forw = cpu_to_be32(save_blk->blkno);
19308c2ecf20Sopenharmony_ci			xfs_trans_log_buf(args->trans, bp, 0,
19318c2ecf20Sopenharmony_ci						    sizeof(*tmp_info) - 1);
19328c2ecf20Sopenharmony_ci		}
19338c2ecf20Sopenharmony_ci	} else {
19348c2ecf20Sopenharmony_ci		trace_xfs_da_unlink_forward(args);
19358c2ecf20Sopenharmony_ci		save_info->forw = drop_info->forw;
19368c2ecf20Sopenharmony_ci		if (drop_info->forw) {
19378c2ecf20Sopenharmony_ci			error = xfs_da3_node_read(args->trans, args->dp,
19388c2ecf20Sopenharmony_ci						be32_to_cpu(drop_info->forw),
19398c2ecf20Sopenharmony_ci						&bp, args->whichfork);
19408c2ecf20Sopenharmony_ci			if (error)
19418c2ecf20Sopenharmony_ci				return error;
19428c2ecf20Sopenharmony_ci			ASSERT(bp != NULL);
19438c2ecf20Sopenharmony_ci			tmp_info = bp->b_addr;
19448c2ecf20Sopenharmony_ci			ASSERT(tmp_info->magic == save_info->magic);
19458c2ecf20Sopenharmony_ci			ASSERT(be32_to_cpu(tmp_info->back) == drop_blk->blkno);
19468c2ecf20Sopenharmony_ci			tmp_info->back = cpu_to_be32(save_blk->blkno);
19478c2ecf20Sopenharmony_ci			xfs_trans_log_buf(args->trans, bp, 0,
19488c2ecf20Sopenharmony_ci						    sizeof(*tmp_info) - 1);
19498c2ecf20Sopenharmony_ci		}
19508c2ecf20Sopenharmony_ci	}
19518c2ecf20Sopenharmony_ci
19528c2ecf20Sopenharmony_ci	xfs_trans_log_buf(args->trans, save_blk->bp, 0, sizeof(*save_info) - 1);
19538c2ecf20Sopenharmony_ci	return 0;
19548c2ecf20Sopenharmony_ci}
19558c2ecf20Sopenharmony_ci
19568c2ecf20Sopenharmony_ci/*
19578c2ecf20Sopenharmony_ci * Move a path "forward" or "!forward" one block at the current level.
19588c2ecf20Sopenharmony_ci *
19598c2ecf20Sopenharmony_ci * This routine will adjust a "path" to point to the next block
19608c2ecf20Sopenharmony_ci * "forward" (higher hashvalues) or "!forward" (lower hashvals) in the
19618c2ecf20Sopenharmony_ci * Btree, including updating pointers to the intermediate nodes between
19628c2ecf20Sopenharmony_ci * the new bottom and the root.
19638c2ecf20Sopenharmony_ci */
19648c2ecf20Sopenharmony_ciint							/* error */
19658c2ecf20Sopenharmony_cixfs_da3_path_shift(
19668c2ecf20Sopenharmony_ci	struct xfs_da_state	*state,
19678c2ecf20Sopenharmony_ci	struct xfs_da_state_path *path,
19688c2ecf20Sopenharmony_ci	int			forward,
19698c2ecf20Sopenharmony_ci	int			release,
19708c2ecf20Sopenharmony_ci	int			*result)
19718c2ecf20Sopenharmony_ci{
19728c2ecf20Sopenharmony_ci	struct xfs_da_state_blk	*blk;
19738c2ecf20Sopenharmony_ci	struct xfs_da_blkinfo	*info;
19748c2ecf20Sopenharmony_ci	struct xfs_da_args	*args;
19758c2ecf20Sopenharmony_ci	struct xfs_da_node_entry *btree;
19768c2ecf20Sopenharmony_ci	struct xfs_da3_icnode_hdr nodehdr;
19778c2ecf20Sopenharmony_ci	struct xfs_buf		*bp;
19788c2ecf20Sopenharmony_ci	xfs_dablk_t		blkno = 0;
19798c2ecf20Sopenharmony_ci	int			level;
19808c2ecf20Sopenharmony_ci	int			error;
19818c2ecf20Sopenharmony_ci	struct xfs_inode	*dp = state->args->dp;
19828c2ecf20Sopenharmony_ci
19838c2ecf20Sopenharmony_ci	trace_xfs_da_path_shift(state->args);
19848c2ecf20Sopenharmony_ci
19858c2ecf20Sopenharmony_ci	/*
19868c2ecf20Sopenharmony_ci	 * Roll up the Btree looking for the first block where our
19878c2ecf20Sopenharmony_ci	 * current index is not at the edge of the block.  Note that
19888c2ecf20Sopenharmony_ci	 * we skip the bottom layer because we want the sibling block.
19898c2ecf20Sopenharmony_ci	 */
19908c2ecf20Sopenharmony_ci	args = state->args;
19918c2ecf20Sopenharmony_ci	ASSERT(args != NULL);
19928c2ecf20Sopenharmony_ci	ASSERT(path != NULL);
19938c2ecf20Sopenharmony_ci	ASSERT((path->active > 0) && (path->active < XFS_DA_NODE_MAXDEPTH));
19948c2ecf20Sopenharmony_ci	level = (path->active-1) - 1;	/* skip bottom layer in path */
19958c2ecf20Sopenharmony_ci	for (; level >= 0; level--) {
19968c2ecf20Sopenharmony_ci		blk = &path->blk[level];
19978c2ecf20Sopenharmony_ci		xfs_da3_node_hdr_from_disk(dp->i_mount, &nodehdr,
19988c2ecf20Sopenharmony_ci					   blk->bp->b_addr);
19998c2ecf20Sopenharmony_ci
20008c2ecf20Sopenharmony_ci		if (forward && (blk->index < nodehdr.count - 1)) {
20018c2ecf20Sopenharmony_ci			blk->index++;
20028c2ecf20Sopenharmony_ci			blkno = be32_to_cpu(nodehdr.btree[blk->index].before);
20038c2ecf20Sopenharmony_ci			break;
20048c2ecf20Sopenharmony_ci		} else if (!forward && (blk->index > 0)) {
20058c2ecf20Sopenharmony_ci			blk->index--;
20068c2ecf20Sopenharmony_ci			blkno = be32_to_cpu(nodehdr.btree[blk->index].before);
20078c2ecf20Sopenharmony_ci			break;
20088c2ecf20Sopenharmony_ci		}
20098c2ecf20Sopenharmony_ci	}
20108c2ecf20Sopenharmony_ci	if (level < 0) {
20118c2ecf20Sopenharmony_ci		*result = -ENOENT;	/* we're out of our tree */
20128c2ecf20Sopenharmony_ci		ASSERT(args->op_flags & XFS_DA_OP_OKNOENT);
20138c2ecf20Sopenharmony_ci		return 0;
20148c2ecf20Sopenharmony_ci	}
20158c2ecf20Sopenharmony_ci
20168c2ecf20Sopenharmony_ci	/*
20178c2ecf20Sopenharmony_ci	 * Roll down the edge of the subtree until we reach the
20188c2ecf20Sopenharmony_ci	 * same depth we were at originally.
20198c2ecf20Sopenharmony_ci	 */
20208c2ecf20Sopenharmony_ci	for (blk++, level++; level < path->active; blk++, level++) {
20218c2ecf20Sopenharmony_ci		/*
20228c2ecf20Sopenharmony_ci		 * Read the next child block into a local buffer.
20238c2ecf20Sopenharmony_ci		 */
20248c2ecf20Sopenharmony_ci		error = xfs_da3_node_read(args->trans, dp, blkno, &bp,
20258c2ecf20Sopenharmony_ci					  args->whichfork);
20268c2ecf20Sopenharmony_ci		if (error)
20278c2ecf20Sopenharmony_ci			return error;
20288c2ecf20Sopenharmony_ci
20298c2ecf20Sopenharmony_ci		/*
20308c2ecf20Sopenharmony_ci		 * Release the old block (if it's dirty, the trans doesn't
20318c2ecf20Sopenharmony_ci		 * actually let go) and swap the local buffer into the path
20328c2ecf20Sopenharmony_ci		 * structure. This ensures failure of the above read doesn't set
20338c2ecf20Sopenharmony_ci		 * a NULL buffer in an active slot in the path.
20348c2ecf20Sopenharmony_ci		 */
20358c2ecf20Sopenharmony_ci		if (release)
20368c2ecf20Sopenharmony_ci			xfs_trans_brelse(args->trans, blk->bp);
20378c2ecf20Sopenharmony_ci		blk->blkno = blkno;
20388c2ecf20Sopenharmony_ci		blk->bp = bp;
20398c2ecf20Sopenharmony_ci
20408c2ecf20Sopenharmony_ci		info = blk->bp->b_addr;
20418c2ecf20Sopenharmony_ci		ASSERT(info->magic == cpu_to_be16(XFS_DA_NODE_MAGIC) ||
20428c2ecf20Sopenharmony_ci		       info->magic == cpu_to_be16(XFS_DA3_NODE_MAGIC) ||
20438c2ecf20Sopenharmony_ci		       info->magic == cpu_to_be16(XFS_DIR2_LEAFN_MAGIC) ||
20448c2ecf20Sopenharmony_ci		       info->magic == cpu_to_be16(XFS_DIR3_LEAFN_MAGIC) ||
20458c2ecf20Sopenharmony_ci		       info->magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC) ||
20468c2ecf20Sopenharmony_ci		       info->magic == cpu_to_be16(XFS_ATTR3_LEAF_MAGIC));
20478c2ecf20Sopenharmony_ci
20488c2ecf20Sopenharmony_ci
20498c2ecf20Sopenharmony_ci		/*
20508c2ecf20Sopenharmony_ci		 * Note: we flatten the magic number to a single type so we
20518c2ecf20Sopenharmony_ci		 * don't have to compare against crc/non-crc types elsewhere.
20528c2ecf20Sopenharmony_ci		 */
20538c2ecf20Sopenharmony_ci		switch (be16_to_cpu(info->magic)) {
20548c2ecf20Sopenharmony_ci		case XFS_DA_NODE_MAGIC:
20558c2ecf20Sopenharmony_ci		case XFS_DA3_NODE_MAGIC:
20568c2ecf20Sopenharmony_ci			blk->magic = XFS_DA_NODE_MAGIC;
20578c2ecf20Sopenharmony_ci			xfs_da3_node_hdr_from_disk(dp->i_mount, &nodehdr,
20588c2ecf20Sopenharmony_ci						   bp->b_addr);
20598c2ecf20Sopenharmony_ci			btree = nodehdr.btree;
20608c2ecf20Sopenharmony_ci			blk->hashval = be32_to_cpu(btree[nodehdr.count - 1].hashval);
20618c2ecf20Sopenharmony_ci			if (forward)
20628c2ecf20Sopenharmony_ci				blk->index = 0;
20638c2ecf20Sopenharmony_ci			else
20648c2ecf20Sopenharmony_ci				blk->index = nodehdr.count - 1;
20658c2ecf20Sopenharmony_ci			blkno = be32_to_cpu(btree[blk->index].before);
20668c2ecf20Sopenharmony_ci			break;
20678c2ecf20Sopenharmony_ci		case XFS_ATTR_LEAF_MAGIC:
20688c2ecf20Sopenharmony_ci		case XFS_ATTR3_LEAF_MAGIC:
20698c2ecf20Sopenharmony_ci			blk->magic = XFS_ATTR_LEAF_MAGIC;
20708c2ecf20Sopenharmony_ci			ASSERT(level == path->active-1);
20718c2ecf20Sopenharmony_ci			blk->index = 0;
20728c2ecf20Sopenharmony_ci			blk->hashval = xfs_attr_leaf_lasthash(blk->bp, NULL);
20738c2ecf20Sopenharmony_ci			break;
20748c2ecf20Sopenharmony_ci		case XFS_DIR2_LEAFN_MAGIC:
20758c2ecf20Sopenharmony_ci		case XFS_DIR3_LEAFN_MAGIC:
20768c2ecf20Sopenharmony_ci			blk->magic = XFS_DIR2_LEAFN_MAGIC;
20778c2ecf20Sopenharmony_ci			ASSERT(level == path->active-1);
20788c2ecf20Sopenharmony_ci			blk->index = 0;
20798c2ecf20Sopenharmony_ci			blk->hashval = xfs_dir2_leaf_lasthash(args->dp,
20808c2ecf20Sopenharmony_ci							      blk->bp, NULL);
20818c2ecf20Sopenharmony_ci			break;
20828c2ecf20Sopenharmony_ci		default:
20838c2ecf20Sopenharmony_ci			ASSERT(0);
20848c2ecf20Sopenharmony_ci			break;
20858c2ecf20Sopenharmony_ci		}
20868c2ecf20Sopenharmony_ci	}
20878c2ecf20Sopenharmony_ci	*result = 0;
20888c2ecf20Sopenharmony_ci	return 0;
20898c2ecf20Sopenharmony_ci}
20908c2ecf20Sopenharmony_ci
20918c2ecf20Sopenharmony_ci
20928c2ecf20Sopenharmony_ci/*========================================================================
20938c2ecf20Sopenharmony_ci * Utility routines.
20948c2ecf20Sopenharmony_ci *========================================================================*/
20958c2ecf20Sopenharmony_ci
20968c2ecf20Sopenharmony_ci/*
20978c2ecf20Sopenharmony_ci * Implement a simple hash on a character string.
20988c2ecf20Sopenharmony_ci * Rotate the hash value by 7 bits, then XOR each character in.
20998c2ecf20Sopenharmony_ci * This is implemented with some source-level loop unrolling.
21008c2ecf20Sopenharmony_ci */
21018c2ecf20Sopenharmony_cixfs_dahash_t
21028c2ecf20Sopenharmony_cixfs_da_hashname(const uint8_t *name, int namelen)
21038c2ecf20Sopenharmony_ci{
21048c2ecf20Sopenharmony_ci	xfs_dahash_t hash;
21058c2ecf20Sopenharmony_ci
21068c2ecf20Sopenharmony_ci	/*
21078c2ecf20Sopenharmony_ci	 * Do four characters at a time as long as we can.
21088c2ecf20Sopenharmony_ci	 */
21098c2ecf20Sopenharmony_ci	for (hash = 0; namelen >= 4; namelen -= 4, name += 4)
21108c2ecf20Sopenharmony_ci		hash = (name[0] << 21) ^ (name[1] << 14) ^ (name[2] << 7) ^
21118c2ecf20Sopenharmony_ci		       (name[3] << 0) ^ rol32(hash, 7 * 4);
21128c2ecf20Sopenharmony_ci
21138c2ecf20Sopenharmony_ci	/*
21148c2ecf20Sopenharmony_ci	 * Now do the rest of the characters.
21158c2ecf20Sopenharmony_ci	 */
21168c2ecf20Sopenharmony_ci	switch (namelen) {
21178c2ecf20Sopenharmony_ci	case 3:
21188c2ecf20Sopenharmony_ci		return (name[0] << 14) ^ (name[1] << 7) ^ (name[2] << 0) ^
21198c2ecf20Sopenharmony_ci		       rol32(hash, 7 * 3);
21208c2ecf20Sopenharmony_ci	case 2:
21218c2ecf20Sopenharmony_ci		return (name[0] << 7) ^ (name[1] << 0) ^ rol32(hash, 7 * 2);
21228c2ecf20Sopenharmony_ci	case 1:
21238c2ecf20Sopenharmony_ci		return (name[0] << 0) ^ rol32(hash, 7 * 1);
21248c2ecf20Sopenharmony_ci	default: /* case 0: */
21258c2ecf20Sopenharmony_ci		return hash;
21268c2ecf20Sopenharmony_ci	}
21278c2ecf20Sopenharmony_ci}
21288c2ecf20Sopenharmony_ci
21298c2ecf20Sopenharmony_cienum xfs_dacmp
21308c2ecf20Sopenharmony_cixfs_da_compname(
21318c2ecf20Sopenharmony_ci	struct xfs_da_args *args,
21328c2ecf20Sopenharmony_ci	const unsigned char *name,
21338c2ecf20Sopenharmony_ci	int		len)
21348c2ecf20Sopenharmony_ci{
21358c2ecf20Sopenharmony_ci	return (args->namelen == len && memcmp(args->name, name, len) == 0) ?
21368c2ecf20Sopenharmony_ci					XFS_CMP_EXACT : XFS_CMP_DIFFERENT;
21378c2ecf20Sopenharmony_ci}
21388c2ecf20Sopenharmony_ci
21398c2ecf20Sopenharmony_ciint
21408c2ecf20Sopenharmony_cixfs_da_grow_inode_int(
21418c2ecf20Sopenharmony_ci	struct xfs_da_args	*args,
21428c2ecf20Sopenharmony_ci	xfs_fileoff_t		*bno,
21438c2ecf20Sopenharmony_ci	int			count)
21448c2ecf20Sopenharmony_ci{
21458c2ecf20Sopenharmony_ci	struct xfs_trans	*tp = args->trans;
21468c2ecf20Sopenharmony_ci	struct xfs_inode	*dp = args->dp;
21478c2ecf20Sopenharmony_ci	int			w = args->whichfork;
21488c2ecf20Sopenharmony_ci	xfs_rfsblock_t		nblks = dp->i_d.di_nblocks;
21498c2ecf20Sopenharmony_ci	struct xfs_bmbt_irec	map, *mapp;
21508c2ecf20Sopenharmony_ci	int			nmap, error, got, i, mapi;
21518c2ecf20Sopenharmony_ci
21528c2ecf20Sopenharmony_ci	/*
21538c2ecf20Sopenharmony_ci	 * Find a spot in the file space to put the new block.
21548c2ecf20Sopenharmony_ci	 */
21558c2ecf20Sopenharmony_ci	error = xfs_bmap_first_unused(tp, dp, count, bno, w);
21568c2ecf20Sopenharmony_ci	if (error)
21578c2ecf20Sopenharmony_ci		return error;
21588c2ecf20Sopenharmony_ci
21598c2ecf20Sopenharmony_ci	/*
21608c2ecf20Sopenharmony_ci	 * Try mapping it in one filesystem block.
21618c2ecf20Sopenharmony_ci	 */
21628c2ecf20Sopenharmony_ci	nmap = 1;
21638c2ecf20Sopenharmony_ci	error = xfs_bmapi_write(tp, dp, *bno, count,
21648c2ecf20Sopenharmony_ci			xfs_bmapi_aflag(w)|XFS_BMAPI_METADATA|XFS_BMAPI_CONTIG,
21658c2ecf20Sopenharmony_ci			args->total, &map, &nmap);
21668c2ecf20Sopenharmony_ci	if (error)
21678c2ecf20Sopenharmony_ci		return error;
21688c2ecf20Sopenharmony_ci
21698c2ecf20Sopenharmony_ci	ASSERT(nmap <= 1);
21708c2ecf20Sopenharmony_ci	if (nmap == 1) {
21718c2ecf20Sopenharmony_ci		mapp = &map;
21728c2ecf20Sopenharmony_ci		mapi = 1;
21738c2ecf20Sopenharmony_ci	} else if (nmap == 0 && count > 1) {
21748c2ecf20Sopenharmony_ci		xfs_fileoff_t		b;
21758c2ecf20Sopenharmony_ci		int			c;
21768c2ecf20Sopenharmony_ci
21778c2ecf20Sopenharmony_ci		/*
21788c2ecf20Sopenharmony_ci		 * If we didn't get it and the block might work if fragmented,
21798c2ecf20Sopenharmony_ci		 * try without the CONTIG flag.  Loop until we get it all.
21808c2ecf20Sopenharmony_ci		 */
21818c2ecf20Sopenharmony_ci		mapp = kmem_alloc(sizeof(*mapp) * count, 0);
21828c2ecf20Sopenharmony_ci		for (b = *bno, mapi = 0; b < *bno + count; ) {
21838c2ecf20Sopenharmony_ci			nmap = min(XFS_BMAP_MAX_NMAP, count);
21848c2ecf20Sopenharmony_ci			c = (int)(*bno + count - b);
21858c2ecf20Sopenharmony_ci			error = xfs_bmapi_write(tp, dp, b, c,
21868c2ecf20Sopenharmony_ci					xfs_bmapi_aflag(w)|XFS_BMAPI_METADATA,
21878c2ecf20Sopenharmony_ci					args->total, &mapp[mapi], &nmap);
21888c2ecf20Sopenharmony_ci			if (error)
21898c2ecf20Sopenharmony_ci				goto out_free_map;
21908c2ecf20Sopenharmony_ci			if (nmap < 1)
21918c2ecf20Sopenharmony_ci				break;
21928c2ecf20Sopenharmony_ci			mapi += nmap;
21938c2ecf20Sopenharmony_ci			b = mapp[mapi - 1].br_startoff +
21948c2ecf20Sopenharmony_ci			    mapp[mapi - 1].br_blockcount;
21958c2ecf20Sopenharmony_ci		}
21968c2ecf20Sopenharmony_ci	} else {
21978c2ecf20Sopenharmony_ci		mapi = 0;
21988c2ecf20Sopenharmony_ci		mapp = NULL;
21998c2ecf20Sopenharmony_ci	}
22008c2ecf20Sopenharmony_ci
22018c2ecf20Sopenharmony_ci	/*
22028c2ecf20Sopenharmony_ci	 * Count the blocks we got, make sure it matches the total.
22038c2ecf20Sopenharmony_ci	 */
22048c2ecf20Sopenharmony_ci	for (i = 0, got = 0; i < mapi; i++)
22058c2ecf20Sopenharmony_ci		got += mapp[i].br_blockcount;
22068c2ecf20Sopenharmony_ci	if (got != count || mapp[0].br_startoff != *bno ||
22078c2ecf20Sopenharmony_ci	    mapp[mapi - 1].br_startoff + mapp[mapi - 1].br_blockcount !=
22088c2ecf20Sopenharmony_ci	    *bno + count) {
22098c2ecf20Sopenharmony_ci		error = -ENOSPC;
22108c2ecf20Sopenharmony_ci		goto out_free_map;
22118c2ecf20Sopenharmony_ci	}
22128c2ecf20Sopenharmony_ci
22138c2ecf20Sopenharmony_ci	/* account for newly allocated blocks in reserved blocks total */
22148c2ecf20Sopenharmony_ci	args->total -= dp->i_d.di_nblocks - nblks;
22158c2ecf20Sopenharmony_ci
22168c2ecf20Sopenharmony_ciout_free_map:
22178c2ecf20Sopenharmony_ci	if (mapp != &map)
22188c2ecf20Sopenharmony_ci		kmem_free(mapp);
22198c2ecf20Sopenharmony_ci	return error;
22208c2ecf20Sopenharmony_ci}
22218c2ecf20Sopenharmony_ci
22228c2ecf20Sopenharmony_ci/*
22238c2ecf20Sopenharmony_ci * Add a block to the btree ahead of the file.
22248c2ecf20Sopenharmony_ci * Return the new block number to the caller.
22258c2ecf20Sopenharmony_ci */
22268c2ecf20Sopenharmony_ciint
22278c2ecf20Sopenharmony_cixfs_da_grow_inode(
22288c2ecf20Sopenharmony_ci	struct xfs_da_args	*args,
22298c2ecf20Sopenharmony_ci	xfs_dablk_t		*new_blkno)
22308c2ecf20Sopenharmony_ci{
22318c2ecf20Sopenharmony_ci	xfs_fileoff_t		bno;
22328c2ecf20Sopenharmony_ci	int			error;
22338c2ecf20Sopenharmony_ci
22348c2ecf20Sopenharmony_ci	trace_xfs_da_grow_inode(args);
22358c2ecf20Sopenharmony_ci
22368c2ecf20Sopenharmony_ci	bno = args->geo->leafblk;
22378c2ecf20Sopenharmony_ci	error = xfs_da_grow_inode_int(args, &bno, args->geo->fsbcount);
22388c2ecf20Sopenharmony_ci	if (!error)
22398c2ecf20Sopenharmony_ci		*new_blkno = (xfs_dablk_t)bno;
22408c2ecf20Sopenharmony_ci	return error;
22418c2ecf20Sopenharmony_ci}
22428c2ecf20Sopenharmony_ci
22438c2ecf20Sopenharmony_ci/*
22448c2ecf20Sopenharmony_ci * Ick.  We need to always be able to remove a btree block, even
22458c2ecf20Sopenharmony_ci * if there's no space reservation because the filesystem is full.
22468c2ecf20Sopenharmony_ci * This is called if xfs_bunmapi on a btree block fails due to ENOSPC.
22478c2ecf20Sopenharmony_ci * It swaps the target block with the last block in the file.  The
22488c2ecf20Sopenharmony_ci * last block in the file can always be removed since it can't cause
22498c2ecf20Sopenharmony_ci * a bmap btree split to do that.
22508c2ecf20Sopenharmony_ci */
22518c2ecf20Sopenharmony_ciSTATIC int
22528c2ecf20Sopenharmony_cixfs_da3_swap_lastblock(
22538c2ecf20Sopenharmony_ci	struct xfs_da_args	*args,
22548c2ecf20Sopenharmony_ci	xfs_dablk_t		*dead_blknop,
22558c2ecf20Sopenharmony_ci	struct xfs_buf		**dead_bufp)
22568c2ecf20Sopenharmony_ci{
22578c2ecf20Sopenharmony_ci	struct xfs_da_blkinfo	*dead_info;
22588c2ecf20Sopenharmony_ci	struct xfs_da_blkinfo	*sib_info;
22598c2ecf20Sopenharmony_ci	struct xfs_da_intnode	*par_node;
22608c2ecf20Sopenharmony_ci	struct xfs_da_intnode	*dead_node;
22618c2ecf20Sopenharmony_ci	struct xfs_dir2_leaf	*dead_leaf2;
22628c2ecf20Sopenharmony_ci	struct xfs_da_node_entry *btree;
22638c2ecf20Sopenharmony_ci	struct xfs_da3_icnode_hdr par_hdr;
22648c2ecf20Sopenharmony_ci	struct xfs_inode	*dp;
22658c2ecf20Sopenharmony_ci	struct xfs_trans	*tp;
22668c2ecf20Sopenharmony_ci	struct xfs_mount	*mp;
22678c2ecf20Sopenharmony_ci	struct xfs_buf		*dead_buf;
22688c2ecf20Sopenharmony_ci	struct xfs_buf		*last_buf;
22698c2ecf20Sopenharmony_ci	struct xfs_buf		*sib_buf;
22708c2ecf20Sopenharmony_ci	struct xfs_buf		*par_buf;
22718c2ecf20Sopenharmony_ci	xfs_dahash_t		dead_hash;
22728c2ecf20Sopenharmony_ci	xfs_fileoff_t		lastoff;
22738c2ecf20Sopenharmony_ci	xfs_dablk_t		dead_blkno;
22748c2ecf20Sopenharmony_ci	xfs_dablk_t		last_blkno;
22758c2ecf20Sopenharmony_ci	xfs_dablk_t		sib_blkno;
22768c2ecf20Sopenharmony_ci	xfs_dablk_t		par_blkno;
22778c2ecf20Sopenharmony_ci	int			error;
22788c2ecf20Sopenharmony_ci	int			w;
22798c2ecf20Sopenharmony_ci	int			entno;
22808c2ecf20Sopenharmony_ci	int			level;
22818c2ecf20Sopenharmony_ci	int			dead_level;
22828c2ecf20Sopenharmony_ci
22838c2ecf20Sopenharmony_ci	trace_xfs_da_swap_lastblock(args);
22848c2ecf20Sopenharmony_ci
22858c2ecf20Sopenharmony_ci	dead_buf = *dead_bufp;
22868c2ecf20Sopenharmony_ci	dead_blkno = *dead_blknop;
22878c2ecf20Sopenharmony_ci	tp = args->trans;
22888c2ecf20Sopenharmony_ci	dp = args->dp;
22898c2ecf20Sopenharmony_ci	w = args->whichfork;
22908c2ecf20Sopenharmony_ci	ASSERT(w == XFS_DATA_FORK);
22918c2ecf20Sopenharmony_ci	mp = dp->i_mount;
22928c2ecf20Sopenharmony_ci	lastoff = args->geo->freeblk;
22938c2ecf20Sopenharmony_ci	error = xfs_bmap_last_before(tp, dp, &lastoff, w);
22948c2ecf20Sopenharmony_ci	if (error)
22958c2ecf20Sopenharmony_ci		return error;
22968c2ecf20Sopenharmony_ci	if (XFS_IS_CORRUPT(mp, lastoff == 0))
22978c2ecf20Sopenharmony_ci		return -EFSCORRUPTED;
22988c2ecf20Sopenharmony_ci	/*
22998c2ecf20Sopenharmony_ci	 * Read the last block in the btree space.
23008c2ecf20Sopenharmony_ci	 */
23018c2ecf20Sopenharmony_ci	last_blkno = (xfs_dablk_t)lastoff - args->geo->fsbcount;
23028c2ecf20Sopenharmony_ci	error = xfs_da3_node_read(tp, dp, last_blkno, &last_buf, w);
23038c2ecf20Sopenharmony_ci	if (error)
23048c2ecf20Sopenharmony_ci		return error;
23058c2ecf20Sopenharmony_ci	/*
23068c2ecf20Sopenharmony_ci	 * Copy the last block into the dead buffer and log it.
23078c2ecf20Sopenharmony_ci	 */
23088c2ecf20Sopenharmony_ci	memcpy(dead_buf->b_addr, last_buf->b_addr, args->geo->blksize);
23098c2ecf20Sopenharmony_ci	xfs_trans_log_buf(tp, dead_buf, 0, args->geo->blksize - 1);
23108c2ecf20Sopenharmony_ci	dead_info = dead_buf->b_addr;
23118c2ecf20Sopenharmony_ci	/*
23128c2ecf20Sopenharmony_ci	 * Get values from the moved block.
23138c2ecf20Sopenharmony_ci	 */
23148c2ecf20Sopenharmony_ci	if (dead_info->magic == cpu_to_be16(XFS_DIR2_LEAFN_MAGIC) ||
23158c2ecf20Sopenharmony_ci	    dead_info->magic == cpu_to_be16(XFS_DIR3_LEAFN_MAGIC)) {
23168c2ecf20Sopenharmony_ci		struct xfs_dir3_icleaf_hdr leafhdr;
23178c2ecf20Sopenharmony_ci		struct xfs_dir2_leaf_entry *ents;
23188c2ecf20Sopenharmony_ci
23198c2ecf20Sopenharmony_ci		dead_leaf2 = (xfs_dir2_leaf_t *)dead_info;
23208c2ecf20Sopenharmony_ci		xfs_dir2_leaf_hdr_from_disk(dp->i_mount, &leafhdr,
23218c2ecf20Sopenharmony_ci					    dead_leaf2);
23228c2ecf20Sopenharmony_ci		ents = leafhdr.ents;
23238c2ecf20Sopenharmony_ci		dead_level = 0;
23248c2ecf20Sopenharmony_ci		dead_hash = be32_to_cpu(ents[leafhdr.count - 1].hashval);
23258c2ecf20Sopenharmony_ci	} else {
23268c2ecf20Sopenharmony_ci		struct xfs_da3_icnode_hdr deadhdr;
23278c2ecf20Sopenharmony_ci
23288c2ecf20Sopenharmony_ci		dead_node = (xfs_da_intnode_t *)dead_info;
23298c2ecf20Sopenharmony_ci		xfs_da3_node_hdr_from_disk(dp->i_mount, &deadhdr, dead_node);
23308c2ecf20Sopenharmony_ci		btree = deadhdr.btree;
23318c2ecf20Sopenharmony_ci		dead_level = deadhdr.level;
23328c2ecf20Sopenharmony_ci		dead_hash = be32_to_cpu(btree[deadhdr.count - 1].hashval);
23338c2ecf20Sopenharmony_ci	}
23348c2ecf20Sopenharmony_ci	sib_buf = par_buf = NULL;
23358c2ecf20Sopenharmony_ci	/*
23368c2ecf20Sopenharmony_ci	 * If the moved block has a left sibling, fix up the pointers.
23378c2ecf20Sopenharmony_ci	 */
23388c2ecf20Sopenharmony_ci	if ((sib_blkno = be32_to_cpu(dead_info->back))) {
23398c2ecf20Sopenharmony_ci		error = xfs_da3_node_read(tp, dp, sib_blkno, &sib_buf, w);
23408c2ecf20Sopenharmony_ci		if (error)
23418c2ecf20Sopenharmony_ci			goto done;
23428c2ecf20Sopenharmony_ci		sib_info = sib_buf->b_addr;
23438c2ecf20Sopenharmony_ci		if (XFS_IS_CORRUPT(mp,
23448c2ecf20Sopenharmony_ci				   be32_to_cpu(sib_info->forw) != last_blkno ||
23458c2ecf20Sopenharmony_ci				   sib_info->magic != dead_info->magic)) {
23468c2ecf20Sopenharmony_ci			error = -EFSCORRUPTED;
23478c2ecf20Sopenharmony_ci			goto done;
23488c2ecf20Sopenharmony_ci		}
23498c2ecf20Sopenharmony_ci		sib_info->forw = cpu_to_be32(dead_blkno);
23508c2ecf20Sopenharmony_ci		xfs_trans_log_buf(tp, sib_buf,
23518c2ecf20Sopenharmony_ci			XFS_DA_LOGRANGE(sib_info, &sib_info->forw,
23528c2ecf20Sopenharmony_ci					sizeof(sib_info->forw)));
23538c2ecf20Sopenharmony_ci		sib_buf = NULL;
23548c2ecf20Sopenharmony_ci	}
23558c2ecf20Sopenharmony_ci	/*
23568c2ecf20Sopenharmony_ci	 * If the moved block has a right sibling, fix up the pointers.
23578c2ecf20Sopenharmony_ci	 */
23588c2ecf20Sopenharmony_ci	if ((sib_blkno = be32_to_cpu(dead_info->forw))) {
23598c2ecf20Sopenharmony_ci		error = xfs_da3_node_read(tp, dp, sib_blkno, &sib_buf, w);
23608c2ecf20Sopenharmony_ci		if (error)
23618c2ecf20Sopenharmony_ci			goto done;
23628c2ecf20Sopenharmony_ci		sib_info = sib_buf->b_addr;
23638c2ecf20Sopenharmony_ci		if (XFS_IS_CORRUPT(mp,
23648c2ecf20Sopenharmony_ci				   be32_to_cpu(sib_info->back) != last_blkno ||
23658c2ecf20Sopenharmony_ci				   sib_info->magic != dead_info->magic)) {
23668c2ecf20Sopenharmony_ci			error = -EFSCORRUPTED;
23678c2ecf20Sopenharmony_ci			goto done;
23688c2ecf20Sopenharmony_ci		}
23698c2ecf20Sopenharmony_ci		sib_info->back = cpu_to_be32(dead_blkno);
23708c2ecf20Sopenharmony_ci		xfs_trans_log_buf(tp, sib_buf,
23718c2ecf20Sopenharmony_ci			XFS_DA_LOGRANGE(sib_info, &sib_info->back,
23728c2ecf20Sopenharmony_ci					sizeof(sib_info->back)));
23738c2ecf20Sopenharmony_ci		sib_buf = NULL;
23748c2ecf20Sopenharmony_ci	}
23758c2ecf20Sopenharmony_ci	par_blkno = args->geo->leafblk;
23768c2ecf20Sopenharmony_ci	level = -1;
23778c2ecf20Sopenharmony_ci	/*
23788c2ecf20Sopenharmony_ci	 * Walk down the tree looking for the parent of the moved block.
23798c2ecf20Sopenharmony_ci	 */
23808c2ecf20Sopenharmony_ci	for (;;) {
23818c2ecf20Sopenharmony_ci		error = xfs_da3_node_read(tp, dp, par_blkno, &par_buf, w);
23828c2ecf20Sopenharmony_ci		if (error)
23838c2ecf20Sopenharmony_ci			goto done;
23848c2ecf20Sopenharmony_ci		par_node = par_buf->b_addr;
23858c2ecf20Sopenharmony_ci		xfs_da3_node_hdr_from_disk(dp->i_mount, &par_hdr, par_node);
23868c2ecf20Sopenharmony_ci		if (XFS_IS_CORRUPT(mp,
23878c2ecf20Sopenharmony_ci				   level >= 0 && level != par_hdr.level + 1)) {
23888c2ecf20Sopenharmony_ci			error = -EFSCORRUPTED;
23898c2ecf20Sopenharmony_ci			goto done;
23908c2ecf20Sopenharmony_ci		}
23918c2ecf20Sopenharmony_ci		level = par_hdr.level;
23928c2ecf20Sopenharmony_ci		btree = par_hdr.btree;
23938c2ecf20Sopenharmony_ci		for (entno = 0;
23948c2ecf20Sopenharmony_ci		     entno < par_hdr.count &&
23958c2ecf20Sopenharmony_ci		     be32_to_cpu(btree[entno].hashval) < dead_hash;
23968c2ecf20Sopenharmony_ci		     entno++)
23978c2ecf20Sopenharmony_ci			continue;
23988c2ecf20Sopenharmony_ci		if (XFS_IS_CORRUPT(mp, entno == par_hdr.count)) {
23998c2ecf20Sopenharmony_ci			error = -EFSCORRUPTED;
24008c2ecf20Sopenharmony_ci			goto done;
24018c2ecf20Sopenharmony_ci		}
24028c2ecf20Sopenharmony_ci		par_blkno = be32_to_cpu(btree[entno].before);
24038c2ecf20Sopenharmony_ci		if (level == dead_level + 1)
24048c2ecf20Sopenharmony_ci			break;
24058c2ecf20Sopenharmony_ci		xfs_trans_brelse(tp, par_buf);
24068c2ecf20Sopenharmony_ci		par_buf = NULL;
24078c2ecf20Sopenharmony_ci	}
24088c2ecf20Sopenharmony_ci	/*
24098c2ecf20Sopenharmony_ci	 * We're in the right parent block.
24108c2ecf20Sopenharmony_ci	 * Look for the right entry.
24118c2ecf20Sopenharmony_ci	 */
24128c2ecf20Sopenharmony_ci	for (;;) {
24138c2ecf20Sopenharmony_ci		for (;
24148c2ecf20Sopenharmony_ci		     entno < par_hdr.count &&
24158c2ecf20Sopenharmony_ci		     be32_to_cpu(btree[entno].before) != last_blkno;
24168c2ecf20Sopenharmony_ci		     entno++)
24178c2ecf20Sopenharmony_ci			continue;
24188c2ecf20Sopenharmony_ci		if (entno < par_hdr.count)
24198c2ecf20Sopenharmony_ci			break;
24208c2ecf20Sopenharmony_ci		par_blkno = par_hdr.forw;
24218c2ecf20Sopenharmony_ci		xfs_trans_brelse(tp, par_buf);
24228c2ecf20Sopenharmony_ci		par_buf = NULL;
24238c2ecf20Sopenharmony_ci		if (XFS_IS_CORRUPT(mp, par_blkno == 0)) {
24248c2ecf20Sopenharmony_ci			error = -EFSCORRUPTED;
24258c2ecf20Sopenharmony_ci			goto done;
24268c2ecf20Sopenharmony_ci		}
24278c2ecf20Sopenharmony_ci		error = xfs_da3_node_read(tp, dp, par_blkno, &par_buf, w);
24288c2ecf20Sopenharmony_ci		if (error)
24298c2ecf20Sopenharmony_ci			goto done;
24308c2ecf20Sopenharmony_ci		par_node = par_buf->b_addr;
24318c2ecf20Sopenharmony_ci		xfs_da3_node_hdr_from_disk(dp->i_mount, &par_hdr, par_node);
24328c2ecf20Sopenharmony_ci		if (XFS_IS_CORRUPT(mp, par_hdr.level != level)) {
24338c2ecf20Sopenharmony_ci			error = -EFSCORRUPTED;
24348c2ecf20Sopenharmony_ci			goto done;
24358c2ecf20Sopenharmony_ci		}
24368c2ecf20Sopenharmony_ci		btree = par_hdr.btree;
24378c2ecf20Sopenharmony_ci		entno = 0;
24388c2ecf20Sopenharmony_ci	}
24398c2ecf20Sopenharmony_ci	/*
24408c2ecf20Sopenharmony_ci	 * Update the parent entry pointing to the moved block.
24418c2ecf20Sopenharmony_ci	 */
24428c2ecf20Sopenharmony_ci	btree[entno].before = cpu_to_be32(dead_blkno);
24438c2ecf20Sopenharmony_ci	xfs_trans_log_buf(tp, par_buf,
24448c2ecf20Sopenharmony_ci		XFS_DA_LOGRANGE(par_node, &btree[entno].before,
24458c2ecf20Sopenharmony_ci				sizeof(btree[entno].before)));
24468c2ecf20Sopenharmony_ci	*dead_blknop = last_blkno;
24478c2ecf20Sopenharmony_ci	*dead_bufp = last_buf;
24488c2ecf20Sopenharmony_ci	return 0;
24498c2ecf20Sopenharmony_cidone:
24508c2ecf20Sopenharmony_ci	if (par_buf)
24518c2ecf20Sopenharmony_ci		xfs_trans_brelse(tp, par_buf);
24528c2ecf20Sopenharmony_ci	if (sib_buf)
24538c2ecf20Sopenharmony_ci		xfs_trans_brelse(tp, sib_buf);
24548c2ecf20Sopenharmony_ci	xfs_trans_brelse(tp, last_buf);
24558c2ecf20Sopenharmony_ci	return error;
24568c2ecf20Sopenharmony_ci}
24578c2ecf20Sopenharmony_ci
24588c2ecf20Sopenharmony_ci/*
24598c2ecf20Sopenharmony_ci * Remove a btree block from a directory or attribute.
24608c2ecf20Sopenharmony_ci */
24618c2ecf20Sopenharmony_ciint
24628c2ecf20Sopenharmony_cixfs_da_shrink_inode(
24638c2ecf20Sopenharmony_ci	struct xfs_da_args	*args,
24648c2ecf20Sopenharmony_ci	xfs_dablk_t		dead_blkno,
24658c2ecf20Sopenharmony_ci	struct xfs_buf		*dead_buf)
24668c2ecf20Sopenharmony_ci{
24678c2ecf20Sopenharmony_ci	struct xfs_inode	*dp;
24688c2ecf20Sopenharmony_ci	int			done, error, w, count;
24698c2ecf20Sopenharmony_ci	struct xfs_trans	*tp;
24708c2ecf20Sopenharmony_ci
24718c2ecf20Sopenharmony_ci	trace_xfs_da_shrink_inode(args);
24728c2ecf20Sopenharmony_ci
24738c2ecf20Sopenharmony_ci	dp = args->dp;
24748c2ecf20Sopenharmony_ci	w = args->whichfork;
24758c2ecf20Sopenharmony_ci	tp = args->trans;
24768c2ecf20Sopenharmony_ci	count = args->geo->fsbcount;
24778c2ecf20Sopenharmony_ci	for (;;) {
24788c2ecf20Sopenharmony_ci		/*
24798c2ecf20Sopenharmony_ci		 * Remove extents.  If we get ENOSPC for a dir we have to move
24808c2ecf20Sopenharmony_ci		 * the last block to the place we want to kill.
24818c2ecf20Sopenharmony_ci		 */
24828c2ecf20Sopenharmony_ci		error = xfs_bunmapi(tp, dp, dead_blkno, count,
24838c2ecf20Sopenharmony_ci				    xfs_bmapi_aflag(w), 0, &done);
24848c2ecf20Sopenharmony_ci		if (error == -ENOSPC) {
24858c2ecf20Sopenharmony_ci			if (w != XFS_DATA_FORK)
24868c2ecf20Sopenharmony_ci				break;
24878c2ecf20Sopenharmony_ci			error = xfs_da3_swap_lastblock(args, &dead_blkno,
24888c2ecf20Sopenharmony_ci						      &dead_buf);
24898c2ecf20Sopenharmony_ci			if (error)
24908c2ecf20Sopenharmony_ci				break;
24918c2ecf20Sopenharmony_ci		} else {
24928c2ecf20Sopenharmony_ci			break;
24938c2ecf20Sopenharmony_ci		}
24948c2ecf20Sopenharmony_ci	}
24958c2ecf20Sopenharmony_ci	xfs_trans_binval(tp, dead_buf);
24968c2ecf20Sopenharmony_ci	return error;
24978c2ecf20Sopenharmony_ci}
24988c2ecf20Sopenharmony_ci
24998c2ecf20Sopenharmony_cistatic int
25008c2ecf20Sopenharmony_cixfs_dabuf_map(
25018c2ecf20Sopenharmony_ci	struct xfs_inode	*dp,
25028c2ecf20Sopenharmony_ci	xfs_dablk_t		bno,
25038c2ecf20Sopenharmony_ci	unsigned int		flags,
25048c2ecf20Sopenharmony_ci	int			whichfork,
25058c2ecf20Sopenharmony_ci	struct xfs_buf_map	**mapp,
25068c2ecf20Sopenharmony_ci	int			*nmaps)
25078c2ecf20Sopenharmony_ci{
25088c2ecf20Sopenharmony_ci	struct xfs_mount	*mp = dp->i_mount;
25098c2ecf20Sopenharmony_ci	int			nfsb = xfs_dabuf_nfsb(mp, whichfork);
25108c2ecf20Sopenharmony_ci	struct xfs_bmbt_irec	irec, *irecs = &irec;
25118c2ecf20Sopenharmony_ci	struct xfs_buf_map	*map = *mapp;
25128c2ecf20Sopenharmony_ci	xfs_fileoff_t		off = bno;
25138c2ecf20Sopenharmony_ci	int			error = 0, nirecs, i;
25148c2ecf20Sopenharmony_ci
25158c2ecf20Sopenharmony_ci	if (nfsb > 1)
25168c2ecf20Sopenharmony_ci		irecs = kmem_zalloc(sizeof(irec) * nfsb, KM_NOFS);
25178c2ecf20Sopenharmony_ci
25188c2ecf20Sopenharmony_ci	nirecs = nfsb;
25198c2ecf20Sopenharmony_ci	error = xfs_bmapi_read(dp, bno, nfsb, irecs, &nirecs,
25208c2ecf20Sopenharmony_ci			xfs_bmapi_aflag(whichfork));
25218c2ecf20Sopenharmony_ci	if (error)
25228c2ecf20Sopenharmony_ci		goto out_free_irecs;
25238c2ecf20Sopenharmony_ci
25248c2ecf20Sopenharmony_ci	/*
25258c2ecf20Sopenharmony_ci	 * Use the caller provided map for the single map case, else allocate a
25268c2ecf20Sopenharmony_ci	 * larger one that needs to be free by the caller.
25278c2ecf20Sopenharmony_ci	 */
25288c2ecf20Sopenharmony_ci	if (nirecs > 1) {
25298c2ecf20Sopenharmony_ci		map = kmem_zalloc(nirecs * sizeof(struct xfs_buf_map), KM_NOFS);
25308c2ecf20Sopenharmony_ci		if (!map) {
25318c2ecf20Sopenharmony_ci			error = -ENOMEM;
25328c2ecf20Sopenharmony_ci			goto out_free_irecs;
25338c2ecf20Sopenharmony_ci		}
25348c2ecf20Sopenharmony_ci		*mapp = map;
25358c2ecf20Sopenharmony_ci	}
25368c2ecf20Sopenharmony_ci
25378c2ecf20Sopenharmony_ci	for (i = 0; i < nirecs; i++) {
25388c2ecf20Sopenharmony_ci		if (irecs[i].br_startblock == HOLESTARTBLOCK ||
25398c2ecf20Sopenharmony_ci		    irecs[i].br_startblock == DELAYSTARTBLOCK)
25408c2ecf20Sopenharmony_ci			goto invalid_mapping;
25418c2ecf20Sopenharmony_ci		if (off != irecs[i].br_startoff)
25428c2ecf20Sopenharmony_ci			goto invalid_mapping;
25438c2ecf20Sopenharmony_ci
25448c2ecf20Sopenharmony_ci		map[i].bm_bn = XFS_FSB_TO_DADDR(mp, irecs[i].br_startblock);
25458c2ecf20Sopenharmony_ci		map[i].bm_len = XFS_FSB_TO_BB(mp, irecs[i].br_blockcount);
25468c2ecf20Sopenharmony_ci		off += irecs[i].br_blockcount;
25478c2ecf20Sopenharmony_ci	}
25488c2ecf20Sopenharmony_ci
25498c2ecf20Sopenharmony_ci	if (off != bno + nfsb)
25508c2ecf20Sopenharmony_ci		goto invalid_mapping;
25518c2ecf20Sopenharmony_ci
25528c2ecf20Sopenharmony_ci	*nmaps = nirecs;
25538c2ecf20Sopenharmony_ciout_free_irecs:
25548c2ecf20Sopenharmony_ci	if (irecs != &irec)
25558c2ecf20Sopenharmony_ci		kmem_free(irecs);
25568c2ecf20Sopenharmony_ci	return error;
25578c2ecf20Sopenharmony_ci
25588c2ecf20Sopenharmony_ciinvalid_mapping:
25598c2ecf20Sopenharmony_ci	/* Caller ok with no mapping. */
25608c2ecf20Sopenharmony_ci	if (XFS_IS_CORRUPT(mp, !(flags & XFS_DABUF_MAP_HOLE_OK))) {
25618c2ecf20Sopenharmony_ci		error = -EFSCORRUPTED;
25628c2ecf20Sopenharmony_ci		if (xfs_error_level >= XFS_ERRLEVEL_LOW) {
25638c2ecf20Sopenharmony_ci			xfs_alert(mp, "%s: bno %u inode %llu",
25648c2ecf20Sopenharmony_ci					__func__, bno, dp->i_ino);
25658c2ecf20Sopenharmony_ci
25668c2ecf20Sopenharmony_ci			for (i = 0; i < nirecs; i++) {
25678c2ecf20Sopenharmony_ci				xfs_alert(mp,
25688c2ecf20Sopenharmony_ci"[%02d] br_startoff %lld br_startblock %lld br_blockcount %lld br_state %d",
25698c2ecf20Sopenharmony_ci					i, irecs[i].br_startoff,
25708c2ecf20Sopenharmony_ci					irecs[i].br_startblock,
25718c2ecf20Sopenharmony_ci					irecs[i].br_blockcount,
25728c2ecf20Sopenharmony_ci					irecs[i].br_state);
25738c2ecf20Sopenharmony_ci			}
25748c2ecf20Sopenharmony_ci		}
25758c2ecf20Sopenharmony_ci	} else {
25768c2ecf20Sopenharmony_ci		*nmaps = 0;
25778c2ecf20Sopenharmony_ci	}
25788c2ecf20Sopenharmony_ci	goto out_free_irecs;
25798c2ecf20Sopenharmony_ci}
25808c2ecf20Sopenharmony_ci
25818c2ecf20Sopenharmony_ci/*
25828c2ecf20Sopenharmony_ci * Get a buffer for the dir/attr block.
25838c2ecf20Sopenharmony_ci */
25848c2ecf20Sopenharmony_ciint
25858c2ecf20Sopenharmony_cixfs_da_get_buf(
25868c2ecf20Sopenharmony_ci	struct xfs_trans	*tp,
25878c2ecf20Sopenharmony_ci	struct xfs_inode	*dp,
25888c2ecf20Sopenharmony_ci	xfs_dablk_t		bno,
25898c2ecf20Sopenharmony_ci	struct xfs_buf		**bpp,
25908c2ecf20Sopenharmony_ci	int			whichfork)
25918c2ecf20Sopenharmony_ci{
25928c2ecf20Sopenharmony_ci	struct xfs_mount	*mp = dp->i_mount;
25938c2ecf20Sopenharmony_ci	struct xfs_buf		*bp;
25948c2ecf20Sopenharmony_ci	struct xfs_buf_map	map, *mapp = &map;
25958c2ecf20Sopenharmony_ci	int			nmap = 1;
25968c2ecf20Sopenharmony_ci	int			error;
25978c2ecf20Sopenharmony_ci
25988c2ecf20Sopenharmony_ci	*bpp = NULL;
25998c2ecf20Sopenharmony_ci	error = xfs_dabuf_map(dp, bno, 0, whichfork, &mapp, &nmap);
26008c2ecf20Sopenharmony_ci	if (error || nmap == 0)
26018c2ecf20Sopenharmony_ci		goto out_free;
26028c2ecf20Sopenharmony_ci
26038c2ecf20Sopenharmony_ci	error = xfs_trans_get_buf_map(tp, mp->m_ddev_targp, mapp, nmap, 0, &bp);
26048c2ecf20Sopenharmony_ci	if (error)
26058c2ecf20Sopenharmony_ci		goto out_free;
26068c2ecf20Sopenharmony_ci
26078c2ecf20Sopenharmony_ci	*bpp = bp;
26088c2ecf20Sopenharmony_ci
26098c2ecf20Sopenharmony_ciout_free:
26108c2ecf20Sopenharmony_ci	if (mapp != &map)
26118c2ecf20Sopenharmony_ci		kmem_free(mapp);
26128c2ecf20Sopenharmony_ci
26138c2ecf20Sopenharmony_ci	return error;
26148c2ecf20Sopenharmony_ci}
26158c2ecf20Sopenharmony_ci
26168c2ecf20Sopenharmony_ci/*
26178c2ecf20Sopenharmony_ci * Get a buffer for the dir/attr block, fill in the contents.
26188c2ecf20Sopenharmony_ci */
26198c2ecf20Sopenharmony_ciint
26208c2ecf20Sopenharmony_cixfs_da_read_buf(
26218c2ecf20Sopenharmony_ci	struct xfs_trans	*tp,
26228c2ecf20Sopenharmony_ci	struct xfs_inode	*dp,
26238c2ecf20Sopenharmony_ci	xfs_dablk_t		bno,
26248c2ecf20Sopenharmony_ci	unsigned int		flags,
26258c2ecf20Sopenharmony_ci	struct xfs_buf		**bpp,
26268c2ecf20Sopenharmony_ci	int			whichfork,
26278c2ecf20Sopenharmony_ci	const struct xfs_buf_ops *ops)
26288c2ecf20Sopenharmony_ci{
26298c2ecf20Sopenharmony_ci	struct xfs_mount	*mp = dp->i_mount;
26308c2ecf20Sopenharmony_ci	struct xfs_buf		*bp;
26318c2ecf20Sopenharmony_ci	struct xfs_buf_map	map, *mapp = &map;
26328c2ecf20Sopenharmony_ci	int			nmap = 1;
26338c2ecf20Sopenharmony_ci	int			error;
26348c2ecf20Sopenharmony_ci
26358c2ecf20Sopenharmony_ci	*bpp = NULL;
26368c2ecf20Sopenharmony_ci	error = xfs_dabuf_map(dp, bno, flags, whichfork, &mapp, &nmap);
26378c2ecf20Sopenharmony_ci	if (error || !nmap)
26388c2ecf20Sopenharmony_ci		goto out_free;
26398c2ecf20Sopenharmony_ci
26408c2ecf20Sopenharmony_ci	error = xfs_trans_read_buf_map(mp, tp, mp->m_ddev_targp, mapp, nmap, 0,
26418c2ecf20Sopenharmony_ci			&bp, ops);
26428c2ecf20Sopenharmony_ci	if (error)
26438c2ecf20Sopenharmony_ci		goto out_free;
26448c2ecf20Sopenharmony_ci
26458c2ecf20Sopenharmony_ci	if (whichfork == XFS_ATTR_FORK)
26468c2ecf20Sopenharmony_ci		xfs_buf_set_ref(bp, XFS_ATTR_BTREE_REF);
26478c2ecf20Sopenharmony_ci	else
26488c2ecf20Sopenharmony_ci		xfs_buf_set_ref(bp, XFS_DIR_BTREE_REF);
26498c2ecf20Sopenharmony_ci	*bpp = bp;
26508c2ecf20Sopenharmony_ciout_free:
26518c2ecf20Sopenharmony_ci	if (mapp != &map)
26528c2ecf20Sopenharmony_ci		kmem_free(mapp);
26538c2ecf20Sopenharmony_ci
26548c2ecf20Sopenharmony_ci	return error;
26558c2ecf20Sopenharmony_ci}
26568c2ecf20Sopenharmony_ci
26578c2ecf20Sopenharmony_ci/*
26588c2ecf20Sopenharmony_ci * Readahead the dir/attr block.
26598c2ecf20Sopenharmony_ci */
26608c2ecf20Sopenharmony_ciint
26618c2ecf20Sopenharmony_cixfs_da_reada_buf(
26628c2ecf20Sopenharmony_ci	struct xfs_inode	*dp,
26638c2ecf20Sopenharmony_ci	xfs_dablk_t		bno,
26648c2ecf20Sopenharmony_ci	unsigned int		flags,
26658c2ecf20Sopenharmony_ci	int			whichfork,
26668c2ecf20Sopenharmony_ci	const struct xfs_buf_ops *ops)
26678c2ecf20Sopenharmony_ci{
26688c2ecf20Sopenharmony_ci	struct xfs_buf_map	map;
26698c2ecf20Sopenharmony_ci	struct xfs_buf_map	*mapp;
26708c2ecf20Sopenharmony_ci	int			nmap;
26718c2ecf20Sopenharmony_ci	int			error;
26728c2ecf20Sopenharmony_ci
26738c2ecf20Sopenharmony_ci	mapp = &map;
26748c2ecf20Sopenharmony_ci	nmap = 1;
26758c2ecf20Sopenharmony_ci	error = xfs_dabuf_map(dp, bno, flags, whichfork, &mapp, &nmap);
26768c2ecf20Sopenharmony_ci	if (error || !nmap)
26778c2ecf20Sopenharmony_ci		goto out_free;
26788c2ecf20Sopenharmony_ci
26798c2ecf20Sopenharmony_ci	xfs_buf_readahead_map(dp->i_mount->m_ddev_targp, mapp, nmap, ops);
26808c2ecf20Sopenharmony_ci
26818c2ecf20Sopenharmony_ciout_free:
26828c2ecf20Sopenharmony_ci	if (mapp != &map)
26838c2ecf20Sopenharmony_ci		kmem_free(mapp);
26848c2ecf20Sopenharmony_ci
26858c2ecf20Sopenharmony_ci	return error;
26868c2ecf20Sopenharmony_ci}
2687