162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0
262306a36Sopenharmony_ci
362306a36Sopenharmony_ci#include "misc.h"
462306a36Sopenharmony_ci#include "ctree.h"
562306a36Sopenharmony_ci#include "block-rsv.h"
662306a36Sopenharmony_ci#include "space-info.h"
762306a36Sopenharmony_ci#include "transaction.h"
862306a36Sopenharmony_ci#include "block-group.h"
962306a36Sopenharmony_ci#include "disk-io.h"
1062306a36Sopenharmony_ci#include "fs.h"
1162306a36Sopenharmony_ci#include "accessors.h"
1262306a36Sopenharmony_ci
1362306a36Sopenharmony_ci/*
1462306a36Sopenharmony_ci * HOW DO BLOCK RESERVES WORK
1562306a36Sopenharmony_ci *
1662306a36Sopenharmony_ci *   Think of block_rsv's as buckets for logically grouped metadata
1762306a36Sopenharmony_ci *   reservations.  Each block_rsv has a ->size and a ->reserved.  ->size is
1862306a36Sopenharmony_ci *   how large we want our block rsv to be, ->reserved is how much space is
1962306a36Sopenharmony_ci *   currently reserved for this block reserve.
2062306a36Sopenharmony_ci *
2162306a36Sopenharmony_ci *   ->failfast exists for the truncate case, and is described below.
2262306a36Sopenharmony_ci *
2362306a36Sopenharmony_ci * NORMAL OPERATION
2462306a36Sopenharmony_ci *
2562306a36Sopenharmony_ci *   -> Reserve
2662306a36Sopenharmony_ci *     Entrance: btrfs_block_rsv_add, btrfs_block_rsv_refill
2762306a36Sopenharmony_ci *
2862306a36Sopenharmony_ci *     We call into btrfs_reserve_metadata_bytes() with our bytes, which is
2962306a36Sopenharmony_ci *     accounted for in space_info->bytes_may_use, and then add the bytes to
3062306a36Sopenharmony_ci *     ->reserved, and ->size in the case of btrfs_block_rsv_add.
3162306a36Sopenharmony_ci *
3262306a36Sopenharmony_ci *     ->size is an over-estimation of how much we may use for a particular
3362306a36Sopenharmony_ci *     operation.
3462306a36Sopenharmony_ci *
3562306a36Sopenharmony_ci *   -> Use
3662306a36Sopenharmony_ci *     Entrance: btrfs_use_block_rsv
3762306a36Sopenharmony_ci *
3862306a36Sopenharmony_ci *     When we do a btrfs_alloc_tree_block() we call into btrfs_use_block_rsv()
3962306a36Sopenharmony_ci *     to determine the appropriate block_rsv to use, and then verify that
4062306a36Sopenharmony_ci *     ->reserved has enough space for our tree block allocation.  Once
4162306a36Sopenharmony_ci *     successful we subtract fs_info->nodesize from ->reserved.
4262306a36Sopenharmony_ci *
4362306a36Sopenharmony_ci *   -> Finish
4462306a36Sopenharmony_ci *     Entrance: btrfs_block_rsv_release
4562306a36Sopenharmony_ci *
4662306a36Sopenharmony_ci *     We are finished with our operation, subtract our individual reservation
4762306a36Sopenharmony_ci *     from ->size, and then subtract ->size from ->reserved and free up the
4862306a36Sopenharmony_ci *     excess if there is any.
4962306a36Sopenharmony_ci *
5062306a36Sopenharmony_ci *     There is some logic here to refill the delayed refs rsv or the global rsv
5162306a36Sopenharmony_ci *     as needed, otherwise the excess is subtracted from
5262306a36Sopenharmony_ci *     space_info->bytes_may_use.
5362306a36Sopenharmony_ci *
5462306a36Sopenharmony_ci * TYPES OF BLOCK RESERVES
5562306a36Sopenharmony_ci *
5662306a36Sopenharmony_ci * BLOCK_RSV_TRANS, BLOCK_RSV_DELOPS, BLOCK_RSV_CHUNK
5762306a36Sopenharmony_ci *   These behave normally, as described above, just within the confines of the
5862306a36Sopenharmony_ci *   lifetime of their particular operation (transaction for the whole trans
5962306a36Sopenharmony_ci *   handle lifetime, for example).
6062306a36Sopenharmony_ci *
6162306a36Sopenharmony_ci * BLOCK_RSV_GLOBAL
6262306a36Sopenharmony_ci *   It is impossible to properly account for all the space that may be required
6362306a36Sopenharmony_ci *   to make our extent tree updates.  This block reserve acts as an overflow
6462306a36Sopenharmony_ci *   buffer in case our delayed refs reserve does not reserve enough space to
6562306a36Sopenharmony_ci *   update the extent tree.
6662306a36Sopenharmony_ci *
6762306a36Sopenharmony_ci *   We can steal from this in some cases as well, notably on evict() or
6862306a36Sopenharmony_ci *   truncate() in order to help users recover from ENOSPC conditions.
6962306a36Sopenharmony_ci *
7062306a36Sopenharmony_ci * BLOCK_RSV_DELALLOC
7162306a36Sopenharmony_ci *   The individual item sizes are determined by the per-inode size
7262306a36Sopenharmony_ci *   calculations, which are described with the delalloc code.  This is pretty
7362306a36Sopenharmony_ci *   straightforward, it's just the calculation of ->size encodes a lot of
7462306a36Sopenharmony_ci *   different items, and thus it gets used when updating inodes, inserting file
7562306a36Sopenharmony_ci *   extents, and inserting checksums.
7662306a36Sopenharmony_ci *
7762306a36Sopenharmony_ci * BLOCK_RSV_DELREFS
7862306a36Sopenharmony_ci *   We keep a running tally of how many delayed refs we have on the system.
 *   We assume each one of these delayed refs is going to use a full
 *   reservation.  We use the transaction items and pre-reserve space for every
8162306a36Sopenharmony_ci *   operation, and use this reservation to refill any gap between ->size and
8262306a36Sopenharmony_ci *   ->reserved that may exist.
8362306a36Sopenharmony_ci *
8462306a36Sopenharmony_ci *   From there it's straightforward, removing a delayed ref means we remove its
8562306a36Sopenharmony_ci *   count from ->size and free up reservations as necessary.  Since this is
8662306a36Sopenharmony_ci *   the most dynamic block reserve in the system, we will try to refill this
8762306a36Sopenharmony_ci *   block reserve first with any excess returned by any other block reserve.
8862306a36Sopenharmony_ci *
8962306a36Sopenharmony_ci * BLOCK_RSV_EMPTY
9062306a36Sopenharmony_ci *   This is the fallback block reserve to make us try to reserve space if we
9162306a36Sopenharmony_ci *   don't have a specific bucket for this allocation.  It is mostly used for
9262306a36Sopenharmony_ci *   updating the device tree and such, since that is a separate pool we're
9362306a36Sopenharmony_ci *   content to just reserve space from the space_info on demand.
9462306a36Sopenharmony_ci *
9562306a36Sopenharmony_ci * BLOCK_RSV_TEMP
9662306a36Sopenharmony_ci *   This is used by things like truncate and iput.  We will temporarily
9762306a36Sopenharmony_ci *   allocate a block reserve, set it to some size, and then truncate bytes
9862306a36Sopenharmony_ci *   until we have no space left.  With ->failfast set we'll simply return
9962306a36Sopenharmony_ci *   ENOSPC from btrfs_use_block_rsv() to signal that we need to unwind and try
10062306a36Sopenharmony_ci *   to make a new reservation.  This is because these operations are
10162306a36Sopenharmony_ci *   unbounded, so we want to do as much work as we can, and then back off and
10262306a36Sopenharmony_ci *   re-reserve.
10362306a36Sopenharmony_ci */
10462306a36Sopenharmony_ci
10562306a36Sopenharmony_cistatic u64 block_rsv_release_bytes(struct btrfs_fs_info *fs_info,
10662306a36Sopenharmony_ci				    struct btrfs_block_rsv *block_rsv,
10762306a36Sopenharmony_ci				    struct btrfs_block_rsv *dest, u64 num_bytes,
10862306a36Sopenharmony_ci				    u64 *qgroup_to_release_ret)
10962306a36Sopenharmony_ci{
11062306a36Sopenharmony_ci	struct btrfs_space_info *space_info = block_rsv->space_info;
11162306a36Sopenharmony_ci	u64 qgroup_to_release = 0;
11262306a36Sopenharmony_ci	u64 ret;
11362306a36Sopenharmony_ci
11462306a36Sopenharmony_ci	spin_lock(&block_rsv->lock);
11562306a36Sopenharmony_ci	if (num_bytes == (u64)-1) {
11662306a36Sopenharmony_ci		num_bytes = block_rsv->size;
11762306a36Sopenharmony_ci		qgroup_to_release = block_rsv->qgroup_rsv_size;
11862306a36Sopenharmony_ci	}
11962306a36Sopenharmony_ci	block_rsv->size -= num_bytes;
12062306a36Sopenharmony_ci	if (block_rsv->reserved >= block_rsv->size) {
12162306a36Sopenharmony_ci		num_bytes = block_rsv->reserved - block_rsv->size;
12262306a36Sopenharmony_ci		block_rsv->reserved = block_rsv->size;
12362306a36Sopenharmony_ci		block_rsv->full = true;
12462306a36Sopenharmony_ci	} else {
12562306a36Sopenharmony_ci		num_bytes = 0;
12662306a36Sopenharmony_ci	}
12762306a36Sopenharmony_ci	if (qgroup_to_release_ret &&
12862306a36Sopenharmony_ci	    block_rsv->qgroup_rsv_reserved >= block_rsv->qgroup_rsv_size) {
12962306a36Sopenharmony_ci		qgroup_to_release = block_rsv->qgroup_rsv_reserved -
13062306a36Sopenharmony_ci				    block_rsv->qgroup_rsv_size;
13162306a36Sopenharmony_ci		block_rsv->qgroup_rsv_reserved = block_rsv->qgroup_rsv_size;
13262306a36Sopenharmony_ci	} else {
13362306a36Sopenharmony_ci		qgroup_to_release = 0;
13462306a36Sopenharmony_ci	}
13562306a36Sopenharmony_ci	spin_unlock(&block_rsv->lock);
13662306a36Sopenharmony_ci
13762306a36Sopenharmony_ci	ret = num_bytes;
13862306a36Sopenharmony_ci	if (num_bytes > 0) {
13962306a36Sopenharmony_ci		if (dest) {
14062306a36Sopenharmony_ci			spin_lock(&dest->lock);
14162306a36Sopenharmony_ci			if (!dest->full) {
14262306a36Sopenharmony_ci				u64 bytes_to_add;
14362306a36Sopenharmony_ci
14462306a36Sopenharmony_ci				bytes_to_add = dest->size - dest->reserved;
14562306a36Sopenharmony_ci				bytes_to_add = min(num_bytes, bytes_to_add);
14662306a36Sopenharmony_ci				dest->reserved += bytes_to_add;
14762306a36Sopenharmony_ci				if (dest->reserved >= dest->size)
14862306a36Sopenharmony_ci					dest->full = true;
14962306a36Sopenharmony_ci				num_bytes -= bytes_to_add;
15062306a36Sopenharmony_ci			}
15162306a36Sopenharmony_ci			spin_unlock(&dest->lock);
15262306a36Sopenharmony_ci		}
15362306a36Sopenharmony_ci		if (num_bytes)
15462306a36Sopenharmony_ci			btrfs_space_info_free_bytes_may_use(fs_info,
15562306a36Sopenharmony_ci							    space_info,
15662306a36Sopenharmony_ci							    num_bytes);
15762306a36Sopenharmony_ci	}
15862306a36Sopenharmony_ci	if (qgroup_to_release_ret)
15962306a36Sopenharmony_ci		*qgroup_to_release_ret = qgroup_to_release;
16062306a36Sopenharmony_ci	return ret;
16162306a36Sopenharmony_ci}
16262306a36Sopenharmony_ci
16362306a36Sopenharmony_ciint btrfs_block_rsv_migrate(struct btrfs_block_rsv *src,
16462306a36Sopenharmony_ci			    struct btrfs_block_rsv *dst, u64 num_bytes,
16562306a36Sopenharmony_ci			    bool update_size)
16662306a36Sopenharmony_ci{
16762306a36Sopenharmony_ci	int ret;
16862306a36Sopenharmony_ci
16962306a36Sopenharmony_ci	ret = btrfs_block_rsv_use_bytes(src, num_bytes);
17062306a36Sopenharmony_ci	if (ret)
17162306a36Sopenharmony_ci		return ret;
17262306a36Sopenharmony_ci
17362306a36Sopenharmony_ci	btrfs_block_rsv_add_bytes(dst, num_bytes, update_size);
17462306a36Sopenharmony_ci	return 0;
17562306a36Sopenharmony_ci}
17662306a36Sopenharmony_ci
17762306a36Sopenharmony_civoid btrfs_init_block_rsv(struct btrfs_block_rsv *rsv, enum btrfs_rsv_type type)
17862306a36Sopenharmony_ci{
17962306a36Sopenharmony_ci	memset(rsv, 0, sizeof(*rsv));
18062306a36Sopenharmony_ci	spin_lock_init(&rsv->lock);
18162306a36Sopenharmony_ci	rsv->type = type;
18262306a36Sopenharmony_ci}
18362306a36Sopenharmony_ci
18462306a36Sopenharmony_civoid btrfs_init_metadata_block_rsv(struct btrfs_fs_info *fs_info,
18562306a36Sopenharmony_ci				   struct btrfs_block_rsv *rsv,
18662306a36Sopenharmony_ci				   enum btrfs_rsv_type type)
18762306a36Sopenharmony_ci{
18862306a36Sopenharmony_ci	btrfs_init_block_rsv(rsv, type);
18962306a36Sopenharmony_ci	rsv->space_info = btrfs_find_space_info(fs_info,
19062306a36Sopenharmony_ci					    BTRFS_BLOCK_GROUP_METADATA);
19162306a36Sopenharmony_ci}
19262306a36Sopenharmony_ci
19362306a36Sopenharmony_cistruct btrfs_block_rsv *btrfs_alloc_block_rsv(struct btrfs_fs_info *fs_info,
19462306a36Sopenharmony_ci					      enum btrfs_rsv_type type)
19562306a36Sopenharmony_ci{
19662306a36Sopenharmony_ci	struct btrfs_block_rsv *block_rsv;
19762306a36Sopenharmony_ci
19862306a36Sopenharmony_ci	block_rsv = kmalloc(sizeof(*block_rsv), GFP_NOFS);
19962306a36Sopenharmony_ci	if (!block_rsv)
20062306a36Sopenharmony_ci		return NULL;
20162306a36Sopenharmony_ci
20262306a36Sopenharmony_ci	btrfs_init_metadata_block_rsv(fs_info, block_rsv, type);
20362306a36Sopenharmony_ci	return block_rsv;
20462306a36Sopenharmony_ci}
20562306a36Sopenharmony_ci
20662306a36Sopenharmony_civoid btrfs_free_block_rsv(struct btrfs_fs_info *fs_info,
20762306a36Sopenharmony_ci			  struct btrfs_block_rsv *rsv)
20862306a36Sopenharmony_ci{
20962306a36Sopenharmony_ci	if (!rsv)
21062306a36Sopenharmony_ci		return;
21162306a36Sopenharmony_ci	btrfs_block_rsv_release(fs_info, rsv, (u64)-1, NULL);
21262306a36Sopenharmony_ci	kfree(rsv);
21362306a36Sopenharmony_ci}
21462306a36Sopenharmony_ci
21562306a36Sopenharmony_ciint btrfs_block_rsv_add(struct btrfs_fs_info *fs_info,
21662306a36Sopenharmony_ci			struct btrfs_block_rsv *block_rsv, u64 num_bytes,
21762306a36Sopenharmony_ci			enum btrfs_reserve_flush_enum flush)
21862306a36Sopenharmony_ci{
21962306a36Sopenharmony_ci	int ret;
22062306a36Sopenharmony_ci
22162306a36Sopenharmony_ci	if (num_bytes == 0)
22262306a36Sopenharmony_ci		return 0;
22362306a36Sopenharmony_ci
22462306a36Sopenharmony_ci	ret = btrfs_reserve_metadata_bytes(fs_info, block_rsv, num_bytes, flush);
22562306a36Sopenharmony_ci	if (!ret)
22662306a36Sopenharmony_ci		btrfs_block_rsv_add_bytes(block_rsv, num_bytes, true);
22762306a36Sopenharmony_ci
22862306a36Sopenharmony_ci	return ret;
22962306a36Sopenharmony_ci}
23062306a36Sopenharmony_ci
23162306a36Sopenharmony_ciint btrfs_block_rsv_check(struct btrfs_block_rsv *block_rsv, int min_percent)
23262306a36Sopenharmony_ci{
23362306a36Sopenharmony_ci	u64 num_bytes = 0;
23462306a36Sopenharmony_ci	int ret = -ENOSPC;
23562306a36Sopenharmony_ci
23662306a36Sopenharmony_ci	spin_lock(&block_rsv->lock);
23762306a36Sopenharmony_ci	num_bytes = mult_perc(block_rsv->size, min_percent);
23862306a36Sopenharmony_ci	if (block_rsv->reserved >= num_bytes)
23962306a36Sopenharmony_ci		ret = 0;
24062306a36Sopenharmony_ci	spin_unlock(&block_rsv->lock);
24162306a36Sopenharmony_ci
24262306a36Sopenharmony_ci	return ret;
24362306a36Sopenharmony_ci}
24462306a36Sopenharmony_ci
24562306a36Sopenharmony_ciint btrfs_block_rsv_refill(struct btrfs_fs_info *fs_info,
24662306a36Sopenharmony_ci			   struct btrfs_block_rsv *block_rsv, u64 num_bytes,
24762306a36Sopenharmony_ci			   enum btrfs_reserve_flush_enum flush)
24862306a36Sopenharmony_ci{
24962306a36Sopenharmony_ci	int ret = -ENOSPC;
25062306a36Sopenharmony_ci
25162306a36Sopenharmony_ci	if (!block_rsv)
25262306a36Sopenharmony_ci		return 0;
25362306a36Sopenharmony_ci
25462306a36Sopenharmony_ci	spin_lock(&block_rsv->lock);
25562306a36Sopenharmony_ci	if (block_rsv->reserved >= num_bytes)
25662306a36Sopenharmony_ci		ret = 0;
25762306a36Sopenharmony_ci	else
25862306a36Sopenharmony_ci		num_bytes -= block_rsv->reserved;
25962306a36Sopenharmony_ci	spin_unlock(&block_rsv->lock);
26062306a36Sopenharmony_ci
26162306a36Sopenharmony_ci	if (!ret)
26262306a36Sopenharmony_ci		return 0;
26362306a36Sopenharmony_ci
26462306a36Sopenharmony_ci	ret = btrfs_reserve_metadata_bytes(fs_info, block_rsv, num_bytes, flush);
26562306a36Sopenharmony_ci	if (!ret) {
26662306a36Sopenharmony_ci		btrfs_block_rsv_add_bytes(block_rsv, num_bytes, false);
26762306a36Sopenharmony_ci		return 0;
26862306a36Sopenharmony_ci	}
26962306a36Sopenharmony_ci
27062306a36Sopenharmony_ci	return ret;
27162306a36Sopenharmony_ci}
27262306a36Sopenharmony_ci
27362306a36Sopenharmony_ciu64 btrfs_block_rsv_release(struct btrfs_fs_info *fs_info,
27462306a36Sopenharmony_ci			    struct btrfs_block_rsv *block_rsv, u64 num_bytes,
27562306a36Sopenharmony_ci			    u64 *qgroup_to_release)
27662306a36Sopenharmony_ci{
27762306a36Sopenharmony_ci	struct btrfs_block_rsv *global_rsv = &fs_info->global_block_rsv;
27862306a36Sopenharmony_ci	struct btrfs_block_rsv *delayed_rsv = &fs_info->delayed_refs_rsv;
27962306a36Sopenharmony_ci	struct btrfs_block_rsv *target = NULL;
28062306a36Sopenharmony_ci
28162306a36Sopenharmony_ci	/*
28262306a36Sopenharmony_ci	 * If we are the delayed_rsv then push to the global rsv, otherwise dump
28362306a36Sopenharmony_ci	 * into the delayed rsv if it is not full.
28462306a36Sopenharmony_ci	 */
28562306a36Sopenharmony_ci	if (block_rsv == delayed_rsv)
28662306a36Sopenharmony_ci		target = global_rsv;
28762306a36Sopenharmony_ci	else if (block_rsv != global_rsv && !btrfs_block_rsv_full(delayed_rsv))
28862306a36Sopenharmony_ci		target = delayed_rsv;
28962306a36Sopenharmony_ci
29062306a36Sopenharmony_ci	if (target && block_rsv->space_info != target->space_info)
29162306a36Sopenharmony_ci		target = NULL;
29262306a36Sopenharmony_ci
29362306a36Sopenharmony_ci	return block_rsv_release_bytes(fs_info, block_rsv, target, num_bytes,
29462306a36Sopenharmony_ci				       qgroup_to_release);
29562306a36Sopenharmony_ci}
29662306a36Sopenharmony_ci
29762306a36Sopenharmony_ciint btrfs_block_rsv_use_bytes(struct btrfs_block_rsv *block_rsv, u64 num_bytes)
29862306a36Sopenharmony_ci{
29962306a36Sopenharmony_ci	int ret = -ENOSPC;
30062306a36Sopenharmony_ci
30162306a36Sopenharmony_ci	spin_lock(&block_rsv->lock);
30262306a36Sopenharmony_ci	if (block_rsv->reserved >= num_bytes) {
30362306a36Sopenharmony_ci		block_rsv->reserved -= num_bytes;
30462306a36Sopenharmony_ci		if (block_rsv->reserved < block_rsv->size)
30562306a36Sopenharmony_ci			block_rsv->full = false;
30662306a36Sopenharmony_ci		ret = 0;
30762306a36Sopenharmony_ci	}
30862306a36Sopenharmony_ci	spin_unlock(&block_rsv->lock);
30962306a36Sopenharmony_ci	return ret;
31062306a36Sopenharmony_ci}
31162306a36Sopenharmony_ci
31262306a36Sopenharmony_civoid btrfs_block_rsv_add_bytes(struct btrfs_block_rsv *block_rsv,
31362306a36Sopenharmony_ci			       u64 num_bytes, bool update_size)
31462306a36Sopenharmony_ci{
31562306a36Sopenharmony_ci	spin_lock(&block_rsv->lock);
31662306a36Sopenharmony_ci	block_rsv->reserved += num_bytes;
31762306a36Sopenharmony_ci	if (update_size)
31862306a36Sopenharmony_ci		block_rsv->size += num_bytes;
31962306a36Sopenharmony_ci	else if (block_rsv->reserved >= block_rsv->size)
32062306a36Sopenharmony_ci		block_rsv->full = true;
32162306a36Sopenharmony_ci	spin_unlock(&block_rsv->lock);
32262306a36Sopenharmony_ci}
32362306a36Sopenharmony_ci
32462306a36Sopenharmony_civoid btrfs_update_global_block_rsv(struct btrfs_fs_info *fs_info)
32562306a36Sopenharmony_ci{
32662306a36Sopenharmony_ci	struct btrfs_block_rsv *block_rsv = &fs_info->global_block_rsv;
32762306a36Sopenharmony_ci	struct btrfs_space_info *sinfo = block_rsv->space_info;
32862306a36Sopenharmony_ci	struct btrfs_root *root, *tmp;
32962306a36Sopenharmony_ci	u64 num_bytes = btrfs_root_used(&fs_info->tree_root->root_item);
33062306a36Sopenharmony_ci	unsigned int min_items = 1;
33162306a36Sopenharmony_ci
33262306a36Sopenharmony_ci	/*
33362306a36Sopenharmony_ci	 * The global block rsv is based on the size of the extent tree, the
33462306a36Sopenharmony_ci	 * checksum tree and the root tree.  If the fs is empty we want to set
33562306a36Sopenharmony_ci	 * it to a minimal amount for safety.
33662306a36Sopenharmony_ci	 *
33762306a36Sopenharmony_ci	 * We also are going to need to modify the minimum of the tree root and
33862306a36Sopenharmony_ci	 * any global roots we could touch.
33962306a36Sopenharmony_ci	 */
34062306a36Sopenharmony_ci	read_lock(&fs_info->global_root_lock);
34162306a36Sopenharmony_ci	rbtree_postorder_for_each_entry_safe(root, tmp, &fs_info->global_root_tree,
34262306a36Sopenharmony_ci					     rb_node) {
34362306a36Sopenharmony_ci		if (root->root_key.objectid == BTRFS_EXTENT_TREE_OBJECTID ||
34462306a36Sopenharmony_ci		    root->root_key.objectid == BTRFS_CSUM_TREE_OBJECTID ||
34562306a36Sopenharmony_ci		    root->root_key.objectid == BTRFS_FREE_SPACE_TREE_OBJECTID) {
34662306a36Sopenharmony_ci			num_bytes += btrfs_root_used(&root->root_item);
34762306a36Sopenharmony_ci			min_items++;
34862306a36Sopenharmony_ci		}
34962306a36Sopenharmony_ci	}
35062306a36Sopenharmony_ci	read_unlock(&fs_info->global_root_lock);
35162306a36Sopenharmony_ci
35262306a36Sopenharmony_ci	if (btrfs_fs_compat_ro(fs_info, BLOCK_GROUP_TREE)) {
35362306a36Sopenharmony_ci		num_bytes += btrfs_root_used(&fs_info->block_group_root->root_item);
35462306a36Sopenharmony_ci		min_items++;
35562306a36Sopenharmony_ci	}
35662306a36Sopenharmony_ci
35762306a36Sopenharmony_ci	/*
35862306a36Sopenharmony_ci	 * But we also want to reserve enough space so we can do the fallback
35962306a36Sopenharmony_ci	 * global reserve for an unlink, which is an additional
36062306a36Sopenharmony_ci	 * BTRFS_UNLINK_METADATA_UNITS items.
36162306a36Sopenharmony_ci	 *
36262306a36Sopenharmony_ci	 * But we also need space for the delayed ref updates from the unlink,
36362306a36Sopenharmony_ci	 * so add BTRFS_UNLINK_METADATA_UNITS units for delayed refs, one for
36462306a36Sopenharmony_ci	 * each unlink metadata item.
36562306a36Sopenharmony_ci	 */
36662306a36Sopenharmony_ci	min_items += BTRFS_UNLINK_METADATA_UNITS;
36762306a36Sopenharmony_ci
36862306a36Sopenharmony_ci	num_bytes = max_t(u64, num_bytes,
36962306a36Sopenharmony_ci			  btrfs_calc_insert_metadata_size(fs_info, min_items) +
37062306a36Sopenharmony_ci			  btrfs_calc_delayed_ref_bytes(fs_info,
37162306a36Sopenharmony_ci					       BTRFS_UNLINK_METADATA_UNITS));
37262306a36Sopenharmony_ci
37362306a36Sopenharmony_ci	spin_lock(&sinfo->lock);
37462306a36Sopenharmony_ci	spin_lock(&block_rsv->lock);
37562306a36Sopenharmony_ci
37662306a36Sopenharmony_ci	block_rsv->size = min_t(u64, num_bytes, SZ_512M);
37762306a36Sopenharmony_ci
37862306a36Sopenharmony_ci	if (block_rsv->reserved < block_rsv->size) {
37962306a36Sopenharmony_ci		num_bytes = block_rsv->size - block_rsv->reserved;
38062306a36Sopenharmony_ci		btrfs_space_info_update_bytes_may_use(fs_info, sinfo,
38162306a36Sopenharmony_ci						      num_bytes);
38262306a36Sopenharmony_ci		block_rsv->reserved = block_rsv->size;
38362306a36Sopenharmony_ci	} else if (block_rsv->reserved > block_rsv->size) {
38462306a36Sopenharmony_ci		num_bytes = block_rsv->reserved - block_rsv->size;
38562306a36Sopenharmony_ci		btrfs_space_info_update_bytes_may_use(fs_info, sinfo,
38662306a36Sopenharmony_ci						      -num_bytes);
38762306a36Sopenharmony_ci		block_rsv->reserved = block_rsv->size;
38862306a36Sopenharmony_ci		btrfs_try_granting_tickets(fs_info, sinfo);
38962306a36Sopenharmony_ci	}
39062306a36Sopenharmony_ci
39162306a36Sopenharmony_ci	block_rsv->full = (block_rsv->reserved == block_rsv->size);
39262306a36Sopenharmony_ci
39362306a36Sopenharmony_ci	if (block_rsv->size >= sinfo->total_bytes)
39462306a36Sopenharmony_ci		sinfo->force_alloc = CHUNK_ALLOC_FORCE;
39562306a36Sopenharmony_ci	spin_unlock(&block_rsv->lock);
39662306a36Sopenharmony_ci	spin_unlock(&sinfo->lock);
39762306a36Sopenharmony_ci}
39862306a36Sopenharmony_ci
39962306a36Sopenharmony_civoid btrfs_init_root_block_rsv(struct btrfs_root *root)
40062306a36Sopenharmony_ci{
40162306a36Sopenharmony_ci	struct btrfs_fs_info *fs_info = root->fs_info;
40262306a36Sopenharmony_ci
40362306a36Sopenharmony_ci	switch (root->root_key.objectid) {
40462306a36Sopenharmony_ci	case BTRFS_CSUM_TREE_OBJECTID:
40562306a36Sopenharmony_ci	case BTRFS_EXTENT_TREE_OBJECTID:
40662306a36Sopenharmony_ci	case BTRFS_FREE_SPACE_TREE_OBJECTID:
40762306a36Sopenharmony_ci	case BTRFS_BLOCK_GROUP_TREE_OBJECTID:
40862306a36Sopenharmony_ci		root->block_rsv = &fs_info->delayed_refs_rsv;
40962306a36Sopenharmony_ci		break;
41062306a36Sopenharmony_ci	case BTRFS_ROOT_TREE_OBJECTID:
41162306a36Sopenharmony_ci	case BTRFS_DEV_TREE_OBJECTID:
41262306a36Sopenharmony_ci	case BTRFS_QUOTA_TREE_OBJECTID:
41362306a36Sopenharmony_ci		root->block_rsv = &fs_info->global_block_rsv;
41462306a36Sopenharmony_ci		break;
41562306a36Sopenharmony_ci	case BTRFS_CHUNK_TREE_OBJECTID:
41662306a36Sopenharmony_ci		root->block_rsv = &fs_info->chunk_block_rsv;
41762306a36Sopenharmony_ci		break;
41862306a36Sopenharmony_ci	default:
41962306a36Sopenharmony_ci		root->block_rsv = NULL;
42062306a36Sopenharmony_ci		break;
42162306a36Sopenharmony_ci	}
42262306a36Sopenharmony_ci}
42362306a36Sopenharmony_ci
42462306a36Sopenharmony_civoid btrfs_init_global_block_rsv(struct btrfs_fs_info *fs_info)
42562306a36Sopenharmony_ci{
42662306a36Sopenharmony_ci	struct btrfs_space_info *space_info;
42762306a36Sopenharmony_ci
42862306a36Sopenharmony_ci	space_info = btrfs_find_space_info(fs_info, BTRFS_BLOCK_GROUP_SYSTEM);
42962306a36Sopenharmony_ci	fs_info->chunk_block_rsv.space_info = space_info;
43062306a36Sopenharmony_ci
43162306a36Sopenharmony_ci	space_info = btrfs_find_space_info(fs_info, BTRFS_BLOCK_GROUP_METADATA);
43262306a36Sopenharmony_ci	fs_info->global_block_rsv.space_info = space_info;
43362306a36Sopenharmony_ci	fs_info->trans_block_rsv.space_info = space_info;
43462306a36Sopenharmony_ci	fs_info->empty_block_rsv.space_info = space_info;
43562306a36Sopenharmony_ci	fs_info->delayed_block_rsv.space_info = space_info;
43662306a36Sopenharmony_ci	fs_info->delayed_refs_rsv.space_info = space_info;
43762306a36Sopenharmony_ci
43862306a36Sopenharmony_ci	btrfs_update_global_block_rsv(fs_info);
43962306a36Sopenharmony_ci}
44062306a36Sopenharmony_ci
44162306a36Sopenharmony_civoid btrfs_release_global_block_rsv(struct btrfs_fs_info *fs_info)
44262306a36Sopenharmony_ci{
44362306a36Sopenharmony_ci	btrfs_block_rsv_release(fs_info, &fs_info->global_block_rsv, (u64)-1,
44462306a36Sopenharmony_ci				NULL);
44562306a36Sopenharmony_ci	WARN_ON(fs_info->trans_block_rsv.size > 0);
44662306a36Sopenharmony_ci	WARN_ON(fs_info->trans_block_rsv.reserved > 0);
44762306a36Sopenharmony_ci	WARN_ON(fs_info->chunk_block_rsv.size > 0);
44862306a36Sopenharmony_ci	WARN_ON(fs_info->chunk_block_rsv.reserved > 0);
44962306a36Sopenharmony_ci	WARN_ON(fs_info->delayed_block_rsv.size > 0);
45062306a36Sopenharmony_ci	WARN_ON(fs_info->delayed_block_rsv.reserved > 0);
45162306a36Sopenharmony_ci	WARN_ON(fs_info->delayed_refs_rsv.reserved > 0);
45262306a36Sopenharmony_ci	WARN_ON(fs_info->delayed_refs_rsv.size > 0);
45362306a36Sopenharmony_ci}
45462306a36Sopenharmony_ci
45562306a36Sopenharmony_cistatic struct btrfs_block_rsv *get_block_rsv(
45662306a36Sopenharmony_ci					const struct btrfs_trans_handle *trans,
45762306a36Sopenharmony_ci					const struct btrfs_root *root)
45862306a36Sopenharmony_ci{
45962306a36Sopenharmony_ci	struct btrfs_fs_info *fs_info = root->fs_info;
46062306a36Sopenharmony_ci	struct btrfs_block_rsv *block_rsv = NULL;
46162306a36Sopenharmony_ci
46262306a36Sopenharmony_ci	if (test_bit(BTRFS_ROOT_SHAREABLE, &root->state) ||
46362306a36Sopenharmony_ci	    (root == fs_info->uuid_root) ||
46462306a36Sopenharmony_ci	    (trans->adding_csums &&
46562306a36Sopenharmony_ci	     root->root_key.objectid == BTRFS_CSUM_TREE_OBJECTID))
46662306a36Sopenharmony_ci		block_rsv = trans->block_rsv;
46762306a36Sopenharmony_ci
46862306a36Sopenharmony_ci	if (!block_rsv)
46962306a36Sopenharmony_ci		block_rsv = root->block_rsv;
47062306a36Sopenharmony_ci
47162306a36Sopenharmony_ci	if (!block_rsv)
47262306a36Sopenharmony_ci		block_rsv = &fs_info->empty_block_rsv;
47362306a36Sopenharmony_ci
47462306a36Sopenharmony_ci	return block_rsv;
47562306a36Sopenharmony_ci}
47662306a36Sopenharmony_ci
47762306a36Sopenharmony_cistruct btrfs_block_rsv *btrfs_use_block_rsv(struct btrfs_trans_handle *trans,
47862306a36Sopenharmony_ci					    struct btrfs_root *root,
47962306a36Sopenharmony_ci					    u32 blocksize)
48062306a36Sopenharmony_ci{
48162306a36Sopenharmony_ci	struct btrfs_fs_info *fs_info = root->fs_info;
48262306a36Sopenharmony_ci	struct btrfs_block_rsv *block_rsv;
48362306a36Sopenharmony_ci	struct btrfs_block_rsv *global_rsv = &fs_info->global_block_rsv;
48462306a36Sopenharmony_ci	int ret;
48562306a36Sopenharmony_ci	bool global_updated = false;
48662306a36Sopenharmony_ci
48762306a36Sopenharmony_ci	block_rsv = get_block_rsv(trans, root);
48862306a36Sopenharmony_ci
48962306a36Sopenharmony_ci	if (unlikely(btrfs_block_rsv_size(block_rsv) == 0))
49062306a36Sopenharmony_ci		goto try_reserve;
49162306a36Sopenharmony_ciagain:
49262306a36Sopenharmony_ci	ret = btrfs_block_rsv_use_bytes(block_rsv, blocksize);
49362306a36Sopenharmony_ci	if (!ret)
49462306a36Sopenharmony_ci		return block_rsv;
49562306a36Sopenharmony_ci
49662306a36Sopenharmony_ci	if (block_rsv->failfast)
49762306a36Sopenharmony_ci		return ERR_PTR(ret);
49862306a36Sopenharmony_ci
49962306a36Sopenharmony_ci	if (block_rsv->type == BTRFS_BLOCK_RSV_GLOBAL && !global_updated) {
50062306a36Sopenharmony_ci		global_updated = true;
50162306a36Sopenharmony_ci		btrfs_update_global_block_rsv(fs_info);
50262306a36Sopenharmony_ci		goto again;
50362306a36Sopenharmony_ci	}
50462306a36Sopenharmony_ci
50562306a36Sopenharmony_ci	/*
50662306a36Sopenharmony_ci	 * The global reserve still exists to save us from ourselves, so don't
50762306a36Sopenharmony_ci	 * warn_on if we are short on our delayed refs reserve.
50862306a36Sopenharmony_ci	 */
50962306a36Sopenharmony_ci	if (block_rsv->type != BTRFS_BLOCK_RSV_DELREFS &&
51062306a36Sopenharmony_ci	    btrfs_test_opt(fs_info, ENOSPC_DEBUG)) {
51162306a36Sopenharmony_ci		static DEFINE_RATELIMIT_STATE(_rs,
51262306a36Sopenharmony_ci				DEFAULT_RATELIMIT_INTERVAL * 10,
51362306a36Sopenharmony_ci				/*DEFAULT_RATELIMIT_BURST*/ 1);
51462306a36Sopenharmony_ci		if (__ratelimit(&_rs))
51562306a36Sopenharmony_ci			WARN(1, KERN_DEBUG
51662306a36Sopenharmony_ci				"BTRFS: block rsv %d returned %d\n",
51762306a36Sopenharmony_ci				block_rsv->type, ret);
51862306a36Sopenharmony_ci	}
51962306a36Sopenharmony_citry_reserve:
52062306a36Sopenharmony_ci	ret = btrfs_reserve_metadata_bytes(fs_info, block_rsv, blocksize,
52162306a36Sopenharmony_ci					   BTRFS_RESERVE_NO_FLUSH);
52262306a36Sopenharmony_ci	if (!ret)
52362306a36Sopenharmony_ci		return block_rsv;
52462306a36Sopenharmony_ci	/*
52562306a36Sopenharmony_ci	 * If we couldn't reserve metadata bytes try and use some from
52662306a36Sopenharmony_ci	 * the global reserve if its space type is the same as the global
52762306a36Sopenharmony_ci	 * reservation.
52862306a36Sopenharmony_ci	 */
52962306a36Sopenharmony_ci	if (block_rsv->type != BTRFS_BLOCK_RSV_GLOBAL &&
53062306a36Sopenharmony_ci	    block_rsv->space_info == global_rsv->space_info) {
53162306a36Sopenharmony_ci		ret = btrfs_block_rsv_use_bytes(global_rsv, blocksize);
53262306a36Sopenharmony_ci		if (!ret)
53362306a36Sopenharmony_ci			return global_rsv;
53462306a36Sopenharmony_ci	}
53562306a36Sopenharmony_ci
53662306a36Sopenharmony_ci	/*
53762306a36Sopenharmony_ci	 * All hope is lost, but of course our reservations are overly
53862306a36Sopenharmony_ci	 * pessimistic, so instead of possibly having an ENOSPC abort here, try
53962306a36Sopenharmony_ci	 * one last time to force a reservation if there's enough actual space
54062306a36Sopenharmony_ci	 * on disk to make the reservation.
54162306a36Sopenharmony_ci	 */
54262306a36Sopenharmony_ci	ret = btrfs_reserve_metadata_bytes(fs_info, block_rsv, blocksize,
54362306a36Sopenharmony_ci					   BTRFS_RESERVE_FLUSH_EMERGENCY);
54462306a36Sopenharmony_ci	if (!ret)
54562306a36Sopenharmony_ci		return block_rsv;
54662306a36Sopenharmony_ci
54762306a36Sopenharmony_ci	return ERR_PTR(ret);
54862306a36Sopenharmony_ci}
54962306a36Sopenharmony_ci
55062306a36Sopenharmony_ciint btrfs_check_trunc_cache_free_space(struct btrfs_fs_info *fs_info,
55162306a36Sopenharmony_ci				       struct btrfs_block_rsv *rsv)
55262306a36Sopenharmony_ci{
55362306a36Sopenharmony_ci	u64 needed_bytes;
55462306a36Sopenharmony_ci	int ret;
55562306a36Sopenharmony_ci
55662306a36Sopenharmony_ci	/* 1 for slack space, 1 for updating the inode */
55762306a36Sopenharmony_ci	needed_bytes = btrfs_calc_insert_metadata_size(fs_info, 1) +
55862306a36Sopenharmony_ci		btrfs_calc_metadata_size(fs_info, 1);
55962306a36Sopenharmony_ci
56062306a36Sopenharmony_ci	spin_lock(&rsv->lock);
56162306a36Sopenharmony_ci	if (rsv->reserved < needed_bytes)
56262306a36Sopenharmony_ci		ret = -ENOSPC;
56362306a36Sopenharmony_ci	else
56462306a36Sopenharmony_ci		ret = 0;
56562306a36Sopenharmony_ci	spin_unlock(&rsv->lock);
56662306a36Sopenharmony_ci	return ret;
56762306a36Sopenharmony_ci}
568