162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0 262306a36Sopenharmony_ci 362306a36Sopenharmony_ci#include "misc.h" 462306a36Sopenharmony_ci#include "ctree.h" 562306a36Sopenharmony_ci#include "block-rsv.h" 662306a36Sopenharmony_ci#include "space-info.h" 762306a36Sopenharmony_ci#include "transaction.h" 862306a36Sopenharmony_ci#include "block-group.h" 962306a36Sopenharmony_ci#include "disk-io.h" 1062306a36Sopenharmony_ci#include "fs.h" 1162306a36Sopenharmony_ci#include "accessors.h" 1262306a36Sopenharmony_ci 1362306a36Sopenharmony_ci/* 1462306a36Sopenharmony_ci * HOW DO BLOCK RESERVES WORK 1562306a36Sopenharmony_ci * 1662306a36Sopenharmony_ci * Think of block_rsv's as buckets for logically grouped metadata 1762306a36Sopenharmony_ci * reservations. Each block_rsv has a ->size and a ->reserved. ->size is 1862306a36Sopenharmony_ci * how large we want our block rsv to be, ->reserved is how much space is 1962306a36Sopenharmony_ci * currently reserved for this block reserve. 2062306a36Sopenharmony_ci * 2162306a36Sopenharmony_ci * ->failfast exists for the truncate case, and is described below. 2262306a36Sopenharmony_ci * 2362306a36Sopenharmony_ci * NORMAL OPERATION 2462306a36Sopenharmony_ci * 2562306a36Sopenharmony_ci * -> Reserve 2662306a36Sopenharmony_ci * Entrance: btrfs_block_rsv_add, btrfs_block_rsv_refill 2762306a36Sopenharmony_ci * 2862306a36Sopenharmony_ci * We call into btrfs_reserve_metadata_bytes() with our bytes, which is 2962306a36Sopenharmony_ci * accounted for in space_info->bytes_may_use, and then add the bytes to 3062306a36Sopenharmony_ci * ->reserved, and ->size in the case of btrfs_block_rsv_add. 3162306a36Sopenharmony_ci * 3262306a36Sopenharmony_ci * ->size is an over-estimation of how much we may use for a particular 3362306a36Sopenharmony_ci * operation. 3462306a36Sopenharmony_ci * 3562306a36Sopenharmony_ci * -> Use 3662306a36Sopenharmony_ci * Entrance: btrfs_use_block_rsv 3762306a36Sopenharmony_ci * 3862306a36Sopenharmony_ci * When we do a btrfs_alloc_tree_block() we call into btrfs_use_block_rsv() 3962306a36Sopenharmony_ci * to determine the appropriate block_rsv to use, and then verify that 4062306a36Sopenharmony_ci * ->reserved has enough space for our tree block allocation. Once 4162306a36Sopenharmony_ci * successful we subtract fs_info->nodesize from ->reserved. 4262306a36Sopenharmony_ci * 4362306a36Sopenharmony_ci * -> Finish 4462306a36Sopenharmony_ci * Entrance: btrfs_block_rsv_release 4562306a36Sopenharmony_ci * 4662306a36Sopenharmony_ci * We are finished with our operation, subtract our individual reservation 4762306a36Sopenharmony_ci * from ->size, and then subtract ->size from ->reserved and free up the 4862306a36Sopenharmony_ci * excess if there is any. 4962306a36Sopenharmony_ci * 5062306a36Sopenharmony_ci * There is some logic here to refill the delayed refs rsv or the global rsv 5162306a36Sopenharmony_ci * as needed, otherwise the excess is subtracted from 5262306a36Sopenharmony_ci * space_info->bytes_may_use. 5362306a36Sopenharmony_ci * 5462306a36Sopenharmony_ci * TYPES OF BLOCK RESERVES 5562306a36Sopenharmony_ci * 5662306a36Sopenharmony_ci * BLOCK_RSV_TRANS, BLOCK_RSV_DELOPS, BLOCK_RSV_CHUNK 5762306a36Sopenharmony_ci * These behave normally, as described above, just within the confines of the 5862306a36Sopenharmony_ci * lifetime of their particular operation (transaction for the whole trans 5962306a36Sopenharmony_ci * handle lifetime, for example). 6062306a36Sopenharmony_ci * 6162306a36Sopenharmony_ci * BLOCK_RSV_GLOBAL 6262306a36Sopenharmony_ci * It is impossible to properly account for all the space that may be required 6362306a36Sopenharmony_ci * to make our extent tree updates. This block reserve acts as an overflow 6462306a36Sopenharmony_ci * buffer in case our delayed refs reserve does not reserve enough space to 6562306a36Sopenharmony_ci * update the extent tree. 6662306a36Sopenharmony_ci * 6762306a36Sopenharmony_ci * We can steal from this in some cases as well, notably on evict() or 6862306a36Sopenharmony_ci * truncate() in order to help users recover from ENOSPC conditions. 6962306a36Sopenharmony_ci * 7062306a36Sopenharmony_ci * BLOCK_RSV_DELALLOC 7162306a36Sopenharmony_ci * The individual item sizes are determined by the per-inode size 7262306a36Sopenharmony_ci * calculations, which are described with the delalloc code. This is pretty 7362306a36Sopenharmony_ci * straightforward, it's just the calculation of ->size encodes a lot of 7462306a36Sopenharmony_ci * different items, and thus it gets used when updating inodes, inserting file 7562306a36Sopenharmony_ci * extents, and inserting checksums. 7662306a36Sopenharmony_ci * 7762306a36Sopenharmony_ci * BLOCK_RSV_DELREFS 7862306a36Sopenharmony_ci * We keep a running tally of how many delayed refs we have on the system. 7962306a36Sopenharmony_ci * We assume each one of these delayed refs are going to use a full 8062306a36Sopenharmony_ci * reservation. We use the transaction items and pre-reserve space for every 8162306a36Sopenharmony_ci * operation, and use this reservation to refill any gap between ->size and 8262306a36Sopenharmony_ci * ->reserved that may exist. 8362306a36Sopenharmony_ci * 8462306a36Sopenharmony_ci * From there it's straightforward, removing a delayed ref means we remove its 8562306a36Sopenharmony_ci * count from ->size and free up reservations as necessary. Since this is 8662306a36Sopenharmony_ci * the most dynamic block reserve in the system, we will try to refill this 8762306a36Sopenharmony_ci * block reserve first with any excess returned by any other block reserve. 8862306a36Sopenharmony_ci * 8962306a36Sopenharmony_ci * BLOCK_RSV_EMPTY 9062306a36Sopenharmony_ci * This is the fallback block reserve to make us try to reserve space if we 9162306a36Sopenharmony_ci * don't have a specific bucket for this allocation. It is mostly used for 9262306a36Sopenharmony_ci * updating the device tree and such, since that is a separate pool we're 9362306a36Sopenharmony_ci * content to just reserve space from the space_info on demand. 9462306a36Sopenharmony_ci * 9562306a36Sopenharmony_ci * BLOCK_RSV_TEMP 9662306a36Sopenharmony_ci * This is used by things like truncate and iput. We will temporarily 9762306a36Sopenharmony_ci * allocate a block reserve, set it to some size, and then truncate bytes 9862306a36Sopenharmony_ci * until we have no space left. With ->failfast set we'll simply return 9962306a36Sopenharmony_ci * ENOSPC from btrfs_use_block_rsv() to signal that we need to unwind and try 10062306a36Sopenharmony_ci * to make a new reservation. This is because these operations are 10162306a36Sopenharmony_ci * unbounded, so we want to do as much work as we can, and then back off and 10262306a36Sopenharmony_ci * re-reserve. 10362306a36Sopenharmony_ci */ 10462306a36Sopenharmony_ci 10562306a36Sopenharmony_cistatic u64 block_rsv_release_bytes(struct btrfs_fs_info *fs_info, 10662306a36Sopenharmony_ci struct btrfs_block_rsv *block_rsv, 10762306a36Sopenharmony_ci struct btrfs_block_rsv *dest, u64 num_bytes, 10862306a36Sopenharmony_ci u64 *qgroup_to_release_ret) 10962306a36Sopenharmony_ci{ 11062306a36Sopenharmony_ci struct btrfs_space_info *space_info = block_rsv->space_info; 11162306a36Sopenharmony_ci u64 qgroup_to_release = 0; 11262306a36Sopenharmony_ci u64 ret; 11362306a36Sopenharmony_ci 11462306a36Sopenharmony_ci spin_lock(&block_rsv->lock); 11562306a36Sopenharmony_ci if (num_bytes == (u64)-1) { 11662306a36Sopenharmony_ci num_bytes = block_rsv->size; 11762306a36Sopenharmony_ci qgroup_to_release = block_rsv->qgroup_rsv_size; 11862306a36Sopenharmony_ci } 11962306a36Sopenharmony_ci block_rsv->size -= num_bytes; 12062306a36Sopenharmony_ci if (block_rsv->reserved >= block_rsv->size) { 12162306a36Sopenharmony_ci num_bytes = block_rsv->reserved - block_rsv->size; 12262306a36Sopenharmony_ci block_rsv->reserved = block_rsv->size; 12362306a36Sopenharmony_ci block_rsv->full = true; 12462306a36Sopenharmony_ci } else { 12562306a36Sopenharmony_ci num_bytes = 0; 12662306a36Sopenharmony_ci } 12762306a36Sopenharmony_ci if (qgroup_to_release_ret && 12862306a36Sopenharmony_ci block_rsv->qgroup_rsv_reserved >= block_rsv->qgroup_rsv_size) { 12962306a36Sopenharmony_ci qgroup_to_release = block_rsv->qgroup_rsv_reserved - 13062306a36Sopenharmony_ci block_rsv->qgroup_rsv_size; 13162306a36Sopenharmony_ci block_rsv->qgroup_rsv_reserved = block_rsv->qgroup_rsv_size; 13262306a36Sopenharmony_ci } else { 13362306a36Sopenharmony_ci qgroup_to_release = 0; 13462306a36Sopenharmony_ci } 13562306a36Sopenharmony_ci spin_unlock(&block_rsv->lock); 13662306a36Sopenharmony_ci 13762306a36Sopenharmony_ci ret = num_bytes; 13862306a36Sopenharmony_ci if (num_bytes > 0) { 13962306a36Sopenharmony_ci if (dest) { 14062306a36Sopenharmony_ci spin_lock(&dest->lock); 14162306a36Sopenharmony_ci if (!dest->full) { 14262306a36Sopenharmony_ci u64 bytes_to_add; 14362306a36Sopenharmony_ci 14462306a36Sopenharmony_ci bytes_to_add = dest->size - dest->reserved; 14562306a36Sopenharmony_ci bytes_to_add = min(num_bytes, bytes_to_add); 14662306a36Sopenharmony_ci dest->reserved += bytes_to_add; 14762306a36Sopenharmony_ci if (dest->reserved >= dest->size) 14862306a36Sopenharmony_ci dest->full = true; 14962306a36Sopenharmony_ci num_bytes -= bytes_to_add; 15062306a36Sopenharmony_ci } 15162306a36Sopenharmony_ci spin_unlock(&dest->lock); 15262306a36Sopenharmony_ci } 15362306a36Sopenharmony_ci if (num_bytes) 15462306a36Sopenharmony_ci btrfs_space_info_free_bytes_may_use(fs_info, 15562306a36Sopenharmony_ci space_info, 15662306a36Sopenharmony_ci num_bytes); 15762306a36Sopenharmony_ci } 15862306a36Sopenharmony_ci if (qgroup_to_release_ret) 15962306a36Sopenharmony_ci *qgroup_to_release_ret = qgroup_to_release; 16062306a36Sopenharmony_ci return ret; 16162306a36Sopenharmony_ci} 16262306a36Sopenharmony_ci 16362306a36Sopenharmony_ciint btrfs_block_rsv_migrate(struct btrfs_block_rsv *src, 16462306a36Sopenharmony_ci struct btrfs_block_rsv *dst, u64 num_bytes, 16562306a36Sopenharmony_ci bool update_size) 16662306a36Sopenharmony_ci{ 16762306a36Sopenharmony_ci int ret; 16862306a36Sopenharmony_ci 16962306a36Sopenharmony_ci ret = btrfs_block_rsv_use_bytes(src, num_bytes); 17062306a36Sopenharmony_ci if (ret) 17162306a36Sopenharmony_ci return ret; 17262306a36Sopenharmony_ci 17362306a36Sopenharmony_ci btrfs_block_rsv_add_bytes(dst, num_bytes, update_size); 17462306a36Sopenharmony_ci return 0; 17562306a36Sopenharmony_ci} 17662306a36Sopenharmony_ci 17762306a36Sopenharmony_civoid btrfs_init_block_rsv(struct btrfs_block_rsv *rsv, enum btrfs_rsv_type type) 17862306a36Sopenharmony_ci{ 17962306a36Sopenharmony_ci memset(rsv, 0, sizeof(*rsv)); 18062306a36Sopenharmony_ci spin_lock_init(&rsv->lock); 18162306a36Sopenharmony_ci rsv->type = type; 18262306a36Sopenharmony_ci} 18362306a36Sopenharmony_ci 18462306a36Sopenharmony_civoid btrfs_init_metadata_block_rsv(struct btrfs_fs_info *fs_info, 18562306a36Sopenharmony_ci struct btrfs_block_rsv *rsv, 18662306a36Sopenharmony_ci enum btrfs_rsv_type type) 18762306a36Sopenharmony_ci{ 18862306a36Sopenharmony_ci btrfs_init_block_rsv(rsv, type); 18962306a36Sopenharmony_ci rsv->space_info = btrfs_find_space_info(fs_info, 19062306a36Sopenharmony_ci BTRFS_BLOCK_GROUP_METADATA); 19162306a36Sopenharmony_ci} 19262306a36Sopenharmony_ci 19362306a36Sopenharmony_cistruct btrfs_block_rsv *btrfs_alloc_block_rsv(struct btrfs_fs_info *fs_info, 19462306a36Sopenharmony_ci enum btrfs_rsv_type type) 19562306a36Sopenharmony_ci{ 19662306a36Sopenharmony_ci struct btrfs_block_rsv *block_rsv; 19762306a36Sopenharmony_ci 19862306a36Sopenharmony_ci block_rsv = kmalloc(sizeof(*block_rsv), GFP_NOFS); 19962306a36Sopenharmony_ci if (!block_rsv) 20062306a36Sopenharmony_ci return NULL; 20162306a36Sopenharmony_ci 20262306a36Sopenharmony_ci btrfs_init_metadata_block_rsv(fs_info, block_rsv, type); 20362306a36Sopenharmony_ci return block_rsv; 20462306a36Sopenharmony_ci} 20562306a36Sopenharmony_ci 20662306a36Sopenharmony_civoid btrfs_free_block_rsv(struct btrfs_fs_info *fs_info, 20762306a36Sopenharmony_ci struct btrfs_block_rsv *rsv) 20862306a36Sopenharmony_ci{ 20962306a36Sopenharmony_ci if (!rsv) 21062306a36Sopenharmony_ci return; 21162306a36Sopenharmony_ci btrfs_block_rsv_release(fs_info, rsv, (u64)-1, NULL); 21262306a36Sopenharmony_ci kfree(rsv); 21362306a36Sopenharmony_ci} 21462306a36Sopenharmony_ci 21562306a36Sopenharmony_ciint btrfs_block_rsv_add(struct btrfs_fs_info *fs_info, 21662306a36Sopenharmony_ci struct btrfs_block_rsv *block_rsv, u64 num_bytes, 21762306a36Sopenharmony_ci enum btrfs_reserve_flush_enum flush) 21862306a36Sopenharmony_ci{ 21962306a36Sopenharmony_ci int ret; 22062306a36Sopenharmony_ci 22162306a36Sopenharmony_ci if (num_bytes == 0) 22262306a36Sopenharmony_ci return 0; 22362306a36Sopenharmony_ci 22462306a36Sopenharmony_ci ret = btrfs_reserve_metadata_bytes(fs_info, block_rsv, num_bytes, flush); 22562306a36Sopenharmony_ci if (!ret) 22662306a36Sopenharmony_ci btrfs_block_rsv_add_bytes(block_rsv, num_bytes, true); 22762306a36Sopenharmony_ci 22862306a36Sopenharmony_ci return ret; 22962306a36Sopenharmony_ci} 23062306a36Sopenharmony_ci 23162306a36Sopenharmony_ciint btrfs_block_rsv_check(struct btrfs_block_rsv *block_rsv, int min_percent) 23262306a36Sopenharmony_ci{ 23362306a36Sopenharmony_ci u64 num_bytes = 0; 23462306a36Sopenharmony_ci int ret = -ENOSPC; 23562306a36Sopenharmony_ci 23662306a36Sopenharmony_ci spin_lock(&block_rsv->lock); 23762306a36Sopenharmony_ci num_bytes = mult_perc(block_rsv->size, min_percent); 23862306a36Sopenharmony_ci if (block_rsv->reserved >= num_bytes) 23962306a36Sopenharmony_ci ret = 0; 24062306a36Sopenharmony_ci spin_unlock(&block_rsv->lock); 24162306a36Sopenharmony_ci 24262306a36Sopenharmony_ci return ret; 24362306a36Sopenharmony_ci} 24462306a36Sopenharmony_ci 24562306a36Sopenharmony_ciint btrfs_block_rsv_refill(struct btrfs_fs_info *fs_info, 24662306a36Sopenharmony_ci struct btrfs_block_rsv *block_rsv, u64 num_bytes, 24762306a36Sopenharmony_ci enum btrfs_reserve_flush_enum flush) 24862306a36Sopenharmony_ci{ 24962306a36Sopenharmony_ci int ret = -ENOSPC; 25062306a36Sopenharmony_ci 25162306a36Sopenharmony_ci if (!block_rsv) 25262306a36Sopenharmony_ci return 0; 25362306a36Sopenharmony_ci 25462306a36Sopenharmony_ci spin_lock(&block_rsv->lock); 25562306a36Sopenharmony_ci if (block_rsv->reserved >= num_bytes) 25662306a36Sopenharmony_ci ret = 0; 25762306a36Sopenharmony_ci else 25862306a36Sopenharmony_ci num_bytes -= block_rsv->reserved; 25962306a36Sopenharmony_ci spin_unlock(&block_rsv->lock); 26062306a36Sopenharmony_ci 26162306a36Sopenharmony_ci if (!ret) 26262306a36Sopenharmony_ci return 0; 26362306a36Sopenharmony_ci 26462306a36Sopenharmony_ci ret = btrfs_reserve_metadata_bytes(fs_info, block_rsv, num_bytes, flush); 26562306a36Sopenharmony_ci if (!ret) { 26662306a36Sopenharmony_ci btrfs_block_rsv_add_bytes(block_rsv, num_bytes, false); 26762306a36Sopenharmony_ci return 0; 26862306a36Sopenharmony_ci } 26962306a36Sopenharmony_ci 27062306a36Sopenharmony_ci return ret; 27162306a36Sopenharmony_ci} 27262306a36Sopenharmony_ci 27362306a36Sopenharmony_ciu64 btrfs_block_rsv_release(struct btrfs_fs_info *fs_info, 27462306a36Sopenharmony_ci struct btrfs_block_rsv *block_rsv, u64 num_bytes, 27562306a36Sopenharmony_ci u64 *qgroup_to_release) 27662306a36Sopenharmony_ci{ 27762306a36Sopenharmony_ci struct btrfs_block_rsv *global_rsv = &fs_info->global_block_rsv; 27862306a36Sopenharmony_ci struct btrfs_block_rsv *delayed_rsv = &fs_info->delayed_refs_rsv; 27962306a36Sopenharmony_ci struct btrfs_block_rsv *target = NULL; 28062306a36Sopenharmony_ci 28162306a36Sopenharmony_ci /* 28262306a36Sopenharmony_ci * If we are the delayed_rsv then push to the global rsv, otherwise dump 28362306a36Sopenharmony_ci * into the delayed rsv if it is not full. 28462306a36Sopenharmony_ci */ 28562306a36Sopenharmony_ci if (block_rsv == delayed_rsv) 28662306a36Sopenharmony_ci target = global_rsv; 28762306a36Sopenharmony_ci else if (block_rsv != global_rsv && !btrfs_block_rsv_full(delayed_rsv)) 28862306a36Sopenharmony_ci target = delayed_rsv; 28962306a36Sopenharmony_ci 29062306a36Sopenharmony_ci if (target && block_rsv->space_info != target->space_info) 29162306a36Sopenharmony_ci target = NULL; 29262306a36Sopenharmony_ci 29362306a36Sopenharmony_ci return block_rsv_release_bytes(fs_info, block_rsv, target, num_bytes, 29462306a36Sopenharmony_ci qgroup_to_release); 29562306a36Sopenharmony_ci} 29662306a36Sopenharmony_ci 29762306a36Sopenharmony_ciint btrfs_block_rsv_use_bytes(struct btrfs_block_rsv *block_rsv, u64 num_bytes) 29862306a36Sopenharmony_ci{ 29962306a36Sopenharmony_ci int ret = -ENOSPC; 30062306a36Sopenharmony_ci 30162306a36Sopenharmony_ci spin_lock(&block_rsv->lock); 30262306a36Sopenharmony_ci if (block_rsv->reserved >= num_bytes) { 30362306a36Sopenharmony_ci block_rsv->reserved -= num_bytes; 30462306a36Sopenharmony_ci if (block_rsv->reserved < block_rsv->size) 30562306a36Sopenharmony_ci block_rsv->full = false; 30662306a36Sopenharmony_ci ret = 0; 30762306a36Sopenharmony_ci } 30862306a36Sopenharmony_ci spin_unlock(&block_rsv->lock); 30962306a36Sopenharmony_ci return ret; 31062306a36Sopenharmony_ci} 31162306a36Sopenharmony_ci 31262306a36Sopenharmony_civoid btrfs_block_rsv_add_bytes(struct btrfs_block_rsv *block_rsv, 31362306a36Sopenharmony_ci u64 num_bytes, bool update_size) 31462306a36Sopenharmony_ci{ 31562306a36Sopenharmony_ci spin_lock(&block_rsv->lock); 31662306a36Sopenharmony_ci block_rsv->reserved += num_bytes; 31762306a36Sopenharmony_ci if (update_size) 31862306a36Sopenharmony_ci block_rsv->size += num_bytes; 31962306a36Sopenharmony_ci else if (block_rsv->reserved >= block_rsv->size) 32062306a36Sopenharmony_ci block_rsv->full = true; 32162306a36Sopenharmony_ci spin_unlock(&block_rsv->lock); 32262306a36Sopenharmony_ci} 32362306a36Sopenharmony_ci 32462306a36Sopenharmony_civoid btrfs_update_global_block_rsv(struct btrfs_fs_info *fs_info) 32562306a36Sopenharmony_ci{ 32662306a36Sopenharmony_ci struct btrfs_block_rsv *block_rsv = &fs_info->global_block_rsv; 32762306a36Sopenharmony_ci struct btrfs_space_info *sinfo = block_rsv->space_info; 32862306a36Sopenharmony_ci struct btrfs_root *root, *tmp; 32962306a36Sopenharmony_ci u64 num_bytes = btrfs_root_used(&fs_info->tree_root->root_item); 33062306a36Sopenharmony_ci unsigned int min_items = 1; 33162306a36Sopenharmony_ci 33262306a36Sopenharmony_ci /* 33362306a36Sopenharmony_ci * The global block rsv is based on the size of the extent tree, the 33462306a36Sopenharmony_ci * checksum tree and the root tree. If the fs is empty we want to set 33562306a36Sopenharmony_ci * it to a minimal amount for safety. 33662306a36Sopenharmony_ci * 33762306a36Sopenharmony_ci * We also are going to need to modify the minimum of the tree root and 33862306a36Sopenharmony_ci * any global roots we could touch. 33962306a36Sopenharmony_ci */ 34062306a36Sopenharmony_ci read_lock(&fs_info->global_root_lock); 34162306a36Sopenharmony_ci rbtree_postorder_for_each_entry_safe(root, tmp, &fs_info->global_root_tree, 34262306a36Sopenharmony_ci rb_node) { 34362306a36Sopenharmony_ci if (root->root_key.objectid == BTRFS_EXTENT_TREE_OBJECTID || 34462306a36Sopenharmony_ci root->root_key.objectid == BTRFS_CSUM_TREE_OBJECTID || 34562306a36Sopenharmony_ci root->root_key.objectid == BTRFS_FREE_SPACE_TREE_OBJECTID) { 34662306a36Sopenharmony_ci num_bytes += btrfs_root_used(&root->root_item); 34762306a36Sopenharmony_ci min_items++; 34862306a36Sopenharmony_ci } 34962306a36Sopenharmony_ci } 35062306a36Sopenharmony_ci read_unlock(&fs_info->global_root_lock); 35162306a36Sopenharmony_ci 35262306a36Sopenharmony_ci if (btrfs_fs_compat_ro(fs_info, BLOCK_GROUP_TREE)) { 35362306a36Sopenharmony_ci num_bytes += btrfs_root_used(&fs_info->block_group_root->root_item); 35462306a36Sopenharmony_ci min_items++; 35562306a36Sopenharmony_ci } 35662306a36Sopenharmony_ci 35762306a36Sopenharmony_ci /* 35862306a36Sopenharmony_ci * But we also want to reserve enough space so we can do the fallback 35962306a36Sopenharmony_ci * global reserve for an unlink, which is an additional 36062306a36Sopenharmony_ci * BTRFS_UNLINK_METADATA_UNITS items. 36162306a36Sopenharmony_ci * 36262306a36Sopenharmony_ci * But we also need space for the delayed ref updates from the unlink, 36362306a36Sopenharmony_ci * so add BTRFS_UNLINK_METADATA_UNITS units for delayed refs, one for 36462306a36Sopenharmony_ci * each unlink metadata item. 36562306a36Sopenharmony_ci */ 36662306a36Sopenharmony_ci min_items += BTRFS_UNLINK_METADATA_UNITS; 36762306a36Sopenharmony_ci 36862306a36Sopenharmony_ci num_bytes = max_t(u64, num_bytes, 36962306a36Sopenharmony_ci btrfs_calc_insert_metadata_size(fs_info, min_items) + 37062306a36Sopenharmony_ci btrfs_calc_delayed_ref_bytes(fs_info, 37162306a36Sopenharmony_ci BTRFS_UNLINK_METADATA_UNITS)); 37262306a36Sopenharmony_ci 37362306a36Sopenharmony_ci spin_lock(&sinfo->lock); 37462306a36Sopenharmony_ci spin_lock(&block_rsv->lock); 37562306a36Sopenharmony_ci 37662306a36Sopenharmony_ci block_rsv->size = min_t(u64, num_bytes, SZ_512M); 37762306a36Sopenharmony_ci 37862306a36Sopenharmony_ci if (block_rsv->reserved < block_rsv->size) { 37962306a36Sopenharmony_ci num_bytes = block_rsv->size - block_rsv->reserved; 38062306a36Sopenharmony_ci btrfs_space_info_update_bytes_may_use(fs_info, sinfo, 38162306a36Sopenharmony_ci num_bytes); 38262306a36Sopenharmony_ci block_rsv->reserved = block_rsv->size; 38362306a36Sopenharmony_ci } else if (block_rsv->reserved > block_rsv->size) { 38462306a36Sopenharmony_ci num_bytes = block_rsv->reserved - block_rsv->size; 38562306a36Sopenharmony_ci btrfs_space_info_update_bytes_may_use(fs_info, sinfo, 38662306a36Sopenharmony_ci -num_bytes); 38762306a36Sopenharmony_ci block_rsv->reserved = block_rsv->size; 38862306a36Sopenharmony_ci btrfs_try_granting_tickets(fs_info, sinfo); 38962306a36Sopenharmony_ci } 39062306a36Sopenharmony_ci 39162306a36Sopenharmony_ci block_rsv->full = (block_rsv->reserved == block_rsv->size); 39262306a36Sopenharmony_ci 39362306a36Sopenharmony_ci if (block_rsv->size >= sinfo->total_bytes) 39462306a36Sopenharmony_ci sinfo->force_alloc = CHUNK_ALLOC_FORCE; 39562306a36Sopenharmony_ci spin_unlock(&block_rsv->lock); 39662306a36Sopenharmony_ci spin_unlock(&sinfo->lock); 39762306a36Sopenharmony_ci} 39862306a36Sopenharmony_ci 39962306a36Sopenharmony_civoid btrfs_init_root_block_rsv(struct btrfs_root *root) 40062306a36Sopenharmony_ci{ 40162306a36Sopenharmony_ci struct btrfs_fs_info *fs_info = root->fs_info; 40262306a36Sopenharmony_ci 40362306a36Sopenharmony_ci switch (root->root_key.objectid) { 40462306a36Sopenharmony_ci case BTRFS_CSUM_TREE_OBJECTID: 40562306a36Sopenharmony_ci case BTRFS_EXTENT_TREE_OBJECTID: 40662306a36Sopenharmony_ci case BTRFS_FREE_SPACE_TREE_OBJECTID: 40762306a36Sopenharmony_ci case BTRFS_BLOCK_GROUP_TREE_OBJECTID: 40862306a36Sopenharmony_ci root->block_rsv = &fs_info->delayed_refs_rsv; 40962306a36Sopenharmony_ci break; 41062306a36Sopenharmony_ci case BTRFS_ROOT_TREE_OBJECTID: 41162306a36Sopenharmony_ci case BTRFS_DEV_TREE_OBJECTID: 41262306a36Sopenharmony_ci case BTRFS_QUOTA_TREE_OBJECTID: 41362306a36Sopenharmony_ci root->block_rsv = &fs_info->global_block_rsv; 41462306a36Sopenharmony_ci break; 41562306a36Sopenharmony_ci case BTRFS_CHUNK_TREE_OBJECTID: 41662306a36Sopenharmony_ci root->block_rsv = &fs_info->chunk_block_rsv; 41762306a36Sopenharmony_ci break; 41862306a36Sopenharmony_ci default: 41962306a36Sopenharmony_ci root->block_rsv = NULL; 42062306a36Sopenharmony_ci break; 42162306a36Sopenharmony_ci } 42262306a36Sopenharmony_ci} 42362306a36Sopenharmony_ci 42462306a36Sopenharmony_civoid btrfs_init_global_block_rsv(struct btrfs_fs_info *fs_info) 42562306a36Sopenharmony_ci{ 42662306a36Sopenharmony_ci struct btrfs_space_info *space_info; 42762306a36Sopenharmony_ci 42862306a36Sopenharmony_ci space_info = btrfs_find_space_info(fs_info, BTRFS_BLOCK_GROUP_SYSTEM); 42962306a36Sopenharmony_ci fs_info->chunk_block_rsv.space_info = space_info; 43062306a36Sopenharmony_ci 43162306a36Sopenharmony_ci space_info = btrfs_find_space_info(fs_info, BTRFS_BLOCK_GROUP_METADATA); 43262306a36Sopenharmony_ci fs_info->global_block_rsv.space_info = space_info; 43362306a36Sopenharmony_ci fs_info->trans_block_rsv.space_info = space_info; 43462306a36Sopenharmony_ci fs_info->empty_block_rsv.space_info = space_info; 43562306a36Sopenharmony_ci fs_info->delayed_block_rsv.space_info = space_info; 43662306a36Sopenharmony_ci fs_info->delayed_refs_rsv.space_info = space_info; 43762306a36Sopenharmony_ci 43862306a36Sopenharmony_ci btrfs_update_global_block_rsv(fs_info); 43962306a36Sopenharmony_ci} 44062306a36Sopenharmony_ci 44162306a36Sopenharmony_civoid btrfs_release_global_block_rsv(struct btrfs_fs_info *fs_info) 44262306a36Sopenharmony_ci{ 44362306a36Sopenharmony_ci btrfs_block_rsv_release(fs_info, &fs_info->global_block_rsv, (u64)-1, 44462306a36Sopenharmony_ci NULL); 44562306a36Sopenharmony_ci WARN_ON(fs_info->trans_block_rsv.size > 0); 44662306a36Sopenharmony_ci WARN_ON(fs_info->trans_block_rsv.reserved > 0); 44762306a36Sopenharmony_ci WARN_ON(fs_info->chunk_block_rsv.size > 0); 44862306a36Sopenharmony_ci WARN_ON(fs_info->chunk_block_rsv.reserved > 0); 44962306a36Sopenharmony_ci WARN_ON(fs_info->delayed_block_rsv.size > 0); 45062306a36Sopenharmony_ci WARN_ON(fs_info->delayed_block_rsv.reserved > 0); 45162306a36Sopenharmony_ci WARN_ON(fs_info->delayed_refs_rsv.reserved > 0); 45262306a36Sopenharmony_ci WARN_ON(fs_info->delayed_refs_rsv.size > 0); 45362306a36Sopenharmony_ci} 45462306a36Sopenharmony_ci 45562306a36Sopenharmony_cistatic struct btrfs_block_rsv *get_block_rsv( 45662306a36Sopenharmony_ci const struct btrfs_trans_handle *trans, 45762306a36Sopenharmony_ci const struct btrfs_root *root) 45862306a36Sopenharmony_ci{ 45962306a36Sopenharmony_ci struct btrfs_fs_info *fs_info = root->fs_info; 46062306a36Sopenharmony_ci struct btrfs_block_rsv *block_rsv = NULL; 46162306a36Sopenharmony_ci 46262306a36Sopenharmony_ci if (test_bit(BTRFS_ROOT_SHAREABLE, &root->state) || 46362306a36Sopenharmony_ci (root == fs_info->uuid_root) || 46462306a36Sopenharmony_ci (trans->adding_csums && 46562306a36Sopenharmony_ci root->root_key.objectid == BTRFS_CSUM_TREE_OBJECTID)) 46662306a36Sopenharmony_ci block_rsv = trans->block_rsv; 46762306a36Sopenharmony_ci 46862306a36Sopenharmony_ci if (!block_rsv) 46962306a36Sopenharmony_ci block_rsv = root->block_rsv; 47062306a36Sopenharmony_ci 47162306a36Sopenharmony_ci if (!block_rsv) 47262306a36Sopenharmony_ci block_rsv = &fs_info->empty_block_rsv; 47362306a36Sopenharmony_ci 47462306a36Sopenharmony_ci return block_rsv; 47562306a36Sopenharmony_ci} 47662306a36Sopenharmony_ci 47762306a36Sopenharmony_cistruct btrfs_block_rsv *btrfs_use_block_rsv(struct btrfs_trans_handle *trans, 47862306a36Sopenharmony_ci struct btrfs_root *root, 47962306a36Sopenharmony_ci u32 blocksize) 48062306a36Sopenharmony_ci{ 48162306a36Sopenharmony_ci struct btrfs_fs_info *fs_info = root->fs_info; 48262306a36Sopenharmony_ci struct btrfs_block_rsv *block_rsv; 48362306a36Sopenharmony_ci struct btrfs_block_rsv *global_rsv = &fs_info->global_block_rsv; 48462306a36Sopenharmony_ci int ret; 48562306a36Sopenharmony_ci bool global_updated = false; 48662306a36Sopenharmony_ci 48762306a36Sopenharmony_ci block_rsv = get_block_rsv(trans, root); 48862306a36Sopenharmony_ci 48962306a36Sopenharmony_ci if (unlikely(btrfs_block_rsv_size(block_rsv) == 0)) 49062306a36Sopenharmony_ci goto try_reserve; 49162306a36Sopenharmony_ciagain: 49262306a36Sopenharmony_ci ret = btrfs_block_rsv_use_bytes(block_rsv, blocksize); 49362306a36Sopenharmony_ci if (!ret) 49462306a36Sopenharmony_ci return block_rsv; 49562306a36Sopenharmony_ci 49662306a36Sopenharmony_ci if (block_rsv->failfast) 49762306a36Sopenharmony_ci return ERR_PTR(ret); 49862306a36Sopenharmony_ci 49962306a36Sopenharmony_ci if (block_rsv->type == BTRFS_BLOCK_RSV_GLOBAL && !global_updated) { 50062306a36Sopenharmony_ci global_updated = true; 50162306a36Sopenharmony_ci btrfs_update_global_block_rsv(fs_info); 50262306a36Sopenharmony_ci goto again; 50362306a36Sopenharmony_ci } 50462306a36Sopenharmony_ci 50562306a36Sopenharmony_ci /* 50662306a36Sopenharmony_ci * The global reserve still exists to save us from ourselves, so don't 50762306a36Sopenharmony_ci * warn_on if we are short on our delayed refs reserve. 50862306a36Sopenharmony_ci */ 50962306a36Sopenharmony_ci if (block_rsv->type != BTRFS_BLOCK_RSV_DELREFS && 51062306a36Sopenharmony_ci btrfs_test_opt(fs_info, ENOSPC_DEBUG)) { 51162306a36Sopenharmony_ci static DEFINE_RATELIMIT_STATE(_rs, 51262306a36Sopenharmony_ci DEFAULT_RATELIMIT_INTERVAL * 10, 51362306a36Sopenharmony_ci /*DEFAULT_RATELIMIT_BURST*/ 1); 51462306a36Sopenharmony_ci if (__ratelimit(&_rs)) 51562306a36Sopenharmony_ci WARN(1, KERN_DEBUG 51662306a36Sopenharmony_ci "BTRFS: block rsv %d returned %d\n", 51762306a36Sopenharmony_ci block_rsv->type, ret); 51862306a36Sopenharmony_ci } 51962306a36Sopenharmony_citry_reserve: 52062306a36Sopenharmony_ci ret = btrfs_reserve_metadata_bytes(fs_info, block_rsv, blocksize, 52162306a36Sopenharmony_ci BTRFS_RESERVE_NO_FLUSH); 52262306a36Sopenharmony_ci if (!ret) 52362306a36Sopenharmony_ci return block_rsv; 52462306a36Sopenharmony_ci /* 52562306a36Sopenharmony_ci * If we couldn't reserve metadata bytes try and use some from 52662306a36Sopenharmony_ci * the global reserve if its space type is the same as the global 52762306a36Sopenharmony_ci * reservation. 52862306a36Sopenharmony_ci */ 52962306a36Sopenharmony_ci if (block_rsv->type != BTRFS_BLOCK_RSV_GLOBAL && 53062306a36Sopenharmony_ci block_rsv->space_info == global_rsv->space_info) { 53162306a36Sopenharmony_ci ret = btrfs_block_rsv_use_bytes(global_rsv, blocksize); 53262306a36Sopenharmony_ci if (!ret) 53362306a36Sopenharmony_ci return global_rsv; 53462306a36Sopenharmony_ci } 53562306a36Sopenharmony_ci 53662306a36Sopenharmony_ci /* 53762306a36Sopenharmony_ci * All hope is lost, but of course our reservations are overly 53862306a36Sopenharmony_ci * pessimistic, so instead of possibly having an ENOSPC abort here, try 53962306a36Sopenharmony_ci * one last time to force a reservation if there's enough actual space 54062306a36Sopenharmony_ci * on disk to make the reservation. 54162306a36Sopenharmony_ci */ 54262306a36Sopenharmony_ci ret = btrfs_reserve_metadata_bytes(fs_info, block_rsv, blocksize, 54362306a36Sopenharmony_ci BTRFS_RESERVE_FLUSH_EMERGENCY); 54462306a36Sopenharmony_ci if (!ret) 54562306a36Sopenharmony_ci return block_rsv; 54662306a36Sopenharmony_ci 54762306a36Sopenharmony_ci return ERR_PTR(ret); 54862306a36Sopenharmony_ci} 54962306a36Sopenharmony_ci 55062306a36Sopenharmony_ciint btrfs_check_trunc_cache_free_space(struct btrfs_fs_info *fs_info, 55162306a36Sopenharmony_ci struct btrfs_block_rsv *rsv) 55262306a36Sopenharmony_ci{ 55362306a36Sopenharmony_ci u64 needed_bytes; 55462306a36Sopenharmony_ci int ret; 55562306a36Sopenharmony_ci 55662306a36Sopenharmony_ci /* 1 for slack space, 1 for updating the inode */ 55762306a36Sopenharmony_ci needed_bytes = btrfs_calc_insert_metadata_size(fs_info, 1) + 55862306a36Sopenharmony_ci btrfs_calc_metadata_size(fs_info, 1); 55962306a36Sopenharmony_ci 56062306a36Sopenharmony_ci spin_lock(&rsv->lock); 56162306a36Sopenharmony_ci if (rsv->reserved < needed_bytes) 56262306a36Sopenharmony_ci ret = -ENOSPC; 56362306a36Sopenharmony_ci else 56462306a36Sopenharmony_ci ret = 0; 56562306a36Sopenharmony_ci spin_unlock(&rsv->lock); 56662306a36Sopenharmony_ci return ret; 56762306a36Sopenharmony_ci} 568