162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-only 262306a36Sopenharmony_ci/* 362306a36Sopenharmony_ci * Copyright (C) 2011-2012 Red Hat, Inc. 462306a36Sopenharmony_ci * 562306a36Sopenharmony_ci * This file is released under the GPL. 662306a36Sopenharmony_ci */ 762306a36Sopenharmony_ci 862306a36Sopenharmony_ci#include "dm-thin-metadata.h" 962306a36Sopenharmony_ci#include "persistent-data/dm-btree.h" 1062306a36Sopenharmony_ci#include "persistent-data/dm-space-map.h" 1162306a36Sopenharmony_ci#include "persistent-data/dm-space-map-disk.h" 1262306a36Sopenharmony_ci#include "persistent-data/dm-transaction-manager.h" 1362306a36Sopenharmony_ci 1462306a36Sopenharmony_ci#include <linux/list.h> 1562306a36Sopenharmony_ci#include <linux/device-mapper.h> 1662306a36Sopenharmony_ci#include <linux/workqueue.h> 1762306a36Sopenharmony_ci 1862306a36Sopenharmony_ci/* 1962306a36Sopenharmony_ci *-------------------------------------------------------------------------- 2062306a36Sopenharmony_ci * As far as the metadata goes, there is: 2162306a36Sopenharmony_ci * 2262306a36Sopenharmony_ci * - A superblock in block zero, taking up fewer than 512 bytes for 2362306a36Sopenharmony_ci * atomic writes. 2462306a36Sopenharmony_ci * 2562306a36Sopenharmony_ci * - A space map managing the metadata blocks. 2662306a36Sopenharmony_ci * 2762306a36Sopenharmony_ci * - A space map managing the data blocks. 2862306a36Sopenharmony_ci * 2962306a36Sopenharmony_ci * - A btree mapping our internal thin dev ids onto struct disk_device_details. 3062306a36Sopenharmony_ci * 3162306a36Sopenharmony_ci * - A hierarchical btree, with 2 levels which effectively maps (thin 3262306a36Sopenharmony_ci * dev id, virtual block) -> block_time. Block time is a 64-bit 3362306a36Sopenharmony_ci * field holding the time in the low 24 bits, and block in the top 40 3462306a36Sopenharmony_ci * bits. 3562306a36Sopenharmony_ci * 3662306a36Sopenharmony_ci * BTrees consist solely of btree_nodes, that fill a block. Some are 3762306a36Sopenharmony_ci * internal nodes, as such their values are a __le64 pointing to other 3862306a36Sopenharmony_ci * nodes. Leaf nodes can store data of any reasonable size (ie. much 3962306a36Sopenharmony_ci * smaller than the block size). The nodes consist of the header, 4062306a36Sopenharmony_ci * followed by an array of keys, followed by an array of values. We have 4162306a36Sopenharmony_ci * to binary search on the keys so they're all held together to help the 4262306a36Sopenharmony_ci * cpu cache. 4362306a36Sopenharmony_ci * 4462306a36Sopenharmony_ci * Space maps have 2 btrees: 4562306a36Sopenharmony_ci * 4662306a36Sopenharmony_ci * - One maps a uint64_t onto a struct index_entry. Which points to a 4762306a36Sopenharmony_ci * bitmap block, and has some details about how many free entries there 4862306a36Sopenharmony_ci * are etc. 4962306a36Sopenharmony_ci * 5062306a36Sopenharmony_ci * - The bitmap blocks have a header (for the checksum). Then the rest 5162306a36Sopenharmony_ci * of the block is pairs of bits. With the meaning being: 5262306a36Sopenharmony_ci * 5362306a36Sopenharmony_ci * 0 - ref count is 0 5462306a36Sopenharmony_ci * 1 - ref count is 1 5562306a36Sopenharmony_ci * 2 - ref count is 2 5662306a36Sopenharmony_ci * 3 - ref count is higher than 2 5762306a36Sopenharmony_ci * 5862306a36Sopenharmony_ci * - If the count is higher than 2 then the ref count is entered in a 5962306a36Sopenharmony_ci * second btree that directly maps the block_address to a uint32_t ref 6062306a36Sopenharmony_ci * count. 6162306a36Sopenharmony_ci * 6262306a36Sopenharmony_ci * The space map metadata variant doesn't have a bitmaps btree. Instead 6362306a36Sopenharmony_ci * it has one single blocks worth of index_entries. This avoids 6462306a36Sopenharmony_ci * recursive issues with the bitmap btree needing to allocate space in 6562306a36Sopenharmony_ci * order to insert. With a small data block size such as 64k the 6662306a36Sopenharmony_ci * metadata support data devices that are hundreds of terrabytes. 6762306a36Sopenharmony_ci * 6862306a36Sopenharmony_ci * The space maps allocate space linearly from front to back. Space that 6962306a36Sopenharmony_ci * is freed in a transaction is never recycled within that transaction. 7062306a36Sopenharmony_ci * To try and avoid fragmenting _free_ space the allocator always goes 7162306a36Sopenharmony_ci * back and fills in gaps. 7262306a36Sopenharmony_ci * 7362306a36Sopenharmony_ci * All metadata io is in THIN_METADATA_BLOCK_SIZE sized/aligned chunks 7462306a36Sopenharmony_ci * from the block manager. 7562306a36Sopenharmony_ci *-------------------------------------------------------------------------- 7662306a36Sopenharmony_ci */ 7762306a36Sopenharmony_ci 7862306a36Sopenharmony_ci#define DM_MSG_PREFIX "thin metadata" 7962306a36Sopenharmony_ci 8062306a36Sopenharmony_ci#define THIN_SUPERBLOCK_MAGIC 27022010 8162306a36Sopenharmony_ci#define THIN_SUPERBLOCK_LOCATION 0 8262306a36Sopenharmony_ci#define THIN_VERSION 2 8362306a36Sopenharmony_ci#define SECTOR_TO_BLOCK_SHIFT 3 8462306a36Sopenharmony_ci 8562306a36Sopenharmony_ci/* 8662306a36Sopenharmony_ci * For btree insert: 8762306a36Sopenharmony_ci * 3 for btree insert + 8862306a36Sopenharmony_ci * 2 for btree lookup used within space map 8962306a36Sopenharmony_ci * For btree remove: 9062306a36Sopenharmony_ci * 2 for shadow spine + 9162306a36Sopenharmony_ci * 4 for rebalance 3 child node 9262306a36Sopenharmony_ci */ 9362306a36Sopenharmony_ci#define THIN_MAX_CONCURRENT_LOCKS 6 9462306a36Sopenharmony_ci 9562306a36Sopenharmony_ci/* This should be plenty */ 9662306a36Sopenharmony_ci#define SPACE_MAP_ROOT_SIZE 128 9762306a36Sopenharmony_ci 9862306a36Sopenharmony_ci/* 9962306a36Sopenharmony_ci * Little endian on-disk superblock and device details. 10062306a36Sopenharmony_ci */ 10162306a36Sopenharmony_cistruct thin_disk_superblock { 10262306a36Sopenharmony_ci __le32 csum; /* Checksum of superblock except for this field. */ 10362306a36Sopenharmony_ci __le32 flags; 10462306a36Sopenharmony_ci __le64 blocknr; /* This block number, dm_block_t. */ 10562306a36Sopenharmony_ci 10662306a36Sopenharmony_ci __u8 uuid[16]; 10762306a36Sopenharmony_ci __le64 magic; 10862306a36Sopenharmony_ci __le32 version; 10962306a36Sopenharmony_ci __le32 time; 11062306a36Sopenharmony_ci 11162306a36Sopenharmony_ci __le64 trans_id; 11262306a36Sopenharmony_ci 11362306a36Sopenharmony_ci /* 11462306a36Sopenharmony_ci * Root held by userspace transactions. 11562306a36Sopenharmony_ci */ 11662306a36Sopenharmony_ci __le64 held_root; 11762306a36Sopenharmony_ci 11862306a36Sopenharmony_ci __u8 data_space_map_root[SPACE_MAP_ROOT_SIZE]; 11962306a36Sopenharmony_ci __u8 metadata_space_map_root[SPACE_MAP_ROOT_SIZE]; 12062306a36Sopenharmony_ci 12162306a36Sopenharmony_ci /* 12262306a36Sopenharmony_ci * 2-level btree mapping (dev_id, (dev block, time)) -> data block 12362306a36Sopenharmony_ci */ 12462306a36Sopenharmony_ci __le64 data_mapping_root; 12562306a36Sopenharmony_ci 12662306a36Sopenharmony_ci /* 12762306a36Sopenharmony_ci * Device detail root mapping dev_id -> device_details 12862306a36Sopenharmony_ci */ 12962306a36Sopenharmony_ci __le64 device_details_root; 13062306a36Sopenharmony_ci 13162306a36Sopenharmony_ci __le32 data_block_size; /* In 512-byte sectors. */ 13262306a36Sopenharmony_ci 13362306a36Sopenharmony_ci __le32 metadata_block_size; /* In 512-byte sectors. */ 13462306a36Sopenharmony_ci __le64 metadata_nr_blocks; 13562306a36Sopenharmony_ci 13662306a36Sopenharmony_ci __le32 compat_flags; 13762306a36Sopenharmony_ci __le32 compat_ro_flags; 13862306a36Sopenharmony_ci __le32 incompat_flags; 13962306a36Sopenharmony_ci} __packed; 14062306a36Sopenharmony_ci 14162306a36Sopenharmony_cistruct disk_device_details { 14262306a36Sopenharmony_ci __le64 mapped_blocks; 14362306a36Sopenharmony_ci __le64 transaction_id; /* When created. */ 14462306a36Sopenharmony_ci __le32 creation_time; 14562306a36Sopenharmony_ci __le32 snapshotted_time; 14662306a36Sopenharmony_ci} __packed; 14762306a36Sopenharmony_ci 14862306a36Sopenharmony_cistruct dm_pool_metadata { 14962306a36Sopenharmony_ci struct hlist_node hash; 15062306a36Sopenharmony_ci 15162306a36Sopenharmony_ci struct block_device *bdev; 15262306a36Sopenharmony_ci struct dm_block_manager *bm; 15362306a36Sopenharmony_ci struct dm_space_map *metadata_sm; 15462306a36Sopenharmony_ci struct dm_space_map *data_sm; 15562306a36Sopenharmony_ci struct dm_transaction_manager *tm; 15662306a36Sopenharmony_ci struct dm_transaction_manager *nb_tm; 15762306a36Sopenharmony_ci 15862306a36Sopenharmony_ci /* 15962306a36Sopenharmony_ci * Two-level btree. 16062306a36Sopenharmony_ci * First level holds thin_dev_t. 16162306a36Sopenharmony_ci * Second level holds mappings. 16262306a36Sopenharmony_ci */ 16362306a36Sopenharmony_ci struct dm_btree_info info; 16462306a36Sopenharmony_ci 16562306a36Sopenharmony_ci /* 16662306a36Sopenharmony_ci * Non-blocking version of the above. 16762306a36Sopenharmony_ci */ 16862306a36Sopenharmony_ci struct dm_btree_info nb_info; 16962306a36Sopenharmony_ci 17062306a36Sopenharmony_ci /* 17162306a36Sopenharmony_ci * Just the top level for deleting whole devices. 17262306a36Sopenharmony_ci */ 17362306a36Sopenharmony_ci struct dm_btree_info tl_info; 17462306a36Sopenharmony_ci 17562306a36Sopenharmony_ci /* 17662306a36Sopenharmony_ci * Just the bottom level for creating new devices. 17762306a36Sopenharmony_ci */ 17862306a36Sopenharmony_ci struct dm_btree_info bl_info; 17962306a36Sopenharmony_ci 18062306a36Sopenharmony_ci /* 18162306a36Sopenharmony_ci * Describes the device details btree. 18262306a36Sopenharmony_ci */ 18362306a36Sopenharmony_ci struct dm_btree_info details_info; 18462306a36Sopenharmony_ci 18562306a36Sopenharmony_ci struct rw_semaphore root_lock; 18662306a36Sopenharmony_ci uint32_t time; 18762306a36Sopenharmony_ci dm_block_t root; 18862306a36Sopenharmony_ci dm_block_t details_root; 18962306a36Sopenharmony_ci struct list_head thin_devices; 19062306a36Sopenharmony_ci uint64_t trans_id; 19162306a36Sopenharmony_ci unsigned long flags; 19262306a36Sopenharmony_ci sector_t data_block_size; 19362306a36Sopenharmony_ci 19462306a36Sopenharmony_ci /* 19562306a36Sopenharmony_ci * Pre-commit callback. 19662306a36Sopenharmony_ci * 19762306a36Sopenharmony_ci * This allows the thin provisioning target to run a callback before 19862306a36Sopenharmony_ci * the metadata are committed. 19962306a36Sopenharmony_ci */ 20062306a36Sopenharmony_ci dm_pool_pre_commit_fn pre_commit_fn; 20162306a36Sopenharmony_ci void *pre_commit_context; 20262306a36Sopenharmony_ci 20362306a36Sopenharmony_ci /* 20462306a36Sopenharmony_ci * We reserve a section of the metadata for commit overhead. 20562306a36Sopenharmony_ci * All reported space does *not* include this. 20662306a36Sopenharmony_ci */ 20762306a36Sopenharmony_ci dm_block_t metadata_reserve; 20862306a36Sopenharmony_ci 20962306a36Sopenharmony_ci /* 21062306a36Sopenharmony_ci * Set if a transaction has to be aborted but the attempt to roll back 21162306a36Sopenharmony_ci * to the previous (good) transaction failed. The only pool metadata 21262306a36Sopenharmony_ci * operation possible in this state is the closing of the device. 21362306a36Sopenharmony_ci */ 21462306a36Sopenharmony_ci bool fail_io:1; 21562306a36Sopenharmony_ci 21662306a36Sopenharmony_ci /* 21762306a36Sopenharmony_ci * Set once a thin-pool has been accessed through one of the interfaces 21862306a36Sopenharmony_ci * that imply the pool is in-service (e.g. thin devices created/deleted, 21962306a36Sopenharmony_ci * thin-pool message, metadata snapshots, etc). 22062306a36Sopenharmony_ci */ 22162306a36Sopenharmony_ci bool in_service:1; 22262306a36Sopenharmony_ci 22362306a36Sopenharmony_ci /* 22462306a36Sopenharmony_ci * Reading the space map roots can fail, so we read it into these 22562306a36Sopenharmony_ci * buffers before the superblock is locked and updated. 22662306a36Sopenharmony_ci */ 22762306a36Sopenharmony_ci __u8 data_space_map_root[SPACE_MAP_ROOT_SIZE]; 22862306a36Sopenharmony_ci __u8 metadata_space_map_root[SPACE_MAP_ROOT_SIZE]; 22962306a36Sopenharmony_ci}; 23062306a36Sopenharmony_ci 23162306a36Sopenharmony_cistruct dm_thin_device { 23262306a36Sopenharmony_ci struct list_head list; 23362306a36Sopenharmony_ci struct dm_pool_metadata *pmd; 23462306a36Sopenharmony_ci dm_thin_id id; 23562306a36Sopenharmony_ci 23662306a36Sopenharmony_ci int open_count; 23762306a36Sopenharmony_ci bool changed:1; 23862306a36Sopenharmony_ci bool aborted_with_changes:1; 23962306a36Sopenharmony_ci uint64_t mapped_blocks; 24062306a36Sopenharmony_ci uint64_t transaction_id; 24162306a36Sopenharmony_ci uint32_t creation_time; 24262306a36Sopenharmony_ci uint32_t snapshotted_time; 24362306a36Sopenharmony_ci}; 24462306a36Sopenharmony_ci 24562306a36Sopenharmony_ci/* 24662306a36Sopenharmony_ci *-------------------------------------------------------------- 24762306a36Sopenharmony_ci * superblock validator 24862306a36Sopenharmony_ci *-------------------------------------------------------------- 24962306a36Sopenharmony_ci */ 25062306a36Sopenharmony_ci#define SUPERBLOCK_CSUM_XOR 160774 25162306a36Sopenharmony_ci 25262306a36Sopenharmony_cistatic void sb_prepare_for_write(struct dm_block_validator *v, 25362306a36Sopenharmony_ci struct dm_block *b, 25462306a36Sopenharmony_ci size_t block_size) 25562306a36Sopenharmony_ci{ 25662306a36Sopenharmony_ci struct thin_disk_superblock *disk_super = dm_block_data(b); 25762306a36Sopenharmony_ci 25862306a36Sopenharmony_ci disk_super->blocknr = cpu_to_le64(dm_block_location(b)); 25962306a36Sopenharmony_ci disk_super->csum = cpu_to_le32(dm_bm_checksum(&disk_super->flags, 26062306a36Sopenharmony_ci block_size - sizeof(__le32), 26162306a36Sopenharmony_ci SUPERBLOCK_CSUM_XOR)); 26262306a36Sopenharmony_ci} 26362306a36Sopenharmony_ci 26462306a36Sopenharmony_cistatic int sb_check(struct dm_block_validator *v, 26562306a36Sopenharmony_ci struct dm_block *b, 26662306a36Sopenharmony_ci size_t block_size) 26762306a36Sopenharmony_ci{ 26862306a36Sopenharmony_ci struct thin_disk_superblock *disk_super = dm_block_data(b); 26962306a36Sopenharmony_ci __le32 csum_le; 27062306a36Sopenharmony_ci 27162306a36Sopenharmony_ci if (dm_block_location(b) != le64_to_cpu(disk_super->blocknr)) { 27262306a36Sopenharmony_ci DMERR("%s failed: blocknr %llu: wanted %llu", 27362306a36Sopenharmony_ci __func__, le64_to_cpu(disk_super->blocknr), 27462306a36Sopenharmony_ci (unsigned long long)dm_block_location(b)); 27562306a36Sopenharmony_ci return -ENOTBLK; 27662306a36Sopenharmony_ci } 27762306a36Sopenharmony_ci 27862306a36Sopenharmony_ci if (le64_to_cpu(disk_super->magic) != THIN_SUPERBLOCK_MAGIC) { 27962306a36Sopenharmony_ci DMERR("%s failed: magic %llu: wanted %llu", 28062306a36Sopenharmony_ci __func__, le64_to_cpu(disk_super->magic), 28162306a36Sopenharmony_ci (unsigned long long)THIN_SUPERBLOCK_MAGIC); 28262306a36Sopenharmony_ci return -EILSEQ; 28362306a36Sopenharmony_ci } 28462306a36Sopenharmony_ci 28562306a36Sopenharmony_ci csum_le = cpu_to_le32(dm_bm_checksum(&disk_super->flags, 28662306a36Sopenharmony_ci block_size - sizeof(__le32), 28762306a36Sopenharmony_ci SUPERBLOCK_CSUM_XOR)); 28862306a36Sopenharmony_ci if (csum_le != disk_super->csum) { 28962306a36Sopenharmony_ci DMERR("%s failed: csum %u: wanted %u", 29062306a36Sopenharmony_ci __func__, le32_to_cpu(csum_le), le32_to_cpu(disk_super->csum)); 29162306a36Sopenharmony_ci return -EILSEQ; 29262306a36Sopenharmony_ci } 29362306a36Sopenharmony_ci 29462306a36Sopenharmony_ci return 0; 29562306a36Sopenharmony_ci} 29662306a36Sopenharmony_ci 29762306a36Sopenharmony_cistatic struct dm_block_validator sb_validator = { 29862306a36Sopenharmony_ci .name = "superblock", 29962306a36Sopenharmony_ci .prepare_for_write = sb_prepare_for_write, 30062306a36Sopenharmony_ci .check = sb_check 30162306a36Sopenharmony_ci}; 30262306a36Sopenharmony_ci 30362306a36Sopenharmony_ci/* 30462306a36Sopenharmony_ci *-------------------------------------------------------------- 30562306a36Sopenharmony_ci * Methods for the btree value types 30662306a36Sopenharmony_ci *-------------------------------------------------------------- 30762306a36Sopenharmony_ci */ 30862306a36Sopenharmony_cistatic uint64_t pack_block_time(dm_block_t b, uint32_t t) 30962306a36Sopenharmony_ci{ 31062306a36Sopenharmony_ci return (b << 24) | t; 31162306a36Sopenharmony_ci} 31262306a36Sopenharmony_ci 31362306a36Sopenharmony_cistatic void unpack_block_time(uint64_t v, dm_block_t *b, uint32_t *t) 31462306a36Sopenharmony_ci{ 31562306a36Sopenharmony_ci *b = v >> 24; 31662306a36Sopenharmony_ci *t = v & ((1 << 24) - 1); 31762306a36Sopenharmony_ci} 31862306a36Sopenharmony_ci 31962306a36Sopenharmony_ci/* 32062306a36Sopenharmony_ci * It's more efficient to call dm_sm_{inc,dec}_blocks as few times as 32162306a36Sopenharmony_ci * possible. 'with_runs' reads contiguous runs of blocks, and calls the 32262306a36Sopenharmony_ci * given sm function. 32362306a36Sopenharmony_ci */ 32462306a36Sopenharmony_citypedef int (*run_fn)(struct dm_space_map *, dm_block_t, dm_block_t); 32562306a36Sopenharmony_ci 32662306a36Sopenharmony_cistatic void with_runs(struct dm_space_map *sm, const __le64 *value_le, unsigned int count, run_fn fn) 32762306a36Sopenharmony_ci{ 32862306a36Sopenharmony_ci uint64_t b, begin, end; 32962306a36Sopenharmony_ci uint32_t t; 33062306a36Sopenharmony_ci bool in_run = false; 33162306a36Sopenharmony_ci unsigned int i; 33262306a36Sopenharmony_ci 33362306a36Sopenharmony_ci for (i = 0; i < count; i++, value_le++) { 33462306a36Sopenharmony_ci /* We know value_le is 8 byte aligned */ 33562306a36Sopenharmony_ci unpack_block_time(le64_to_cpu(*value_le), &b, &t); 33662306a36Sopenharmony_ci 33762306a36Sopenharmony_ci if (in_run) { 33862306a36Sopenharmony_ci if (b == end) { 33962306a36Sopenharmony_ci end++; 34062306a36Sopenharmony_ci } else { 34162306a36Sopenharmony_ci fn(sm, begin, end); 34262306a36Sopenharmony_ci begin = b; 34362306a36Sopenharmony_ci end = b + 1; 34462306a36Sopenharmony_ci } 34562306a36Sopenharmony_ci } else { 34662306a36Sopenharmony_ci in_run = true; 34762306a36Sopenharmony_ci begin = b; 34862306a36Sopenharmony_ci end = b + 1; 34962306a36Sopenharmony_ci } 35062306a36Sopenharmony_ci } 35162306a36Sopenharmony_ci 35262306a36Sopenharmony_ci if (in_run) 35362306a36Sopenharmony_ci fn(sm, begin, end); 35462306a36Sopenharmony_ci} 35562306a36Sopenharmony_ci 35662306a36Sopenharmony_cistatic void data_block_inc(void *context, const void *value_le, unsigned int count) 35762306a36Sopenharmony_ci{ 35862306a36Sopenharmony_ci with_runs((struct dm_space_map *) context, 35962306a36Sopenharmony_ci (const __le64 *) value_le, count, dm_sm_inc_blocks); 36062306a36Sopenharmony_ci} 36162306a36Sopenharmony_ci 36262306a36Sopenharmony_cistatic void data_block_dec(void *context, const void *value_le, unsigned int count) 36362306a36Sopenharmony_ci{ 36462306a36Sopenharmony_ci with_runs((struct dm_space_map *) context, 36562306a36Sopenharmony_ci (const __le64 *) value_le, count, dm_sm_dec_blocks); 36662306a36Sopenharmony_ci} 36762306a36Sopenharmony_ci 36862306a36Sopenharmony_cistatic int data_block_equal(void *context, const void *value1_le, const void *value2_le) 36962306a36Sopenharmony_ci{ 37062306a36Sopenharmony_ci __le64 v1_le, v2_le; 37162306a36Sopenharmony_ci uint64_t b1, b2; 37262306a36Sopenharmony_ci uint32_t t; 37362306a36Sopenharmony_ci 37462306a36Sopenharmony_ci memcpy(&v1_le, value1_le, sizeof(v1_le)); 37562306a36Sopenharmony_ci memcpy(&v2_le, value2_le, sizeof(v2_le)); 37662306a36Sopenharmony_ci unpack_block_time(le64_to_cpu(v1_le), &b1, &t); 37762306a36Sopenharmony_ci unpack_block_time(le64_to_cpu(v2_le), &b2, &t); 37862306a36Sopenharmony_ci 37962306a36Sopenharmony_ci return b1 == b2; 38062306a36Sopenharmony_ci} 38162306a36Sopenharmony_ci 38262306a36Sopenharmony_cistatic void subtree_inc(void *context, const void *value, unsigned int count) 38362306a36Sopenharmony_ci{ 38462306a36Sopenharmony_ci struct dm_btree_info *info = context; 38562306a36Sopenharmony_ci const __le64 *root_le = value; 38662306a36Sopenharmony_ci unsigned int i; 38762306a36Sopenharmony_ci 38862306a36Sopenharmony_ci for (i = 0; i < count; i++, root_le++) 38962306a36Sopenharmony_ci dm_tm_inc(info->tm, le64_to_cpu(*root_le)); 39062306a36Sopenharmony_ci} 39162306a36Sopenharmony_ci 39262306a36Sopenharmony_cistatic void subtree_dec(void *context, const void *value, unsigned int count) 39362306a36Sopenharmony_ci{ 39462306a36Sopenharmony_ci struct dm_btree_info *info = context; 39562306a36Sopenharmony_ci const __le64 *root_le = value; 39662306a36Sopenharmony_ci unsigned int i; 39762306a36Sopenharmony_ci 39862306a36Sopenharmony_ci for (i = 0; i < count; i++, root_le++) 39962306a36Sopenharmony_ci if (dm_btree_del(info, le64_to_cpu(*root_le))) 40062306a36Sopenharmony_ci DMERR("btree delete failed"); 40162306a36Sopenharmony_ci} 40262306a36Sopenharmony_ci 40362306a36Sopenharmony_cistatic int subtree_equal(void *context, const void *value1_le, const void *value2_le) 40462306a36Sopenharmony_ci{ 40562306a36Sopenharmony_ci __le64 v1_le, v2_le; 40662306a36Sopenharmony_ci 40762306a36Sopenharmony_ci memcpy(&v1_le, value1_le, sizeof(v1_le)); 40862306a36Sopenharmony_ci memcpy(&v2_le, value2_le, sizeof(v2_le)); 40962306a36Sopenharmony_ci 41062306a36Sopenharmony_ci return v1_le == v2_le; 41162306a36Sopenharmony_ci} 41262306a36Sopenharmony_ci 41362306a36Sopenharmony_ci/*----------------------------------------------------------------*/ 41462306a36Sopenharmony_ci 41562306a36Sopenharmony_ci/* 41662306a36Sopenharmony_ci * Variant that is used for in-core only changes or code that 41762306a36Sopenharmony_ci * shouldn't put the pool in service on its own (e.g. commit). 41862306a36Sopenharmony_ci */ 41962306a36Sopenharmony_cistatic inline void pmd_write_lock_in_core(struct dm_pool_metadata *pmd) 42062306a36Sopenharmony_ci __acquires(pmd->root_lock) 42162306a36Sopenharmony_ci{ 42262306a36Sopenharmony_ci down_write(&pmd->root_lock); 42362306a36Sopenharmony_ci} 42462306a36Sopenharmony_ci 42562306a36Sopenharmony_cistatic inline void pmd_write_lock(struct dm_pool_metadata *pmd) 42662306a36Sopenharmony_ci{ 42762306a36Sopenharmony_ci pmd_write_lock_in_core(pmd); 42862306a36Sopenharmony_ci if (unlikely(!pmd->in_service)) 42962306a36Sopenharmony_ci pmd->in_service = true; 43062306a36Sopenharmony_ci} 43162306a36Sopenharmony_ci 43262306a36Sopenharmony_cistatic inline void pmd_write_unlock(struct dm_pool_metadata *pmd) 43362306a36Sopenharmony_ci __releases(pmd->root_lock) 43462306a36Sopenharmony_ci{ 43562306a36Sopenharmony_ci up_write(&pmd->root_lock); 43662306a36Sopenharmony_ci} 43762306a36Sopenharmony_ci 43862306a36Sopenharmony_ci/*----------------------------------------------------------------*/ 43962306a36Sopenharmony_ci 44062306a36Sopenharmony_cistatic int superblock_lock_zero(struct dm_pool_metadata *pmd, 44162306a36Sopenharmony_ci struct dm_block **sblock) 44262306a36Sopenharmony_ci{ 44362306a36Sopenharmony_ci return dm_bm_write_lock_zero(pmd->bm, THIN_SUPERBLOCK_LOCATION, 44462306a36Sopenharmony_ci &sb_validator, sblock); 44562306a36Sopenharmony_ci} 44662306a36Sopenharmony_ci 44762306a36Sopenharmony_cistatic int superblock_lock(struct dm_pool_metadata *pmd, 44862306a36Sopenharmony_ci struct dm_block **sblock) 44962306a36Sopenharmony_ci{ 45062306a36Sopenharmony_ci return dm_bm_write_lock(pmd->bm, THIN_SUPERBLOCK_LOCATION, 45162306a36Sopenharmony_ci &sb_validator, sblock); 45262306a36Sopenharmony_ci} 45362306a36Sopenharmony_ci 45462306a36Sopenharmony_cistatic int __superblock_all_zeroes(struct dm_block_manager *bm, int *result) 45562306a36Sopenharmony_ci{ 45662306a36Sopenharmony_ci int r; 45762306a36Sopenharmony_ci unsigned int i; 45862306a36Sopenharmony_ci struct dm_block *b; 45962306a36Sopenharmony_ci __le64 *data_le, zero = cpu_to_le64(0); 46062306a36Sopenharmony_ci unsigned int block_size = dm_bm_block_size(bm) / sizeof(__le64); 46162306a36Sopenharmony_ci 46262306a36Sopenharmony_ci /* 46362306a36Sopenharmony_ci * We can't use a validator here - it may be all zeroes. 46462306a36Sopenharmony_ci */ 46562306a36Sopenharmony_ci r = dm_bm_read_lock(bm, THIN_SUPERBLOCK_LOCATION, NULL, &b); 46662306a36Sopenharmony_ci if (r) 46762306a36Sopenharmony_ci return r; 46862306a36Sopenharmony_ci 46962306a36Sopenharmony_ci data_le = dm_block_data(b); 47062306a36Sopenharmony_ci *result = 1; 47162306a36Sopenharmony_ci for (i = 0; i < block_size; i++) { 47262306a36Sopenharmony_ci if (data_le[i] != zero) { 47362306a36Sopenharmony_ci *result = 0; 47462306a36Sopenharmony_ci break; 47562306a36Sopenharmony_ci } 47662306a36Sopenharmony_ci } 47762306a36Sopenharmony_ci 47862306a36Sopenharmony_ci dm_bm_unlock(b); 47962306a36Sopenharmony_ci 48062306a36Sopenharmony_ci return 0; 48162306a36Sopenharmony_ci} 48262306a36Sopenharmony_ci 48362306a36Sopenharmony_cistatic void __setup_btree_details(struct dm_pool_metadata *pmd) 48462306a36Sopenharmony_ci{ 48562306a36Sopenharmony_ci pmd->info.tm = pmd->tm; 48662306a36Sopenharmony_ci pmd->info.levels = 2; 48762306a36Sopenharmony_ci pmd->info.value_type.context = pmd->data_sm; 48862306a36Sopenharmony_ci pmd->info.value_type.size = sizeof(__le64); 48962306a36Sopenharmony_ci pmd->info.value_type.inc = data_block_inc; 49062306a36Sopenharmony_ci pmd->info.value_type.dec = data_block_dec; 49162306a36Sopenharmony_ci pmd->info.value_type.equal = data_block_equal; 49262306a36Sopenharmony_ci 49362306a36Sopenharmony_ci memcpy(&pmd->nb_info, &pmd->info, sizeof(pmd->nb_info)); 49462306a36Sopenharmony_ci pmd->nb_info.tm = pmd->nb_tm; 49562306a36Sopenharmony_ci 49662306a36Sopenharmony_ci pmd->tl_info.tm = pmd->tm; 49762306a36Sopenharmony_ci pmd->tl_info.levels = 1; 49862306a36Sopenharmony_ci pmd->tl_info.value_type.context = &pmd->bl_info; 49962306a36Sopenharmony_ci pmd->tl_info.value_type.size = sizeof(__le64); 50062306a36Sopenharmony_ci pmd->tl_info.value_type.inc = subtree_inc; 50162306a36Sopenharmony_ci pmd->tl_info.value_type.dec = subtree_dec; 50262306a36Sopenharmony_ci pmd->tl_info.value_type.equal = subtree_equal; 50362306a36Sopenharmony_ci 50462306a36Sopenharmony_ci pmd->bl_info.tm = pmd->tm; 50562306a36Sopenharmony_ci pmd->bl_info.levels = 1; 50662306a36Sopenharmony_ci pmd->bl_info.value_type.context = pmd->data_sm; 50762306a36Sopenharmony_ci pmd->bl_info.value_type.size = sizeof(__le64); 50862306a36Sopenharmony_ci pmd->bl_info.value_type.inc = data_block_inc; 50962306a36Sopenharmony_ci pmd->bl_info.value_type.dec = data_block_dec; 51062306a36Sopenharmony_ci pmd->bl_info.value_type.equal = data_block_equal; 51162306a36Sopenharmony_ci 51262306a36Sopenharmony_ci pmd->details_info.tm = pmd->tm; 51362306a36Sopenharmony_ci pmd->details_info.levels = 1; 51462306a36Sopenharmony_ci pmd->details_info.value_type.context = NULL; 51562306a36Sopenharmony_ci pmd->details_info.value_type.size = sizeof(struct disk_device_details); 51662306a36Sopenharmony_ci pmd->details_info.value_type.inc = NULL; 51762306a36Sopenharmony_ci pmd->details_info.value_type.dec = NULL; 51862306a36Sopenharmony_ci pmd->details_info.value_type.equal = NULL; 51962306a36Sopenharmony_ci} 52062306a36Sopenharmony_ci 52162306a36Sopenharmony_cistatic int save_sm_roots(struct dm_pool_metadata *pmd) 52262306a36Sopenharmony_ci{ 52362306a36Sopenharmony_ci int r; 52462306a36Sopenharmony_ci size_t len; 52562306a36Sopenharmony_ci 52662306a36Sopenharmony_ci r = dm_sm_root_size(pmd->metadata_sm, &len); 52762306a36Sopenharmony_ci if (r < 0) 52862306a36Sopenharmony_ci return r; 52962306a36Sopenharmony_ci 53062306a36Sopenharmony_ci r = dm_sm_copy_root(pmd->metadata_sm, &pmd->metadata_space_map_root, len); 53162306a36Sopenharmony_ci if (r < 0) 53262306a36Sopenharmony_ci return r; 53362306a36Sopenharmony_ci 53462306a36Sopenharmony_ci r = dm_sm_root_size(pmd->data_sm, &len); 53562306a36Sopenharmony_ci if (r < 0) 53662306a36Sopenharmony_ci return r; 53762306a36Sopenharmony_ci 53862306a36Sopenharmony_ci return dm_sm_copy_root(pmd->data_sm, &pmd->data_space_map_root, len); 53962306a36Sopenharmony_ci} 54062306a36Sopenharmony_ci 54162306a36Sopenharmony_cistatic void copy_sm_roots(struct dm_pool_metadata *pmd, 54262306a36Sopenharmony_ci struct thin_disk_superblock *disk) 54362306a36Sopenharmony_ci{ 54462306a36Sopenharmony_ci memcpy(&disk->metadata_space_map_root, 54562306a36Sopenharmony_ci &pmd->metadata_space_map_root, 54662306a36Sopenharmony_ci sizeof(pmd->metadata_space_map_root)); 54762306a36Sopenharmony_ci 54862306a36Sopenharmony_ci memcpy(&disk->data_space_map_root, 54962306a36Sopenharmony_ci &pmd->data_space_map_root, 55062306a36Sopenharmony_ci sizeof(pmd->data_space_map_root)); 55162306a36Sopenharmony_ci} 55262306a36Sopenharmony_ci 55362306a36Sopenharmony_cistatic int __write_initial_superblock(struct dm_pool_metadata *pmd) 55462306a36Sopenharmony_ci{ 55562306a36Sopenharmony_ci int r; 55662306a36Sopenharmony_ci struct dm_block *sblock; 55762306a36Sopenharmony_ci struct thin_disk_superblock *disk_super; 55862306a36Sopenharmony_ci sector_t bdev_size = bdev_nr_sectors(pmd->bdev); 55962306a36Sopenharmony_ci 56062306a36Sopenharmony_ci if (bdev_size > THIN_METADATA_MAX_SECTORS) 56162306a36Sopenharmony_ci bdev_size = THIN_METADATA_MAX_SECTORS; 56262306a36Sopenharmony_ci 56362306a36Sopenharmony_ci r = dm_sm_commit(pmd->data_sm); 56462306a36Sopenharmony_ci if (r < 0) 56562306a36Sopenharmony_ci return r; 56662306a36Sopenharmony_ci 56762306a36Sopenharmony_ci r = dm_tm_pre_commit(pmd->tm); 56862306a36Sopenharmony_ci if (r < 0) 56962306a36Sopenharmony_ci return r; 57062306a36Sopenharmony_ci 57162306a36Sopenharmony_ci r = save_sm_roots(pmd); 57262306a36Sopenharmony_ci if (r < 0) 57362306a36Sopenharmony_ci return r; 57462306a36Sopenharmony_ci 57562306a36Sopenharmony_ci r = superblock_lock_zero(pmd, &sblock); 57662306a36Sopenharmony_ci if (r) 57762306a36Sopenharmony_ci return r; 57862306a36Sopenharmony_ci 57962306a36Sopenharmony_ci disk_super = dm_block_data(sblock); 58062306a36Sopenharmony_ci disk_super->flags = 0; 58162306a36Sopenharmony_ci memset(disk_super->uuid, 0, sizeof(disk_super->uuid)); 58262306a36Sopenharmony_ci disk_super->magic = cpu_to_le64(THIN_SUPERBLOCK_MAGIC); 58362306a36Sopenharmony_ci disk_super->version = cpu_to_le32(THIN_VERSION); 58462306a36Sopenharmony_ci disk_super->time = 0; 58562306a36Sopenharmony_ci disk_super->trans_id = 0; 58662306a36Sopenharmony_ci disk_super->held_root = 0; 58762306a36Sopenharmony_ci 58862306a36Sopenharmony_ci copy_sm_roots(pmd, disk_super); 58962306a36Sopenharmony_ci 59062306a36Sopenharmony_ci disk_super->data_mapping_root = cpu_to_le64(pmd->root); 59162306a36Sopenharmony_ci disk_super->device_details_root = cpu_to_le64(pmd->details_root); 59262306a36Sopenharmony_ci disk_super->metadata_block_size = cpu_to_le32(THIN_METADATA_BLOCK_SIZE); 59362306a36Sopenharmony_ci disk_super->metadata_nr_blocks = cpu_to_le64(bdev_size >> SECTOR_TO_BLOCK_SHIFT); 59462306a36Sopenharmony_ci disk_super->data_block_size = cpu_to_le32(pmd->data_block_size); 59562306a36Sopenharmony_ci 59662306a36Sopenharmony_ci return dm_tm_commit(pmd->tm, sblock); 59762306a36Sopenharmony_ci} 59862306a36Sopenharmony_ci 59962306a36Sopenharmony_cistatic int __format_metadata(struct dm_pool_metadata *pmd) 60062306a36Sopenharmony_ci{ 60162306a36Sopenharmony_ci int r; 60262306a36Sopenharmony_ci 60362306a36Sopenharmony_ci r = dm_tm_create_with_sm(pmd->bm, THIN_SUPERBLOCK_LOCATION, 60462306a36Sopenharmony_ci &pmd->tm, &pmd->metadata_sm); 60562306a36Sopenharmony_ci if (r < 0) { 60662306a36Sopenharmony_ci pmd->tm = NULL; 60762306a36Sopenharmony_ci pmd->metadata_sm = NULL; 60862306a36Sopenharmony_ci DMERR("tm_create_with_sm failed"); 60962306a36Sopenharmony_ci return r; 61062306a36Sopenharmony_ci } 61162306a36Sopenharmony_ci 61262306a36Sopenharmony_ci pmd->data_sm = dm_sm_disk_create(pmd->tm, 0); 61362306a36Sopenharmony_ci if (IS_ERR(pmd->data_sm)) { 61462306a36Sopenharmony_ci DMERR("sm_disk_create failed"); 61562306a36Sopenharmony_ci r = PTR_ERR(pmd->data_sm); 61662306a36Sopenharmony_ci pmd->data_sm = NULL; 61762306a36Sopenharmony_ci goto bad_cleanup_tm; 61862306a36Sopenharmony_ci } 61962306a36Sopenharmony_ci 62062306a36Sopenharmony_ci pmd->nb_tm = dm_tm_create_non_blocking_clone(pmd->tm); 62162306a36Sopenharmony_ci if (!pmd->nb_tm) { 62262306a36Sopenharmony_ci DMERR("could not create non-blocking clone tm"); 62362306a36Sopenharmony_ci r = -ENOMEM; 62462306a36Sopenharmony_ci goto bad_cleanup_data_sm; 62562306a36Sopenharmony_ci } 62662306a36Sopenharmony_ci 62762306a36Sopenharmony_ci __setup_btree_details(pmd); 62862306a36Sopenharmony_ci 62962306a36Sopenharmony_ci r = dm_btree_empty(&pmd->info, &pmd->root); 63062306a36Sopenharmony_ci if (r < 0) 63162306a36Sopenharmony_ci goto bad_cleanup_nb_tm; 63262306a36Sopenharmony_ci 63362306a36Sopenharmony_ci r = dm_btree_empty(&pmd->details_info, &pmd->details_root); 63462306a36Sopenharmony_ci if (r < 0) { 63562306a36Sopenharmony_ci DMERR("couldn't create devices root"); 63662306a36Sopenharmony_ci goto bad_cleanup_nb_tm; 63762306a36Sopenharmony_ci } 63862306a36Sopenharmony_ci 63962306a36Sopenharmony_ci r = __write_initial_superblock(pmd); 64062306a36Sopenharmony_ci if (r) 64162306a36Sopenharmony_ci goto bad_cleanup_nb_tm; 64262306a36Sopenharmony_ci 64362306a36Sopenharmony_ci return 0; 64462306a36Sopenharmony_ci 64562306a36Sopenharmony_cibad_cleanup_nb_tm: 64662306a36Sopenharmony_ci dm_tm_destroy(pmd->nb_tm); 64762306a36Sopenharmony_ci pmd->nb_tm = NULL; 64862306a36Sopenharmony_cibad_cleanup_data_sm: 64962306a36Sopenharmony_ci dm_sm_destroy(pmd->data_sm); 65062306a36Sopenharmony_ci pmd->data_sm = NULL; 65162306a36Sopenharmony_cibad_cleanup_tm: 65262306a36Sopenharmony_ci dm_tm_destroy(pmd->tm); 65362306a36Sopenharmony_ci pmd->tm = NULL; 65462306a36Sopenharmony_ci dm_sm_destroy(pmd->metadata_sm); 65562306a36Sopenharmony_ci pmd->metadata_sm = NULL; 65662306a36Sopenharmony_ci 65762306a36Sopenharmony_ci return r; 65862306a36Sopenharmony_ci} 65962306a36Sopenharmony_ci 66062306a36Sopenharmony_cistatic int __check_incompat_features(struct thin_disk_superblock *disk_super, 66162306a36Sopenharmony_ci struct dm_pool_metadata *pmd) 66262306a36Sopenharmony_ci{ 66362306a36Sopenharmony_ci uint32_t features; 66462306a36Sopenharmony_ci 66562306a36Sopenharmony_ci features = le32_to_cpu(disk_super->incompat_flags) & ~THIN_FEATURE_INCOMPAT_SUPP; 66662306a36Sopenharmony_ci if (features) { 66762306a36Sopenharmony_ci DMERR("could not access metadata due to unsupported optional features (%lx).", 66862306a36Sopenharmony_ci (unsigned long)features); 66962306a36Sopenharmony_ci return -EINVAL; 67062306a36Sopenharmony_ci } 67162306a36Sopenharmony_ci 67262306a36Sopenharmony_ci /* 67362306a36Sopenharmony_ci * Check for read-only metadata to skip the following RDWR checks. 67462306a36Sopenharmony_ci */ 67562306a36Sopenharmony_ci if (bdev_read_only(pmd->bdev)) 67662306a36Sopenharmony_ci return 0; 67762306a36Sopenharmony_ci 67862306a36Sopenharmony_ci features = le32_to_cpu(disk_super->compat_ro_flags) & ~THIN_FEATURE_COMPAT_RO_SUPP; 67962306a36Sopenharmony_ci if (features) { 68062306a36Sopenharmony_ci DMERR("could not access metadata RDWR due to unsupported optional features (%lx).", 68162306a36Sopenharmony_ci (unsigned long)features); 68262306a36Sopenharmony_ci return -EINVAL; 68362306a36Sopenharmony_ci } 68462306a36Sopenharmony_ci 68562306a36Sopenharmony_ci return 0; 68662306a36Sopenharmony_ci} 68762306a36Sopenharmony_ci 68862306a36Sopenharmony_cistatic int __open_metadata(struct dm_pool_metadata *pmd) 68962306a36Sopenharmony_ci{ 69062306a36Sopenharmony_ci int r; 69162306a36Sopenharmony_ci struct dm_block *sblock; 69262306a36Sopenharmony_ci struct thin_disk_superblock *disk_super; 69362306a36Sopenharmony_ci 69462306a36Sopenharmony_ci r = dm_bm_read_lock(pmd->bm, THIN_SUPERBLOCK_LOCATION, 69562306a36Sopenharmony_ci &sb_validator, &sblock); 69662306a36Sopenharmony_ci if (r < 0) { 69762306a36Sopenharmony_ci DMERR("couldn't read superblock"); 69862306a36Sopenharmony_ci return r; 69962306a36Sopenharmony_ci } 70062306a36Sopenharmony_ci 70162306a36Sopenharmony_ci disk_super = dm_block_data(sblock); 70262306a36Sopenharmony_ci 70362306a36Sopenharmony_ci /* Verify the data block size hasn't changed */ 70462306a36Sopenharmony_ci if (le32_to_cpu(disk_super->data_block_size) != pmd->data_block_size) { 70562306a36Sopenharmony_ci DMERR("changing the data block size (from %u to %llu) is not supported", 70662306a36Sopenharmony_ci le32_to_cpu(disk_super->data_block_size), 70762306a36Sopenharmony_ci (unsigned long long)pmd->data_block_size); 70862306a36Sopenharmony_ci r = -EINVAL; 70962306a36Sopenharmony_ci goto bad_unlock_sblock; 71062306a36Sopenharmony_ci } 71162306a36Sopenharmony_ci 71262306a36Sopenharmony_ci r = __check_incompat_features(disk_super, pmd); 71362306a36Sopenharmony_ci if (r < 0) 71462306a36Sopenharmony_ci goto bad_unlock_sblock; 71562306a36Sopenharmony_ci 71662306a36Sopenharmony_ci r = dm_tm_open_with_sm(pmd->bm, THIN_SUPERBLOCK_LOCATION, 71762306a36Sopenharmony_ci disk_super->metadata_space_map_root, 71862306a36Sopenharmony_ci sizeof(disk_super->metadata_space_map_root), 71962306a36Sopenharmony_ci &pmd->tm, &pmd->metadata_sm); 72062306a36Sopenharmony_ci if (r < 0) { 72162306a36Sopenharmony_ci pmd->tm = NULL; 72262306a36Sopenharmony_ci pmd->metadata_sm = NULL; 72362306a36Sopenharmony_ci DMERR("tm_open_with_sm failed"); 72462306a36Sopenharmony_ci goto bad_unlock_sblock; 72562306a36Sopenharmony_ci } 72662306a36Sopenharmony_ci 72762306a36Sopenharmony_ci pmd->data_sm = dm_sm_disk_open(pmd->tm, disk_super->data_space_map_root, 72862306a36Sopenharmony_ci sizeof(disk_super->data_space_map_root)); 72962306a36Sopenharmony_ci if (IS_ERR(pmd->data_sm)) { 73062306a36Sopenharmony_ci DMERR("sm_disk_open failed"); 73162306a36Sopenharmony_ci r = PTR_ERR(pmd->data_sm); 73262306a36Sopenharmony_ci pmd->data_sm = NULL; 73362306a36Sopenharmony_ci goto bad_cleanup_tm; 73462306a36Sopenharmony_ci } 73562306a36Sopenharmony_ci 73662306a36Sopenharmony_ci pmd->nb_tm = dm_tm_create_non_blocking_clone(pmd->tm); 73762306a36Sopenharmony_ci if (!pmd->nb_tm) { 73862306a36Sopenharmony_ci DMERR("could not create non-blocking clone tm"); 73962306a36Sopenharmony_ci r = -ENOMEM; 74062306a36Sopenharmony_ci goto bad_cleanup_data_sm; 74162306a36Sopenharmony_ci } 74262306a36Sopenharmony_ci 74362306a36Sopenharmony_ci /* 74462306a36Sopenharmony_ci * For pool metadata opening process, root setting is redundant 74562306a36Sopenharmony_ci * because it will be set again in __begin_transaction(). But dm 74662306a36Sopenharmony_ci * pool aborting process really needs to get last transaction's 74762306a36Sopenharmony_ci * root to avoid accessing broken btree. 74862306a36Sopenharmony_ci */ 74962306a36Sopenharmony_ci pmd->root = le64_to_cpu(disk_super->data_mapping_root); 75062306a36Sopenharmony_ci pmd->details_root = le64_to_cpu(disk_super->device_details_root); 75162306a36Sopenharmony_ci 75262306a36Sopenharmony_ci __setup_btree_details(pmd); 75362306a36Sopenharmony_ci dm_bm_unlock(sblock); 75462306a36Sopenharmony_ci 75562306a36Sopenharmony_ci return 0; 75662306a36Sopenharmony_ci 75762306a36Sopenharmony_cibad_cleanup_data_sm: 75862306a36Sopenharmony_ci dm_sm_destroy(pmd->data_sm); 75962306a36Sopenharmony_ci pmd->data_sm = NULL; 76062306a36Sopenharmony_cibad_cleanup_tm: 76162306a36Sopenharmony_ci dm_tm_destroy(pmd->tm); 76262306a36Sopenharmony_ci pmd->tm = NULL; 76362306a36Sopenharmony_ci dm_sm_destroy(pmd->metadata_sm); 76462306a36Sopenharmony_ci pmd->metadata_sm = NULL; 76562306a36Sopenharmony_cibad_unlock_sblock: 76662306a36Sopenharmony_ci dm_bm_unlock(sblock); 76762306a36Sopenharmony_ci 76862306a36Sopenharmony_ci return r; 76962306a36Sopenharmony_ci} 77062306a36Sopenharmony_ci 77162306a36Sopenharmony_cistatic int __open_or_format_metadata(struct dm_pool_metadata *pmd, bool format_device) 77262306a36Sopenharmony_ci{ 77362306a36Sopenharmony_ci int r, unformatted; 77462306a36Sopenharmony_ci 77562306a36Sopenharmony_ci r = __superblock_all_zeroes(pmd->bm, &unformatted); 77662306a36Sopenharmony_ci if (r) 77762306a36Sopenharmony_ci return r; 77862306a36Sopenharmony_ci 77962306a36Sopenharmony_ci if (unformatted) 78062306a36Sopenharmony_ci return format_device ? __format_metadata(pmd) : -EPERM; 78162306a36Sopenharmony_ci 78262306a36Sopenharmony_ci return __open_metadata(pmd); 78362306a36Sopenharmony_ci} 78462306a36Sopenharmony_ci 78562306a36Sopenharmony_cistatic int __create_persistent_data_objects(struct dm_pool_metadata *pmd, bool format_device) 78662306a36Sopenharmony_ci{ 78762306a36Sopenharmony_ci int r; 78862306a36Sopenharmony_ci 78962306a36Sopenharmony_ci pmd->bm = dm_block_manager_create(pmd->bdev, THIN_METADATA_BLOCK_SIZE << SECTOR_SHIFT, 79062306a36Sopenharmony_ci THIN_MAX_CONCURRENT_LOCKS); 79162306a36Sopenharmony_ci if (IS_ERR(pmd->bm)) { 79262306a36Sopenharmony_ci DMERR("could not create block manager"); 79362306a36Sopenharmony_ci r = PTR_ERR(pmd->bm); 79462306a36Sopenharmony_ci pmd->bm = NULL; 79562306a36Sopenharmony_ci return r; 79662306a36Sopenharmony_ci } 79762306a36Sopenharmony_ci 79862306a36Sopenharmony_ci r = __open_or_format_metadata(pmd, format_device); 79962306a36Sopenharmony_ci if (r) { 80062306a36Sopenharmony_ci dm_block_manager_destroy(pmd->bm); 80162306a36Sopenharmony_ci pmd->bm = NULL; 80262306a36Sopenharmony_ci } 80362306a36Sopenharmony_ci 80462306a36Sopenharmony_ci return r; 80562306a36Sopenharmony_ci} 80662306a36Sopenharmony_ci 80762306a36Sopenharmony_cistatic void __destroy_persistent_data_objects(struct dm_pool_metadata *pmd, 80862306a36Sopenharmony_ci bool destroy_bm) 80962306a36Sopenharmony_ci{ 81062306a36Sopenharmony_ci dm_sm_destroy(pmd->data_sm); 81162306a36Sopenharmony_ci pmd->data_sm = NULL; 81262306a36Sopenharmony_ci dm_sm_destroy(pmd->metadata_sm); 81362306a36Sopenharmony_ci pmd->metadata_sm = NULL; 81462306a36Sopenharmony_ci dm_tm_destroy(pmd->nb_tm); 81562306a36Sopenharmony_ci pmd->nb_tm = NULL; 81662306a36Sopenharmony_ci dm_tm_destroy(pmd->tm); 81762306a36Sopenharmony_ci pmd->tm = NULL; 81862306a36Sopenharmony_ci if (destroy_bm) 81962306a36Sopenharmony_ci dm_block_manager_destroy(pmd->bm); 82062306a36Sopenharmony_ci} 82162306a36Sopenharmony_ci 82262306a36Sopenharmony_cistatic int __begin_transaction(struct dm_pool_metadata *pmd) 82362306a36Sopenharmony_ci{ 82462306a36Sopenharmony_ci int r; 82562306a36Sopenharmony_ci struct thin_disk_superblock *disk_super; 82662306a36Sopenharmony_ci struct dm_block *sblock; 82762306a36Sopenharmony_ci 82862306a36Sopenharmony_ci /* 82962306a36Sopenharmony_ci * We re-read the superblock every time. Shouldn't need to do this 83062306a36Sopenharmony_ci * really. 83162306a36Sopenharmony_ci */ 83262306a36Sopenharmony_ci r = dm_bm_read_lock(pmd->bm, THIN_SUPERBLOCK_LOCATION, 83362306a36Sopenharmony_ci &sb_validator, &sblock); 83462306a36Sopenharmony_ci if (r) 83562306a36Sopenharmony_ci return r; 83662306a36Sopenharmony_ci 83762306a36Sopenharmony_ci disk_super = dm_block_data(sblock); 83862306a36Sopenharmony_ci pmd->time = le32_to_cpu(disk_super->time); 83962306a36Sopenharmony_ci pmd->root = le64_to_cpu(disk_super->data_mapping_root); 84062306a36Sopenharmony_ci pmd->details_root = le64_to_cpu(disk_super->device_details_root); 84162306a36Sopenharmony_ci pmd->trans_id = le64_to_cpu(disk_super->trans_id); 84262306a36Sopenharmony_ci pmd->flags = le32_to_cpu(disk_super->flags); 84362306a36Sopenharmony_ci pmd->data_block_size = le32_to_cpu(disk_super->data_block_size); 84462306a36Sopenharmony_ci 84562306a36Sopenharmony_ci dm_bm_unlock(sblock); 84662306a36Sopenharmony_ci return 0; 84762306a36Sopenharmony_ci} 84862306a36Sopenharmony_ci 84962306a36Sopenharmony_cistatic int __write_changed_details(struct dm_pool_metadata *pmd) 85062306a36Sopenharmony_ci{ 85162306a36Sopenharmony_ci int r; 85262306a36Sopenharmony_ci struct dm_thin_device *td, *tmp; 85362306a36Sopenharmony_ci struct disk_device_details details; 85462306a36Sopenharmony_ci uint64_t key; 85562306a36Sopenharmony_ci 85662306a36Sopenharmony_ci list_for_each_entry_safe(td, tmp, &pmd->thin_devices, list) { 85762306a36Sopenharmony_ci if (!td->changed) 85862306a36Sopenharmony_ci continue; 85962306a36Sopenharmony_ci 86062306a36Sopenharmony_ci key = td->id; 86162306a36Sopenharmony_ci 86262306a36Sopenharmony_ci details.mapped_blocks = cpu_to_le64(td->mapped_blocks); 86362306a36Sopenharmony_ci details.transaction_id = cpu_to_le64(td->transaction_id); 86462306a36Sopenharmony_ci details.creation_time = cpu_to_le32(td->creation_time); 86562306a36Sopenharmony_ci details.snapshotted_time = cpu_to_le32(td->snapshotted_time); 86662306a36Sopenharmony_ci __dm_bless_for_disk(&details); 86762306a36Sopenharmony_ci 86862306a36Sopenharmony_ci r = dm_btree_insert(&pmd->details_info, pmd->details_root, 86962306a36Sopenharmony_ci &key, &details, &pmd->details_root); 87062306a36Sopenharmony_ci if (r) 87162306a36Sopenharmony_ci return r; 87262306a36Sopenharmony_ci 87362306a36Sopenharmony_ci if (td->open_count) 87462306a36Sopenharmony_ci td->changed = false; 87562306a36Sopenharmony_ci else { 87662306a36Sopenharmony_ci list_del(&td->list); 87762306a36Sopenharmony_ci kfree(td); 87862306a36Sopenharmony_ci } 87962306a36Sopenharmony_ci } 88062306a36Sopenharmony_ci 88162306a36Sopenharmony_ci return 0; 88262306a36Sopenharmony_ci} 88362306a36Sopenharmony_ci 88462306a36Sopenharmony_cistatic int __commit_transaction(struct dm_pool_metadata *pmd) 88562306a36Sopenharmony_ci{ 88662306a36Sopenharmony_ci int r; 88762306a36Sopenharmony_ci struct thin_disk_superblock *disk_super; 88862306a36Sopenharmony_ci struct dm_block *sblock; 88962306a36Sopenharmony_ci 89062306a36Sopenharmony_ci /* 89162306a36Sopenharmony_ci * We need to know if the thin_disk_superblock exceeds a 512-byte sector. 89262306a36Sopenharmony_ci */ 89362306a36Sopenharmony_ci BUILD_BUG_ON(sizeof(struct thin_disk_superblock) > 512); 89462306a36Sopenharmony_ci BUG_ON(!rwsem_is_locked(&pmd->root_lock)); 89562306a36Sopenharmony_ci 89662306a36Sopenharmony_ci if (unlikely(!pmd->in_service)) 89762306a36Sopenharmony_ci return 0; 89862306a36Sopenharmony_ci 89962306a36Sopenharmony_ci if (pmd->pre_commit_fn) { 90062306a36Sopenharmony_ci r = pmd->pre_commit_fn(pmd->pre_commit_context); 90162306a36Sopenharmony_ci if (r < 0) { 90262306a36Sopenharmony_ci DMERR("pre-commit callback failed"); 90362306a36Sopenharmony_ci return r; 90462306a36Sopenharmony_ci } 90562306a36Sopenharmony_ci } 90662306a36Sopenharmony_ci 90762306a36Sopenharmony_ci r = __write_changed_details(pmd); 90862306a36Sopenharmony_ci if (r < 0) 90962306a36Sopenharmony_ci return r; 91062306a36Sopenharmony_ci 91162306a36Sopenharmony_ci r = dm_sm_commit(pmd->data_sm); 91262306a36Sopenharmony_ci if (r < 0) 91362306a36Sopenharmony_ci return r; 91462306a36Sopenharmony_ci 91562306a36Sopenharmony_ci r = dm_tm_pre_commit(pmd->tm); 91662306a36Sopenharmony_ci if (r < 0) 91762306a36Sopenharmony_ci return r; 91862306a36Sopenharmony_ci 91962306a36Sopenharmony_ci r = save_sm_roots(pmd); 92062306a36Sopenharmony_ci if (r < 0) 92162306a36Sopenharmony_ci return r; 92262306a36Sopenharmony_ci 92362306a36Sopenharmony_ci r = superblock_lock(pmd, &sblock); 92462306a36Sopenharmony_ci if (r) 92562306a36Sopenharmony_ci return r; 92662306a36Sopenharmony_ci 92762306a36Sopenharmony_ci disk_super = dm_block_data(sblock); 92862306a36Sopenharmony_ci disk_super->time = cpu_to_le32(pmd->time); 92962306a36Sopenharmony_ci disk_super->data_mapping_root = cpu_to_le64(pmd->root); 93062306a36Sopenharmony_ci disk_super->device_details_root = cpu_to_le64(pmd->details_root); 93162306a36Sopenharmony_ci disk_super->trans_id = cpu_to_le64(pmd->trans_id); 93262306a36Sopenharmony_ci disk_super->flags = cpu_to_le32(pmd->flags); 93362306a36Sopenharmony_ci 93462306a36Sopenharmony_ci copy_sm_roots(pmd, disk_super); 93562306a36Sopenharmony_ci 93662306a36Sopenharmony_ci return dm_tm_commit(pmd->tm, sblock); 93762306a36Sopenharmony_ci} 93862306a36Sopenharmony_ci 93962306a36Sopenharmony_cistatic void __set_metadata_reserve(struct dm_pool_metadata *pmd) 94062306a36Sopenharmony_ci{ 94162306a36Sopenharmony_ci int r; 94262306a36Sopenharmony_ci dm_block_t total; 94362306a36Sopenharmony_ci dm_block_t max_blocks = 4096; /* 16M */ 94462306a36Sopenharmony_ci 94562306a36Sopenharmony_ci r = dm_sm_get_nr_blocks(pmd->metadata_sm, &total); 94662306a36Sopenharmony_ci if (r) { 94762306a36Sopenharmony_ci DMERR("could not get size of metadata device"); 94862306a36Sopenharmony_ci pmd->metadata_reserve = max_blocks; 94962306a36Sopenharmony_ci } else 95062306a36Sopenharmony_ci pmd->metadata_reserve = min(max_blocks, div_u64(total, 10)); 95162306a36Sopenharmony_ci} 95262306a36Sopenharmony_ci 95362306a36Sopenharmony_cistruct dm_pool_metadata *dm_pool_metadata_open(struct block_device *bdev, 95462306a36Sopenharmony_ci sector_t data_block_size, 95562306a36Sopenharmony_ci bool format_device) 95662306a36Sopenharmony_ci{ 95762306a36Sopenharmony_ci int r; 95862306a36Sopenharmony_ci struct dm_pool_metadata *pmd; 95962306a36Sopenharmony_ci 96062306a36Sopenharmony_ci pmd = kmalloc(sizeof(*pmd), GFP_KERNEL); 96162306a36Sopenharmony_ci if (!pmd) { 96262306a36Sopenharmony_ci DMERR("could not allocate metadata struct"); 96362306a36Sopenharmony_ci return ERR_PTR(-ENOMEM); 96462306a36Sopenharmony_ci } 96562306a36Sopenharmony_ci 96662306a36Sopenharmony_ci init_rwsem(&pmd->root_lock); 96762306a36Sopenharmony_ci pmd->time = 0; 96862306a36Sopenharmony_ci INIT_LIST_HEAD(&pmd->thin_devices); 96962306a36Sopenharmony_ci pmd->fail_io = false; 97062306a36Sopenharmony_ci pmd->in_service = false; 97162306a36Sopenharmony_ci pmd->bdev = bdev; 97262306a36Sopenharmony_ci pmd->data_block_size = data_block_size; 97362306a36Sopenharmony_ci pmd->pre_commit_fn = NULL; 97462306a36Sopenharmony_ci pmd->pre_commit_context = NULL; 97562306a36Sopenharmony_ci 97662306a36Sopenharmony_ci r = __create_persistent_data_objects(pmd, format_device); 97762306a36Sopenharmony_ci if (r) { 97862306a36Sopenharmony_ci kfree(pmd); 97962306a36Sopenharmony_ci return ERR_PTR(r); 98062306a36Sopenharmony_ci } 98162306a36Sopenharmony_ci 98262306a36Sopenharmony_ci r = __begin_transaction(pmd); 98362306a36Sopenharmony_ci if (r < 0) { 98462306a36Sopenharmony_ci if (dm_pool_metadata_close(pmd) < 0) 98562306a36Sopenharmony_ci DMWARN("%s: dm_pool_metadata_close() failed.", __func__); 98662306a36Sopenharmony_ci return ERR_PTR(r); 98762306a36Sopenharmony_ci } 98862306a36Sopenharmony_ci 98962306a36Sopenharmony_ci __set_metadata_reserve(pmd); 99062306a36Sopenharmony_ci 99162306a36Sopenharmony_ci return pmd; 99262306a36Sopenharmony_ci} 99362306a36Sopenharmony_ci 99462306a36Sopenharmony_ciint dm_pool_metadata_close(struct dm_pool_metadata *pmd) 99562306a36Sopenharmony_ci{ 99662306a36Sopenharmony_ci int r; 99762306a36Sopenharmony_ci unsigned int open_devices = 0; 99862306a36Sopenharmony_ci struct dm_thin_device *td, *tmp; 99962306a36Sopenharmony_ci 100062306a36Sopenharmony_ci down_read(&pmd->root_lock); 100162306a36Sopenharmony_ci list_for_each_entry_safe(td, tmp, &pmd->thin_devices, list) { 100262306a36Sopenharmony_ci if (td->open_count) 100362306a36Sopenharmony_ci open_devices++; 100462306a36Sopenharmony_ci else { 100562306a36Sopenharmony_ci list_del(&td->list); 100662306a36Sopenharmony_ci kfree(td); 100762306a36Sopenharmony_ci } 100862306a36Sopenharmony_ci } 100962306a36Sopenharmony_ci up_read(&pmd->root_lock); 101062306a36Sopenharmony_ci 101162306a36Sopenharmony_ci if (open_devices) { 101262306a36Sopenharmony_ci DMERR("attempt to close pmd when %u device(s) are still open", 101362306a36Sopenharmony_ci open_devices); 101462306a36Sopenharmony_ci return -EBUSY; 101562306a36Sopenharmony_ci } 101662306a36Sopenharmony_ci 101762306a36Sopenharmony_ci pmd_write_lock_in_core(pmd); 101862306a36Sopenharmony_ci if (!pmd->fail_io && !dm_bm_is_read_only(pmd->bm)) { 101962306a36Sopenharmony_ci r = __commit_transaction(pmd); 102062306a36Sopenharmony_ci if (r < 0) 102162306a36Sopenharmony_ci DMWARN("%s: __commit_transaction() failed, error = %d", 102262306a36Sopenharmony_ci __func__, r); 102362306a36Sopenharmony_ci } 102462306a36Sopenharmony_ci pmd_write_unlock(pmd); 102562306a36Sopenharmony_ci __destroy_persistent_data_objects(pmd, true); 102662306a36Sopenharmony_ci 102762306a36Sopenharmony_ci kfree(pmd); 102862306a36Sopenharmony_ci return 0; 102962306a36Sopenharmony_ci} 103062306a36Sopenharmony_ci 103162306a36Sopenharmony_ci/* 103262306a36Sopenharmony_ci * __open_device: Returns @td corresponding to device with id @dev, 103362306a36Sopenharmony_ci * creating it if @create is set and incrementing @td->open_count. 103462306a36Sopenharmony_ci * On failure, @td is undefined. 103562306a36Sopenharmony_ci */ 103662306a36Sopenharmony_cistatic int __open_device(struct dm_pool_metadata *pmd, 103762306a36Sopenharmony_ci dm_thin_id dev, int create, 103862306a36Sopenharmony_ci struct dm_thin_device **td) 103962306a36Sopenharmony_ci{ 104062306a36Sopenharmony_ci int r, changed = 0; 104162306a36Sopenharmony_ci struct dm_thin_device *td2; 104262306a36Sopenharmony_ci uint64_t key = dev; 104362306a36Sopenharmony_ci struct disk_device_details details_le; 104462306a36Sopenharmony_ci 104562306a36Sopenharmony_ci /* 104662306a36Sopenharmony_ci * If the device is already open, return it. 104762306a36Sopenharmony_ci */ 104862306a36Sopenharmony_ci list_for_each_entry(td2, &pmd->thin_devices, list) 104962306a36Sopenharmony_ci if (td2->id == dev) { 105062306a36Sopenharmony_ci /* 105162306a36Sopenharmony_ci * May not create an already-open device. 105262306a36Sopenharmony_ci */ 105362306a36Sopenharmony_ci if (create) 105462306a36Sopenharmony_ci return -EEXIST; 105562306a36Sopenharmony_ci 105662306a36Sopenharmony_ci td2->open_count++; 105762306a36Sopenharmony_ci *td = td2; 105862306a36Sopenharmony_ci return 0; 105962306a36Sopenharmony_ci } 106062306a36Sopenharmony_ci 106162306a36Sopenharmony_ci /* 106262306a36Sopenharmony_ci * Check the device exists. 106362306a36Sopenharmony_ci */ 106462306a36Sopenharmony_ci r = dm_btree_lookup(&pmd->details_info, pmd->details_root, 106562306a36Sopenharmony_ci &key, &details_le); 106662306a36Sopenharmony_ci if (r) { 106762306a36Sopenharmony_ci if (r != -ENODATA || !create) 106862306a36Sopenharmony_ci return r; 106962306a36Sopenharmony_ci 107062306a36Sopenharmony_ci /* 107162306a36Sopenharmony_ci * Create new device. 107262306a36Sopenharmony_ci */ 107362306a36Sopenharmony_ci changed = 1; 107462306a36Sopenharmony_ci details_le.mapped_blocks = 0; 107562306a36Sopenharmony_ci details_le.transaction_id = cpu_to_le64(pmd->trans_id); 107662306a36Sopenharmony_ci details_le.creation_time = cpu_to_le32(pmd->time); 107762306a36Sopenharmony_ci details_le.snapshotted_time = cpu_to_le32(pmd->time); 107862306a36Sopenharmony_ci } 107962306a36Sopenharmony_ci 108062306a36Sopenharmony_ci *td = kmalloc(sizeof(**td), GFP_NOIO); 108162306a36Sopenharmony_ci if (!*td) 108262306a36Sopenharmony_ci return -ENOMEM; 108362306a36Sopenharmony_ci 108462306a36Sopenharmony_ci (*td)->pmd = pmd; 108562306a36Sopenharmony_ci (*td)->id = dev; 108662306a36Sopenharmony_ci (*td)->open_count = 1; 108762306a36Sopenharmony_ci (*td)->changed = changed; 108862306a36Sopenharmony_ci (*td)->aborted_with_changes = false; 108962306a36Sopenharmony_ci (*td)->mapped_blocks = le64_to_cpu(details_le.mapped_blocks); 109062306a36Sopenharmony_ci (*td)->transaction_id = le64_to_cpu(details_le.transaction_id); 109162306a36Sopenharmony_ci (*td)->creation_time = le32_to_cpu(details_le.creation_time); 109262306a36Sopenharmony_ci (*td)->snapshotted_time = le32_to_cpu(details_le.snapshotted_time); 109362306a36Sopenharmony_ci 109462306a36Sopenharmony_ci list_add(&(*td)->list, &pmd->thin_devices); 109562306a36Sopenharmony_ci 109662306a36Sopenharmony_ci return 0; 109762306a36Sopenharmony_ci} 109862306a36Sopenharmony_ci 109962306a36Sopenharmony_cistatic void __close_device(struct dm_thin_device *td) 110062306a36Sopenharmony_ci{ 110162306a36Sopenharmony_ci --td->open_count; 110262306a36Sopenharmony_ci} 110362306a36Sopenharmony_ci 110462306a36Sopenharmony_cistatic int __create_thin(struct dm_pool_metadata *pmd, 110562306a36Sopenharmony_ci dm_thin_id dev) 110662306a36Sopenharmony_ci{ 110762306a36Sopenharmony_ci int r; 110862306a36Sopenharmony_ci dm_block_t dev_root; 110962306a36Sopenharmony_ci uint64_t key = dev; 111062306a36Sopenharmony_ci struct dm_thin_device *td; 111162306a36Sopenharmony_ci __le64 value; 111262306a36Sopenharmony_ci 111362306a36Sopenharmony_ci r = dm_btree_lookup(&pmd->details_info, pmd->details_root, 111462306a36Sopenharmony_ci &key, NULL); 111562306a36Sopenharmony_ci if (!r) 111662306a36Sopenharmony_ci return -EEXIST; 111762306a36Sopenharmony_ci 111862306a36Sopenharmony_ci /* 111962306a36Sopenharmony_ci * Create an empty btree for the mappings. 112062306a36Sopenharmony_ci */ 112162306a36Sopenharmony_ci r = dm_btree_empty(&pmd->bl_info, &dev_root); 112262306a36Sopenharmony_ci if (r) 112362306a36Sopenharmony_ci return r; 112462306a36Sopenharmony_ci 112562306a36Sopenharmony_ci /* 112662306a36Sopenharmony_ci * Insert it into the main mapping tree. 112762306a36Sopenharmony_ci */ 112862306a36Sopenharmony_ci value = cpu_to_le64(dev_root); 112962306a36Sopenharmony_ci __dm_bless_for_disk(&value); 113062306a36Sopenharmony_ci r = dm_btree_insert(&pmd->tl_info, pmd->root, &key, &value, &pmd->root); 113162306a36Sopenharmony_ci if (r) { 113262306a36Sopenharmony_ci dm_btree_del(&pmd->bl_info, dev_root); 113362306a36Sopenharmony_ci return r; 113462306a36Sopenharmony_ci } 113562306a36Sopenharmony_ci 113662306a36Sopenharmony_ci r = __open_device(pmd, dev, 1, &td); 113762306a36Sopenharmony_ci if (r) { 113862306a36Sopenharmony_ci dm_btree_remove(&pmd->tl_info, pmd->root, &key, &pmd->root); 113962306a36Sopenharmony_ci dm_btree_del(&pmd->bl_info, dev_root); 114062306a36Sopenharmony_ci return r; 114162306a36Sopenharmony_ci } 114262306a36Sopenharmony_ci __close_device(td); 114362306a36Sopenharmony_ci 114462306a36Sopenharmony_ci return r; 114562306a36Sopenharmony_ci} 114662306a36Sopenharmony_ci 114762306a36Sopenharmony_ciint dm_pool_create_thin(struct dm_pool_metadata *pmd, dm_thin_id dev) 114862306a36Sopenharmony_ci{ 114962306a36Sopenharmony_ci int r = -EINVAL; 115062306a36Sopenharmony_ci 115162306a36Sopenharmony_ci pmd_write_lock(pmd); 115262306a36Sopenharmony_ci if (!pmd->fail_io) 115362306a36Sopenharmony_ci r = __create_thin(pmd, dev); 115462306a36Sopenharmony_ci pmd_write_unlock(pmd); 115562306a36Sopenharmony_ci 115662306a36Sopenharmony_ci return r; 115762306a36Sopenharmony_ci} 115862306a36Sopenharmony_ci 115962306a36Sopenharmony_cistatic int __set_snapshot_details(struct dm_pool_metadata *pmd, 116062306a36Sopenharmony_ci struct dm_thin_device *snap, 116162306a36Sopenharmony_ci dm_thin_id origin, uint32_t time) 116262306a36Sopenharmony_ci{ 116362306a36Sopenharmony_ci int r; 116462306a36Sopenharmony_ci struct dm_thin_device *td; 116562306a36Sopenharmony_ci 116662306a36Sopenharmony_ci r = __open_device(pmd, origin, 0, &td); 116762306a36Sopenharmony_ci if (r) 116862306a36Sopenharmony_ci return r; 116962306a36Sopenharmony_ci 117062306a36Sopenharmony_ci td->changed = true; 117162306a36Sopenharmony_ci td->snapshotted_time = time; 117262306a36Sopenharmony_ci 117362306a36Sopenharmony_ci snap->mapped_blocks = td->mapped_blocks; 117462306a36Sopenharmony_ci snap->snapshotted_time = time; 117562306a36Sopenharmony_ci __close_device(td); 117662306a36Sopenharmony_ci 117762306a36Sopenharmony_ci return 0; 117862306a36Sopenharmony_ci} 117962306a36Sopenharmony_ci 118062306a36Sopenharmony_cistatic int __create_snap(struct dm_pool_metadata *pmd, 118162306a36Sopenharmony_ci dm_thin_id dev, dm_thin_id origin) 118262306a36Sopenharmony_ci{ 118362306a36Sopenharmony_ci int r; 118462306a36Sopenharmony_ci dm_block_t origin_root; 118562306a36Sopenharmony_ci uint64_t key = origin, dev_key = dev; 118662306a36Sopenharmony_ci struct dm_thin_device *td; 118762306a36Sopenharmony_ci __le64 value; 118862306a36Sopenharmony_ci 118962306a36Sopenharmony_ci /* check this device is unused */ 119062306a36Sopenharmony_ci r = dm_btree_lookup(&pmd->details_info, pmd->details_root, 119162306a36Sopenharmony_ci &dev_key, NULL); 119262306a36Sopenharmony_ci if (!r) 119362306a36Sopenharmony_ci return -EEXIST; 119462306a36Sopenharmony_ci 119562306a36Sopenharmony_ci /* find the mapping tree for the origin */ 119662306a36Sopenharmony_ci r = dm_btree_lookup(&pmd->tl_info, pmd->root, &key, &value); 119762306a36Sopenharmony_ci if (r) 119862306a36Sopenharmony_ci return r; 119962306a36Sopenharmony_ci origin_root = le64_to_cpu(value); 120062306a36Sopenharmony_ci 120162306a36Sopenharmony_ci /* clone the origin, an inc will do */ 120262306a36Sopenharmony_ci dm_tm_inc(pmd->tm, origin_root); 120362306a36Sopenharmony_ci 120462306a36Sopenharmony_ci /* insert into the main mapping tree */ 120562306a36Sopenharmony_ci value = cpu_to_le64(origin_root); 120662306a36Sopenharmony_ci __dm_bless_for_disk(&value); 120762306a36Sopenharmony_ci key = dev; 120862306a36Sopenharmony_ci r = dm_btree_insert(&pmd->tl_info, pmd->root, &key, &value, &pmd->root); 120962306a36Sopenharmony_ci if (r) { 121062306a36Sopenharmony_ci dm_tm_dec(pmd->tm, origin_root); 121162306a36Sopenharmony_ci return r; 121262306a36Sopenharmony_ci } 121362306a36Sopenharmony_ci 121462306a36Sopenharmony_ci pmd->time++; 121562306a36Sopenharmony_ci 121662306a36Sopenharmony_ci r = __open_device(pmd, dev, 1, &td); 121762306a36Sopenharmony_ci if (r) 121862306a36Sopenharmony_ci goto bad; 121962306a36Sopenharmony_ci 122062306a36Sopenharmony_ci r = __set_snapshot_details(pmd, td, origin, pmd->time); 122162306a36Sopenharmony_ci __close_device(td); 122262306a36Sopenharmony_ci 122362306a36Sopenharmony_ci if (r) 122462306a36Sopenharmony_ci goto bad; 122562306a36Sopenharmony_ci 122662306a36Sopenharmony_ci return 0; 122762306a36Sopenharmony_ci 122862306a36Sopenharmony_cibad: 122962306a36Sopenharmony_ci dm_btree_remove(&pmd->tl_info, pmd->root, &key, &pmd->root); 123062306a36Sopenharmony_ci dm_btree_remove(&pmd->details_info, pmd->details_root, 123162306a36Sopenharmony_ci &key, &pmd->details_root); 123262306a36Sopenharmony_ci return r; 123362306a36Sopenharmony_ci} 123462306a36Sopenharmony_ci 123562306a36Sopenharmony_ciint dm_pool_create_snap(struct dm_pool_metadata *pmd, 123662306a36Sopenharmony_ci dm_thin_id dev, 123762306a36Sopenharmony_ci dm_thin_id origin) 123862306a36Sopenharmony_ci{ 123962306a36Sopenharmony_ci int r = -EINVAL; 124062306a36Sopenharmony_ci 124162306a36Sopenharmony_ci pmd_write_lock(pmd); 124262306a36Sopenharmony_ci if (!pmd->fail_io) 124362306a36Sopenharmony_ci r = __create_snap(pmd, dev, origin); 124462306a36Sopenharmony_ci pmd_write_unlock(pmd); 124562306a36Sopenharmony_ci 124662306a36Sopenharmony_ci return r; 124762306a36Sopenharmony_ci} 124862306a36Sopenharmony_ci 124962306a36Sopenharmony_cistatic int __delete_device(struct dm_pool_metadata *pmd, dm_thin_id dev) 125062306a36Sopenharmony_ci{ 125162306a36Sopenharmony_ci int r; 125262306a36Sopenharmony_ci uint64_t key = dev; 125362306a36Sopenharmony_ci struct dm_thin_device *td; 125462306a36Sopenharmony_ci 125562306a36Sopenharmony_ci /* TODO: failure should mark the transaction invalid */ 125662306a36Sopenharmony_ci r = __open_device(pmd, dev, 0, &td); 125762306a36Sopenharmony_ci if (r) 125862306a36Sopenharmony_ci return r; 125962306a36Sopenharmony_ci 126062306a36Sopenharmony_ci if (td->open_count > 1) { 126162306a36Sopenharmony_ci __close_device(td); 126262306a36Sopenharmony_ci return -EBUSY; 126362306a36Sopenharmony_ci } 126462306a36Sopenharmony_ci 126562306a36Sopenharmony_ci list_del(&td->list); 126662306a36Sopenharmony_ci kfree(td); 126762306a36Sopenharmony_ci r = dm_btree_remove(&pmd->details_info, pmd->details_root, 126862306a36Sopenharmony_ci &key, &pmd->details_root); 126962306a36Sopenharmony_ci if (r) 127062306a36Sopenharmony_ci return r; 127162306a36Sopenharmony_ci 127262306a36Sopenharmony_ci r = dm_btree_remove(&pmd->tl_info, pmd->root, &key, &pmd->root); 127362306a36Sopenharmony_ci if (r) 127462306a36Sopenharmony_ci return r; 127562306a36Sopenharmony_ci 127662306a36Sopenharmony_ci return 0; 127762306a36Sopenharmony_ci} 127862306a36Sopenharmony_ci 127962306a36Sopenharmony_ciint dm_pool_delete_thin_device(struct dm_pool_metadata *pmd, 128062306a36Sopenharmony_ci dm_thin_id dev) 128162306a36Sopenharmony_ci{ 128262306a36Sopenharmony_ci int r = -EINVAL; 128362306a36Sopenharmony_ci 128462306a36Sopenharmony_ci pmd_write_lock(pmd); 128562306a36Sopenharmony_ci if (!pmd->fail_io) 128662306a36Sopenharmony_ci r = __delete_device(pmd, dev); 128762306a36Sopenharmony_ci pmd_write_unlock(pmd); 128862306a36Sopenharmony_ci 128962306a36Sopenharmony_ci return r; 129062306a36Sopenharmony_ci} 129162306a36Sopenharmony_ci 129262306a36Sopenharmony_ciint dm_pool_set_metadata_transaction_id(struct dm_pool_metadata *pmd, 129362306a36Sopenharmony_ci uint64_t current_id, 129462306a36Sopenharmony_ci uint64_t new_id) 129562306a36Sopenharmony_ci{ 129662306a36Sopenharmony_ci int r = -EINVAL; 129762306a36Sopenharmony_ci 129862306a36Sopenharmony_ci pmd_write_lock(pmd); 129962306a36Sopenharmony_ci 130062306a36Sopenharmony_ci if (pmd->fail_io) 130162306a36Sopenharmony_ci goto out; 130262306a36Sopenharmony_ci 130362306a36Sopenharmony_ci if (pmd->trans_id != current_id) { 130462306a36Sopenharmony_ci DMERR("mismatched transaction id"); 130562306a36Sopenharmony_ci goto out; 130662306a36Sopenharmony_ci } 130762306a36Sopenharmony_ci 130862306a36Sopenharmony_ci pmd->trans_id = new_id; 130962306a36Sopenharmony_ci r = 0; 131062306a36Sopenharmony_ci 131162306a36Sopenharmony_ciout: 131262306a36Sopenharmony_ci pmd_write_unlock(pmd); 131362306a36Sopenharmony_ci 131462306a36Sopenharmony_ci return r; 131562306a36Sopenharmony_ci} 131662306a36Sopenharmony_ci 131762306a36Sopenharmony_ciint dm_pool_get_metadata_transaction_id(struct dm_pool_metadata *pmd, 131862306a36Sopenharmony_ci uint64_t *result) 131962306a36Sopenharmony_ci{ 132062306a36Sopenharmony_ci int r = -EINVAL; 132162306a36Sopenharmony_ci 132262306a36Sopenharmony_ci down_read(&pmd->root_lock); 132362306a36Sopenharmony_ci if (!pmd->fail_io) { 132462306a36Sopenharmony_ci *result = pmd->trans_id; 132562306a36Sopenharmony_ci r = 0; 132662306a36Sopenharmony_ci } 132762306a36Sopenharmony_ci up_read(&pmd->root_lock); 132862306a36Sopenharmony_ci 132962306a36Sopenharmony_ci return r; 133062306a36Sopenharmony_ci} 133162306a36Sopenharmony_ci 133262306a36Sopenharmony_cistatic int __reserve_metadata_snap(struct dm_pool_metadata *pmd) 133362306a36Sopenharmony_ci{ 133462306a36Sopenharmony_ci int r, inc; 133562306a36Sopenharmony_ci struct thin_disk_superblock *disk_super; 133662306a36Sopenharmony_ci struct dm_block *copy, *sblock; 133762306a36Sopenharmony_ci dm_block_t held_root; 133862306a36Sopenharmony_ci 133962306a36Sopenharmony_ci /* 134062306a36Sopenharmony_ci * We commit to ensure the btree roots which we increment in a 134162306a36Sopenharmony_ci * moment are up to date. 134262306a36Sopenharmony_ci */ 134362306a36Sopenharmony_ci r = __commit_transaction(pmd); 134462306a36Sopenharmony_ci if (r < 0) { 134562306a36Sopenharmony_ci DMWARN("%s: __commit_transaction() failed, error = %d", 134662306a36Sopenharmony_ci __func__, r); 134762306a36Sopenharmony_ci return r; 134862306a36Sopenharmony_ci } 134962306a36Sopenharmony_ci 135062306a36Sopenharmony_ci /* 135162306a36Sopenharmony_ci * Copy the superblock. 135262306a36Sopenharmony_ci */ 135362306a36Sopenharmony_ci dm_sm_inc_block(pmd->metadata_sm, THIN_SUPERBLOCK_LOCATION); 135462306a36Sopenharmony_ci r = dm_tm_shadow_block(pmd->tm, THIN_SUPERBLOCK_LOCATION, 135562306a36Sopenharmony_ci &sb_validator, ©, &inc); 135662306a36Sopenharmony_ci if (r) 135762306a36Sopenharmony_ci return r; 135862306a36Sopenharmony_ci 135962306a36Sopenharmony_ci BUG_ON(!inc); 136062306a36Sopenharmony_ci 136162306a36Sopenharmony_ci held_root = dm_block_location(copy); 136262306a36Sopenharmony_ci disk_super = dm_block_data(copy); 136362306a36Sopenharmony_ci 136462306a36Sopenharmony_ci if (le64_to_cpu(disk_super->held_root)) { 136562306a36Sopenharmony_ci DMWARN("Pool metadata snapshot already exists: release this before taking another."); 136662306a36Sopenharmony_ci 136762306a36Sopenharmony_ci dm_tm_dec(pmd->tm, held_root); 136862306a36Sopenharmony_ci dm_tm_unlock(pmd->tm, copy); 136962306a36Sopenharmony_ci return -EBUSY; 137062306a36Sopenharmony_ci } 137162306a36Sopenharmony_ci 137262306a36Sopenharmony_ci /* 137362306a36Sopenharmony_ci * Wipe the spacemap since we're not publishing this. 137462306a36Sopenharmony_ci */ 137562306a36Sopenharmony_ci memset(&disk_super->data_space_map_root, 0, 137662306a36Sopenharmony_ci sizeof(disk_super->data_space_map_root)); 137762306a36Sopenharmony_ci memset(&disk_super->metadata_space_map_root, 0, 137862306a36Sopenharmony_ci sizeof(disk_super->metadata_space_map_root)); 137962306a36Sopenharmony_ci 138062306a36Sopenharmony_ci /* 138162306a36Sopenharmony_ci * Increment the data structures that need to be preserved. 138262306a36Sopenharmony_ci */ 138362306a36Sopenharmony_ci dm_tm_inc(pmd->tm, le64_to_cpu(disk_super->data_mapping_root)); 138462306a36Sopenharmony_ci dm_tm_inc(pmd->tm, le64_to_cpu(disk_super->device_details_root)); 138562306a36Sopenharmony_ci dm_tm_unlock(pmd->tm, copy); 138662306a36Sopenharmony_ci 138762306a36Sopenharmony_ci /* 138862306a36Sopenharmony_ci * Write the held root into the superblock. 138962306a36Sopenharmony_ci */ 139062306a36Sopenharmony_ci r = superblock_lock(pmd, &sblock); 139162306a36Sopenharmony_ci if (r) { 139262306a36Sopenharmony_ci dm_tm_dec(pmd->tm, held_root); 139362306a36Sopenharmony_ci return r; 139462306a36Sopenharmony_ci } 139562306a36Sopenharmony_ci 139662306a36Sopenharmony_ci disk_super = dm_block_data(sblock); 139762306a36Sopenharmony_ci disk_super->held_root = cpu_to_le64(held_root); 139862306a36Sopenharmony_ci dm_bm_unlock(sblock); 139962306a36Sopenharmony_ci return 0; 140062306a36Sopenharmony_ci} 140162306a36Sopenharmony_ci 140262306a36Sopenharmony_ciint dm_pool_reserve_metadata_snap(struct dm_pool_metadata *pmd) 140362306a36Sopenharmony_ci{ 140462306a36Sopenharmony_ci int r = -EINVAL; 140562306a36Sopenharmony_ci 140662306a36Sopenharmony_ci pmd_write_lock(pmd); 140762306a36Sopenharmony_ci if (!pmd->fail_io) 140862306a36Sopenharmony_ci r = __reserve_metadata_snap(pmd); 140962306a36Sopenharmony_ci pmd_write_unlock(pmd); 141062306a36Sopenharmony_ci 141162306a36Sopenharmony_ci return r; 141262306a36Sopenharmony_ci} 141362306a36Sopenharmony_ci 141462306a36Sopenharmony_cistatic int __release_metadata_snap(struct dm_pool_metadata *pmd) 141562306a36Sopenharmony_ci{ 141662306a36Sopenharmony_ci int r; 141762306a36Sopenharmony_ci struct thin_disk_superblock *disk_super; 141862306a36Sopenharmony_ci struct dm_block *sblock, *copy; 141962306a36Sopenharmony_ci dm_block_t held_root; 142062306a36Sopenharmony_ci 142162306a36Sopenharmony_ci r = superblock_lock(pmd, &sblock); 142262306a36Sopenharmony_ci if (r) 142362306a36Sopenharmony_ci return r; 142462306a36Sopenharmony_ci 142562306a36Sopenharmony_ci disk_super = dm_block_data(sblock); 142662306a36Sopenharmony_ci held_root = le64_to_cpu(disk_super->held_root); 142762306a36Sopenharmony_ci disk_super->held_root = cpu_to_le64(0); 142862306a36Sopenharmony_ci 142962306a36Sopenharmony_ci dm_bm_unlock(sblock); 143062306a36Sopenharmony_ci 143162306a36Sopenharmony_ci if (!held_root) { 143262306a36Sopenharmony_ci DMWARN("No pool metadata snapshot found: nothing to release."); 143362306a36Sopenharmony_ci return -EINVAL; 143462306a36Sopenharmony_ci } 143562306a36Sopenharmony_ci 143662306a36Sopenharmony_ci r = dm_tm_read_lock(pmd->tm, held_root, &sb_validator, ©); 143762306a36Sopenharmony_ci if (r) 143862306a36Sopenharmony_ci return r; 143962306a36Sopenharmony_ci 144062306a36Sopenharmony_ci disk_super = dm_block_data(copy); 144162306a36Sopenharmony_ci dm_btree_del(&pmd->info, le64_to_cpu(disk_super->data_mapping_root)); 144262306a36Sopenharmony_ci dm_btree_del(&pmd->details_info, le64_to_cpu(disk_super->device_details_root)); 144362306a36Sopenharmony_ci dm_sm_dec_block(pmd->metadata_sm, held_root); 144462306a36Sopenharmony_ci 144562306a36Sopenharmony_ci dm_tm_unlock(pmd->tm, copy); 144662306a36Sopenharmony_ci 144762306a36Sopenharmony_ci return 0; 144862306a36Sopenharmony_ci} 144962306a36Sopenharmony_ci 145062306a36Sopenharmony_ciint dm_pool_release_metadata_snap(struct dm_pool_metadata *pmd) 145162306a36Sopenharmony_ci{ 145262306a36Sopenharmony_ci int r = -EINVAL; 145362306a36Sopenharmony_ci 145462306a36Sopenharmony_ci pmd_write_lock(pmd); 145562306a36Sopenharmony_ci if (!pmd->fail_io) 145662306a36Sopenharmony_ci r = __release_metadata_snap(pmd); 145762306a36Sopenharmony_ci pmd_write_unlock(pmd); 145862306a36Sopenharmony_ci 145962306a36Sopenharmony_ci return r; 146062306a36Sopenharmony_ci} 146162306a36Sopenharmony_ci 146262306a36Sopenharmony_cistatic int __get_metadata_snap(struct dm_pool_metadata *pmd, 146362306a36Sopenharmony_ci dm_block_t *result) 146462306a36Sopenharmony_ci{ 146562306a36Sopenharmony_ci int r; 146662306a36Sopenharmony_ci struct thin_disk_superblock *disk_super; 146762306a36Sopenharmony_ci struct dm_block *sblock; 146862306a36Sopenharmony_ci 146962306a36Sopenharmony_ci r = dm_bm_read_lock(pmd->bm, THIN_SUPERBLOCK_LOCATION, 147062306a36Sopenharmony_ci &sb_validator, &sblock); 147162306a36Sopenharmony_ci if (r) 147262306a36Sopenharmony_ci return r; 147362306a36Sopenharmony_ci 147462306a36Sopenharmony_ci disk_super = dm_block_data(sblock); 147562306a36Sopenharmony_ci *result = le64_to_cpu(disk_super->held_root); 147662306a36Sopenharmony_ci 147762306a36Sopenharmony_ci dm_bm_unlock(sblock); 147862306a36Sopenharmony_ci 147962306a36Sopenharmony_ci return 0; 148062306a36Sopenharmony_ci} 148162306a36Sopenharmony_ci 148262306a36Sopenharmony_ciint dm_pool_get_metadata_snap(struct dm_pool_metadata *pmd, 148362306a36Sopenharmony_ci dm_block_t *result) 148462306a36Sopenharmony_ci{ 148562306a36Sopenharmony_ci int r = -EINVAL; 148662306a36Sopenharmony_ci 148762306a36Sopenharmony_ci down_read(&pmd->root_lock); 148862306a36Sopenharmony_ci if (!pmd->fail_io) 148962306a36Sopenharmony_ci r = __get_metadata_snap(pmd, result); 149062306a36Sopenharmony_ci up_read(&pmd->root_lock); 149162306a36Sopenharmony_ci 149262306a36Sopenharmony_ci return r; 149362306a36Sopenharmony_ci} 149462306a36Sopenharmony_ci 149562306a36Sopenharmony_ciint dm_pool_open_thin_device(struct dm_pool_metadata *pmd, dm_thin_id dev, 149662306a36Sopenharmony_ci struct dm_thin_device **td) 149762306a36Sopenharmony_ci{ 149862306a36Sopenharmony_ci int r = -EINVAL; 149962306a36Sopenharmony_ci 150062306a36Sopenharmony_ci pmd_write_lock_in_core(pmd); 150162306a36Sopenharmony_ci if (!pmd->fail_io) 150262306a36Sopenharmony_ci r = __open_device(pmd, dev, 0, td); 150362306a36Sopenharmony_ci pmd_write_unlock(pmd); 150462306a36Sopenharmony_ci 150562306a36Sopenharmony_ci return r; 150662306a36Sopenharmony_ci} 150762306a36Sopenharmony_ci 150862306a36Sopenharmony_ciint dm_pool_close_thin_device(struct dm_thin_device *td) 150962306a36Sopenharmony_ci{ 151062306a36Sopenharmony_ci pmd_write_lock_in_core(td->pmd); 151162306a36Sopenharmony_ci __close_device(td); 151262306a36Sopenharmony_ci pmd_write_unlock(td->pmd); 151362306a36Sopenharmony_ci 151462306a36Sopenharmony_ci return 0; 151562306a36Sopenharmony_ci} 151662306a36Sopenharmony_ci 151762306a36Sopenharmony_cidm_thin_id dm_thin_dev_id(struct dm_thin_device *td) 151862306a36Sopenharmony_ci{ 151962306a36Sopenharmony_ci return td->id; 152062306a36Sopenharmony_ci} 152162306a36Sopenharmony_ci 152262306a36Sopenharmony_ci/* 152362306a36Sopenharmony_ci * Check whether @time (of block creation) is older than @td's last snapshot. 152462306a36Sopenharmony_ci * If so then the associated block is shared with the last snapshot device. 152562306a36Sopenharmony_ci * Any block on a device created *after* the device last got snapshotted is 152662306a36Sopenharmony_ci * necessarily not shared. 152762306a36Sopenharmony_ci */ 152862306a36Sopenharmony_cistatic bool __snapshotted_since(struct dm_thin_device *td, uint32_t time) 152962306a36Sopenharmony_ci{ 153062306a36Sopenharmony_ci return td->snapshotted_time > time; 153162306a36Sopenharmony_ci} 153262306a36Sopenharmony_ci 153362306a36Sopenharmony_cistatic void unpack_lookup_result(struct dm_thin_device *td, __le64 value, 153462306a36Sopenharmony_ci struct dm_thin_lookup_result *result) 153562306a36Sopenharmony_ci{ 153662306a36Sopenharmony_ci uint64_t block_time = 0; 153762306a36Sopenharmony_ci dm_block_t exception_block; 153862306a36Sopenharmony_ci uint32_t exception_time; 153962306a36Sopenharmony_ci 154062306a36Sopenharmony_ci block_time = le64_to_cpu(value); 154162306a36Sopenharmony_ci unpack_block_time(block_time, &exception_block, &exception_time); 154262306a36Sopenharmony_ci result->block = exception_block; 154362306a36Sopenharmony_ci result->shared = __snapshotted_since(td, exception_time); 154462306a36Sopenharmony_ci} 154562306a36Sopenharmony_ci 154662306a36Sopenharmony_cistatic int __find_block(struct dm_thin_device *td, dm_block_t block, 154762306a36Sopenharmony_ci int can_issue_io, struct dm_thin_lookup_result *result) 154862306a36Sopenharmony_ci{ 154962306a36Sopenharmony_ci int r; 155062306a36Sopenharmony_ci __le64 value; 155162306a36Sopenharmony_ci struct dm_pool_metadata *pmd = td->pmd; 155262306a36Sopenharmony_ci dm_block_t keys[2] = { td->id, block }; 155362306a36Sopenharmony_ci struct dm_btree_info *info; 155462306a36Sopenharmony_ci 155562306a36Sopenharmony_ci if (can_issue_io) 155662306a36Sopenharmony_ci info = &pmd->info; 155762306a36Sopenharmony_ci else 155862306a36Sopenharmony_ci info = &pmd->nb_info; 155962306a36Sopenharmony_ci 156062306a36Sopenharmony_ci r = dm_btree_lookup(info, pmd->root, keys, &value); 156162306a36Sopenharmony_ci if (!r) 156262306a36Sopenharmony_ci unpack_lookup_result(td, value, result); 156362306a36Sopenharmony_ci 156462306a36Sopenharmony_ci return r; 156562306a36Sopenharmony_ci} 156662306a36Sopenharmony_ci 156762306a36Sopenharmony_ciint dm_thin_find_block(struct dm_thin_device *td, dm_block_t block, 156862306a36Sopenharmony_ci int can_issue_io, struct dm_thin_lookup_result *result) 156962306a36Sopenharmony_ci{ 157062306a36Sopenharmony_ci int r; 157162306a36Sopenharmony_ci struct dm_pool_metadata *pmd = td->pmd; 157262306a36Sopenharmony_ci 157362306a36Sopenharmony_ci down_read(&pmd->root_lock); 157462306a36Sopenharmony_ci if (pmd->fail_io) { 157562306a36Sopenharmony_ci up_read(&pmd->root_lock); 157662306a36Sopenharmony_ci return -EINVAL; 157762306a36Sopenharmony_ci } 157862306a36Sopenharmony_ci 157962306a36Sopenharmony_ci r = __find_block(td, block, can_issue_io, result); 158062306a36Sopenharmony_ci 158162306a36Sopenharmony_ci up_read(&pmd->root_lock); 158262306a36Sopenharmony_ci return r; 158362306a36Sopenharmony_ci} 158462306a36Sopenharmony_ci 158562306a36Sopenharmony_cistatic int __find_next_mapped_block(struct dm_thin_device *td, dm_block_t block, 158662306a36Sopenharmony_ci dm_block_t *vblock, 158762306a36Sopenharmony_ci struct dm_thin_lookup_result *result) 158862306a36Sopenharmony_ci{ 158962306a36Sopenharmony_ci int r; 159062306a36Sopenharmony_ci __le64 value; 159162306a36Sopenharmony_ci struct dm_pool_metadata *pmd = td->pmd; 159262306a36Sopenharmony_ci dm_block_t keys[2] = { td->id, block }; 159362306a36Sopenharmony_ci 159462306a36Sopenharmony_ci r = dm_btree_lookup_next(&pmd->info, pmd->root, keys, vblock, &value); 159562306a36Sopenharmony_ci if (!r) 159662306a36Sopenharmony_ci unpack_lookup_result(td, value, result); 159762306a36Sopenharmony_ci 159862306a36Sopenharmony_ci return r; 159962306a36Sopenharmony_ci} 160062306a36Sopenharmony_ci 160162306a36Sopenharmony_cistatic int __find_mapped_range(struct dm_thin_device *td, 160262306a36Sopenharmony_ci dm_block_t begin, dm_block_t end, 160362306a36Sopenharmony_ci dm_block_t *thin_begin, dm_block_t *thin_end, 160462306a36Sopenharmony_ci dm_block_t *pool_begin, bool *maybe_shared) 160562306a36Sopenharmony_ci{ 160662306a36Sopenharmony_ci int r; 160762306a36Sopenharmony_ci dm_block_t pool_end; 160862306a36Sopenharmony_ci struct dm_thin_lookup_result lookup; 160962306a36Sopenharmony_ci 161062306a36Sopenharmony_ci if (end < begin) 161162306a36Sopenharmony_ci return -ENODATA; 161262306a36Sopenharmony_ci 161362306a36Sopenharmony_ci r = __find_next_mapped_block(td, begin, &begin, &lookup); 161462306a36Sopenharmony_ci if (r) 161562306a36Sopenharmony_ci return r; 161662306a36Sopenharmony_ci 161762306a36Sopenharmony_ci if (begin >= end) 161862306a36Sopenharmony_ci return -ENODATA; 161962306a36Sopenharmony_ci 162062306a36Sopenharmony_ci *thin_begin = begin; 162162306a36Sopenharmony_ci *pool_begin = lookup.block; 162262306a36Sopenharmony_ci *maybe_shared = lookup.shared; 162362306a36Sopenharmony_ci 162462306a36Sopenharmony_ci begin++; 162562306a36Sopenharmony_ci pool_end = *pool_begin + 1; 162662306a36Sopenharmony_ci while (begin != end) { 162762306a36Sopenharmony_ci r = __find_block(td, begin, true, &lookup); 162862306a36Sopenharmony_ci if (r) { 162962306a36Sopenharmony_ci if (r == -ENODATA) 163062306a36Sopenharmony_ci break; 163162306a36Sopenharmony_ci 163262306a36Sopenharmony_ci return r; 163362306a36Sopenharmony_ci } 163462306a36Sopenharmony_ci 163562306a36Sopenharmony_ci if ((lookup.block != pool_end) || 163662306a36Sopenharmony_ci (lookup.shared != *maybe_shared)) 163762306a36Sopenharmony_ci break; 163862306a36Sopenharmony_ci 163962306a36Sopenharmony_ci pool_end++; 164062306a36Sopenharmony_ci begin++; 164162306a36Sopenharmony_ci } 164262306a36Sopenharmony_ci 164362306a36Sopenharmony_ci *thin_end = begin; 164462306a36Sopenharmony_ci return 0; 164562306a36Sopenharmony_ci} 164662306a36Sopenharmony_ci 164762306a36Sopenharmony_ciint dm_thin_find_mapped_range(struct dm_thin_device *td, 164862306a36Sopenharmony_ci dm_block_t begin, dm_block_t end, 164962306a36Sopenharmony_ci dm_block_t *thin_begin, dm_block_t *thin_end, 165062306a36Sopenharmony_ci dm_block_t *pool_begin, bool *maybe_shared) 165162306a36Sopenharmony_ci{ 165262306a36Sopenharmony_ci int r = -EINVAL; 165362306a36Sopenharmony_ci struct dm_pool_metadata *pmd = td->pmd; 165462306a36Sopenharmony_ci 165562306a36Sopenharmony_ci down_read(&pmd->root_lock); 165662306a36Sopenharmony_ci if (!pmd->fail_io) { 165762306a36Sopenharmony_ci r = __find_mapped_range(td, begin, end, thin_begin, thin_end, 165862306a36Sopenharmony_ci pool_begin, maybe_shared); 165962306a36Sopenharmony_ci } 166062306a36Sopenharmony_ci up_read(&pmd->root_lock); 166162306a36Sopenharmony_ci 166262306a36Sopenharmony_ci return r; 166362306a36Sopenharmony_ci} 166462306a36Sopenharmony_ci 166562306a36Sopenharmony_cistatic int __insert(struct dm_thin_device *td, dm_block_t block, 166662306a36Sopenharmony_ci dm_block_t data_block) 166762306a36Sopenharmony_ci{ 166862306a36Sopenharmony_ci int r, inserted; 166962306a36Sopenharmony_ci __le64 value; 167062306a36Sopenharmony_ci struct dm_pool_metadata *pmd = td->pmd; 167162306a36Sopenharmony_ci dm_block_t keys[2] = { td->id, block }; 167262306a36Sopenharmony_ci 167362306a36Sopenharmony_ci value = cpu_to_le64(pack_block_time(data_block, pmd->time)); 167462306a36Sopenharmony_ci __dm_bless_for_disk(&value); 167562306a36Sopenharmony_ci 167662306a36Sopenharmony_ci r = dm_btree_insert_notify(&pmd->info, pmd->root, keys, &value, 167762306a36Sopenharmony_ci &pmd->root, &inserted); 167862306a36Sopenharmony_ci if (r) 167962306a36Sopenharmony_ci return r; 168062306a36Sopenharmony_ci 168162306a36Sopenharmony_ci td->changed = true; 168262306a36Sopenharmony_ci if (inserted) 168362306a36Sopenharmony_ci td->mapped_blocks++; 168462306a36Sopenharmony_ci 168562306a36Sopenharmony_ci return 0; 168662306a36Sopenharmony_ci} 168762306a36Sopenharmony_ci 168862306a36Sopenharmony_ciint dm_thin_insert_block(struct dm_thin_device *td, dm_block_t block, 168962306a36Sopenharmony_ci dm_block_t data_block) 169062306a36Sopenharmony_ci{ 169162306a36Sopenharmony_ci int r = -EINVAL; 169262306a36Sopenharmony_ci 169362306a36Sopenharmony_ci pmd_write_lock(td->pmd); 169462306a36Sopenharmony_ci if (!td->pmd->fail_io) 169562306a36Sopenharmony_ci r = __insert(td, block, data_block); 169662306a36Sopenharmony_ci pmd_write_unlock(td->pmd); 169762306a36Sopenharmony_ci 169862306a36Sopenharmony_ci return r; 169962306a36Sopenharmony_ci} 170062306a36Sopenharmony_ci 170162306a36Sopenharmony_cistatic int __remove_range(struct dm_thin_device *td, dm_block_t begin, dm_block_t end) 170262306a36Sopenharmony_ci{ 170362306a36Sopenharmony_ci int r; 170462306a36Sopenharmony_ci unsigned int count, total_count = 0; 170562306a36Sopenharmony_ci struct dm_pool_metadata *pmd = td->pmd; 170662306a36Sopenharmony_ci dm_block_t keys[1] = { td->id }; 170762306a36Sopenharmony_ci __le64 value; 170862306a36Sopenharmony_ci dm_block_t mapping_root; 170962306a36Sopenharmony_ci 171062306a36Sopenharmony_ci /* 171162306a36Sopenharmony_ci * Find the mapping tree 171262306a36Sopenharmony_ci */ 171362306a36Sopenharmony_ci r = dm_btree_lookup(&pmd->tl_info, pmd->root, keys, &value); 171462306a36Sopenharmony_ci if (r) 171562306a36Sopenharmony_ci return r; 171662306a36Sopenharmony_ci 171762306a36Sopenharmony_ci /* 171862306a36Sopenharmony_ci * Remove from the mapping tree, taking care to inc the 171962306a36Sopenharmony_ci * ref count so it doesn't get deleted. 172062306a36Sopenharmony_ci */ 172162306a36Sopenharmony_ci mapping_root = le64_to_cpu(value); 172262306a36Sopenharmony_ci dm_tm_inc(pmd->tm, mapping_root); 172362306a36Sopenharmony_ci r = dm_btree_remove(&pmd->tl_info, pmd->root, keys, &pmd->root); 172462306a36Sopenharmony_ci if (r) 172562306a36Sopenharmony_ci return r; 172662306a36Sopenharmony_ci 172762306a36Sopenharmony_ci /* 172862306a36Sopenharmony_ci * Remove leaves stops at the first unmapped entry, so we have to 172962306a36Sopenharmony_ci * loop round finding mapped ranges. 173062306a36Sopenharmony_ci */ 173162306a36Sopenharmony_ci while (begin < end) { 173262306a36Sopenharmony_ci r = dm_btree_lookup_next(&pmd->bl_info, mapping_root, &begin, &begin, &value); 173362306a36Sopenharmony_ci if (r == -ENODATA) 173462306a36Sopenharmony_ci break; 173562306a36Sopenharmony_ci 173662306a36Sopenharmony_ci if (r) 173762306a36Sopenharmony_ci return r; 173862306a36Sopenharmony_ci 173962306a36Sopenharmony_ci if (begin >= end) 174062306a36Sopenharmony_ci break; 174162306a36Sopenharmony_ci 174262306a36Sopenharmony_ci r = dm_btree_remove_leaves(&pmd->bl_info, mapping_root, &begin, end, &mapping_root, &count); 174362306a36Sopenharmony_ci if (r) 174462306a36Sopenharmony_ci return r; 174562306a36Sopenharmony_ci 174662306a36Sopenharmony_ci total_count += count; 174762306a36Sopenharmony_ci } 174862306a36Sopenharmony_ci 174962306a36Sopenharmony_ci td->mapped_blocks -= total_count; 175062306a36Sopenharmony_ci td->changed = true; 175162306a36Sopenharmony_ci 175262306a36Sopenharmony_ci /* 175362306a36Sopenharmony_ci * Reinsert the mapping tree. 175462306a36Sopenharmony_ci */ 175562306a36Sopenharmony_ci value = cpu_to_le64(mapping_root); 175662306a36Sopenharmony_ci __dm_bless_for_disk(&value); 175762306a36Sopenharmony_ci return dm_btree_insert(&pmd->tl_info, pmd->root, keys, &value, &pmd->root); 175862306a36Sopenharmony_ci} 175962306a36Sopenharmony_ci 176062306a36Sopenharmony_ciint dm_thin_remove_range(struct dm_thin_device *td, 176162306a36Sopenharmony_ci dm_block_t begin, dm_block_t end) 176262306a36Sopenharmony_ci{ 176362306a36Sopenharmony_ci int r = -EINVAL; 176462306a36Sopenharmony_ci 176562306a36Sopenharmony_ci pmd_write_lock(td->pmd); 176662306a36Sopenharmony_ci if (!td->pmd->fail_io) 176762306a36Sopenharmony_ci r = __remove_range(td, begin, end); 176862306a36Sopenharmony_ci pmd_write_unlock(td->pmd); 176962306a36Sopenharmony_ci 177062306a36Sopenharmony_ci return r; 177162306a36Sopenharmony_ci} 177262306a36Sopenharmony_ci 177362306a36Sopenharmony_ciint dm_pool_block_is_shared(struct dm_pool_metadata *pmd, dm_block_t b, bool *result) 177462306a36Sopenharmony_ci{ 177562306a36Sopenharmony_ci int r = -EINVAL; 177662306a36Sopenharmony_ci uint32_t ref_count; 177762306a36Sopenharmony_ci 177862306a36Sopenharmony_ci down_read(&pmd->root_lock); 177962306a36Sopenharmony_ci if (!pmd->fail_io) { 178062306a36Sopenharmony_ci r = dm_sm_get_count(pmd->data_sm, b, &ref_count); 178162306a36Sopenharmony_ci if (!r) 178262306a36Sopenharmony_ci *result = (ref_count > 1); 178362306a36Sopenharmony_ci } 178462306a36Sopenharmony_ci up_read(&pmd->root_lock); 178562306a36Sopenharmony_ci 178662306a36Sopenharmony_ci return r; 178762306a36Sopenharmony_ci} 178862306a36Sopenharmony_ci 178962306a36Sopenharmony_ciint dm_pool_inc_data_range(struct dm_pool_metadata *pmd, dm_block_t b, dm_block_t e) 179062306a36Sopenharmony_ci{ 179162306a36Sopenharmony_ci int r = -EINVAL; 179262306a36Sopenharmony_ci 179362306a36Sopenharmony_ci pmd_write_lock(pmd); 179462306a36Sopenharmony_ci if (!pmd->fail_io) 179562306a36Sopenharmony_ci r = dm_sm_inc_blocks(pmd->data_sm, b, e); 179662306a36Sopenharmony_ci pmd_write_unlock(pmd); 179762306a36Sopenharmony_ci 179862306a36Sopenharmony_ci return r; 179962306a36Sopenharmony_ci} 180062306a36Sopenharmony_ci 180162306a36Sopenharmony_ciint dm_pool_dec_data_range(struct dm_pool_metadata *pmd, dm_block_t b, dm_block_t e) 180262306a36Sopenharmony_ci{ 180362306a36Sopenharmony_ci int r = -EINVAL; 180462306a36Sopenharmony_ci 180562306a36Sopenharmony_ci pmd_write_lock(pmd); 180662306a36Sopenharmony_ci if (!pmd->fail_io) 180762306a36Sopenharmony_ci r = dm_sm_dec_blocks(pmd->data_sm, b, e); 180862306a36Sopenharmony_ci pmd_write_unlock(pmd); 180962306a36Sopenharmony_ci 181062306a36Sopenharmony_ci return r; 181162306a36Sopenharmony_ci} 181262306a36Sopenharmony_ci 181362306a36Sopenharmony_cibool dm_thin_changed_this_transaction(struct dm_thin_device *td) 181462306a36Sopenharmony_ci{ 181562306a36Sopenharmony_ci int r; 181662306a36Sopenharmony_ci 181762306a36Sopenharmony_ci down_read(&td->pmd->root_lock); 181862306a36Sopenharmony_ci r = td->changed; 181962306a36Sopenharmony_ci up_read(&td->pmd->root_lock); 182062306a36Sopenharmony_ci 182162306a36Sopenharmony_ci return r; 182262306a36Sopenharmony_ci} 182362306a36Sopenharmony_ci 182462306a36Sopenharmony_cibool dm_pool_changed_this_transaction(struct dm_pool_metadata *pmd) 182562306a36Sopenharmony_ci{ 182662306a36Sopenharmony_ci bool r = false; 182762306a36Sopenharmony_ci struct dm_thin_device *td, *tmp; 182862306a36Sopenharmony_ci 182962306a36Sopenharmony_ci down_read(&pmd->root_lock); 183062306a36Sopenharmony_ci list_for_each_entry_safe(td, tmp, &pmd->thin_devices, list) { 183162306a36Sopenharmony_ci if (td->changed) { 183262306a36Sopenharmony_ci r = td->changed; 183362306a36Sopenharmony_ci break; 183462306a36Sopenharmony_ci } 183562306a36Sopenharmony_ci } 183662306a36Sopenharmony_ci up_read(&pmd->root_lock); 183762306a36Sopenharmony_ci 183862306a36Sopenharmony_ci return r; 183962306a36Sopenharmony_ci} 184062306a36Sopenharmony_ci 184162306a36Sopenharmony_cibool dm_thin_aborted_changes(struct dm_thin_device *td) 184262306a36Sopenharmony_ci{ 184362306a36Sopenharmony_ci bool r; 184462306a36Sopenharmony_ci 184562306a36Sopenharmony_ci down_read(&td->pmd->root_lock); 184662306a36Sopenharmony_ci r = td->aborted_with_changes; 184762306a36Sopenharmony_ci up_read(&td->pmd->root_lock); 184862306a36Sopenharmony_ci 184962306a36Sopenharmony_ci return r; 185062306a36Sopenharmony_ci} 185162306a36Sopenharmony_ci 185262306a36Sopenharmony_ciint dm_pool_alloc_data_block(struct dm_pool_metadata *pmd, dm_block_t *result) 185362306a36Sopenharmony_ci{ 185462306a36Sopenharmony_ci int r = -EINVAL; 185562306a36Sopenharmony_ci 185662306a36Sopenharmony_ci pmd_write_lock(pmd); 185762306a36Sopenharmony_ci if (!pmd->fail_io) 185862306a36Sopenharmony_ci r = dm_sm_new_block(pmd->data_sm, result); 185962306a36Sopenharmony_ci pmd_write_unlock(pmd); 186062306a36Sopenharmony_ci 186162306a36Sopenharmony_ci return r; 186262306a36Sopenharmony_ci} 186362306a36Sopenharmony_ci 186462306a36Sopenharmony_ciint dm_pool_commit_metadata(struct dm_pool_metadata *pmd) 186562306a36Sopenharmony_ci{ 186662306a36Sopenharmony_ci int r = -EINVAL; 186762306a36Sopenharmony_ci 186862306a36Sopenharmony_ci /* 186962306a36Sopenharmony_ci * Care is taken to not have commit be what 187062306a36Sopenharmony_ci * triggers putting the thin-pool in-service. 187162306a36Sopenharmony_ci */ 187262306a36Sopenharmony_ci pmd_write_lock_in_core(pmd); 187362306a36Sopenharmony_ci if (pmd->fail_io) 187462306a36Sopenharmony_ci goto out; 187562306a36Sopenharmony_ci 187662306a36Sopenharmony_ci r = __commit_transaction(pmd); 187762306a36Sopenharmony_ci if (r < 0) 187862306a36Sopenharmony_ci goto out; 187962306a36Sopenharmony_ci 188062306a36Sopenharmony_ci /* 188162306a36Sopenharmony_ci * Open the next transaction. 188262306a36Sopenharmony_ci */ 188362306a36Sopenharmony_ci r = __begin_transaction(pmd); 188462306a36Sopenharmony_ciout: 188562306a36Sopenharmony_ci pmd_write_unlock(pmd); 188662306a36Sopenharmony_ci return r; 188762306a36Sopenharmony_ci} 188862306a36Sopenharmony_ci 188962306a36Sopenharmony_cistatic void __set_abort_with_changes_flags(struct dm_pool_metadata *pmd) 189062306a36Sopenharmony_ci{ 189162306a36Sopenharmony_ci struct dm_thin_device *td; 189262306a36Sopenharmony_ci 189362306a36Sopenharmony_ci list_for_each_entry(td, &pmd->thin_devices, list) 189462306a36Sopenharmony_ci td->aborted_with_changes = td->changed; 189562306a36Sopenharmony_ci} 189662306a36Sopenharmony_ci 189762306a36Sopenharmony_ciint dm_pool_abort_metadata(struct dm_pool_metadata *pmd) 189862306a36Sopenharmony_ci{ 189962306a36Sopenharmony_ci int r = -EINVAL; 190062306a36Sopenharmony_ci 190162306a36Sopenharmony_ci /* fail_io is double-checked with pmd->root_lock held below */ 190262306a36Sopenharmony_ci if (unlikely(pmd->fail_io)) 190362306a36Sopenharmony_ci return r; 190462306a36Sopenharmony_ci 190562306a36Sopenharmony_ci pmd_write_lock(pmd); 190662306a36Sopenharmony_ci if (pmd->fail_io) { 190762306a36Sopenharmony_ci pmd_write_unlock(pmd); 190862306a36Sopenharmony_ci return r; 190962306a36Sopenharmony_ci } 191062306a36Sopenharmony_ci __set_abort_with_changes_flags(pmd); 191162306a36Sopenharmony_ci 191262306a36Sopenharmony_ci /* destroy data_sm/metadata_sm/nb_tm/tm */ 191362306a36Sopenharmony_ci __destroy_persistent_data_objects(pmd, false); 191462306a36Sopenharmony_ci 191562306a36Sopenharmony_ci /* reset bm */ 191662306a36Sopenharmony_ci dm_block_manager_reset(pmd->bm); 191762306a36Sopenharmony_ci 191862306a36Sopenharmony_ci /* rebuild data_sm/metadata_sm/nb_tm/tm */ 191962306a36Sopenharmony_ci r = __open_or_format_metadata(pmd, false); 192062306a36Sopenharmony_ci if (r) 192162306a36Sopenharmony_ci pmd->fail_io = true; 192262306a36Sopenharmony_ci pmd_write_unlock(pmd); 192362306a36Sopenharmony_ci return r; 192462306a36Sopenharmony_ci} 192562306a36Sopenharmony_ci 192662306a36Sopenharmony_ciint dm_pool_get_free_block_count(struct dm_pool_metadata *pmd, dm_block_t *result) 192762306a36Sopenharmony_ci{ 192862306a36Sopenharmony_ci int r = -EINVAL; 192962306a36Sopenharmony_ci 193062306a36Sopenharmony_ci down_read(&pmd->root_lock); 193162306a36Sopenharmony_ci if (!pmd->fail_io) 193262306a36Sopenharmony_ci r = dm_sm_get_nr_free(pmd->data_sm, result); 193362306a36Sopenharmony_ci up_read(&pmd->root_lock); 193462306a36Sopenharmony_ci 193562306a36Sopenharmony_ci return r; 193662306a36Sopenharmony_ci} 193762306a36Sopenharmony_ci 193862306a36Sopenharmony_ciint dm_pool_get_free_metadata_block_count(struct dm_pool_metadata *pmd, 193962306a36Sopenharmony_ci dm_block_t *result) 194062306a36Sopenharmony_ci{ 194162306a36Sopenharmony_ci int r = -EINVAL; 194262306a36Sopenharmony_ci 194362306a36Sopenharmony_ci down_read(&pmd->root_lock); 194462306a36Sopenharmony_ci if (!pmd->fail_io) 194562306a36Sopenharmony_ci r = dm_sm_get_nr_free(pmd->metadata_sm, result); 194662306a36Sopenharmony_ci 194762306a36Sopenharmony_ci if (!r) { 194862306a36Sopenharmony_ci if (*result < pmd->metadata_reserve) 194962306a36Sopenharmony_ci *result = 0; 195062306a36Sopenharmony_ci else 195162306a36Sopenharmony_ci *result -= pmd->metadata_reserve; 195262306a36Sopenharmony_ci } 195362306a36Sopenharmony_ci up_read(&pmd->root_lock); 195462306a36Sopenharmony_ci 195562306a36Sopenharmony_ci return r; 195662306a36Sopenharmony_ci} 195762306a36Sopenharmony_ci 195862306a36Sopenharmony_ciint dm_pool_get_metadata_dev_size(struct dm_pool_metadata *pmd, 195962306a36Sopenharmony_ci dm_block_t *result) 196062306a36Sopenharmony_ci{ 196162306a36Sopenharmony_ci int r = -EINVAL; 196262306a36Sopenharmony_ci 196362306a36Sopenharmony_ci down_read(&pmd->root_lock); 196462306a36Sopenharmony_ci if (!pmd->fail_io) 196562306a36Sopenharmony_ci r = dm_sm_get_nr_blocks(pmd->metadata_sm, result); 196662306a36Sopenharmony_ci up_read(&pmd->root_lock); 196762306a36Sopenharmony_ci 196862306a36Sopenharmony_ci return r; 196962306a36Sopenharmony_ci} 197062306a36Sopenharmony_ci 197162306a36Sopenharmony_ciint dm_pool_get_data_dev_size(struct dm_pool_metadata *pmd, dm_block_t *result) 197262306a36Sopenharmony_ci{ 197362306a36Sopenharmony_ci int r = -EINVAL; 197462306a36Sopenharmony_ci 197562306a36Sopenharmony_ci down_read(&pmd->root_lock); 197662306a36Sopenharmony_ci if (!pmd->fail_io) 197762306a36Sopenharmony_ci r = dm_sm_get_nr_blocks(pmd->data_sm, result); 197862306a36Sopenharmony_ci up_read(&pmd->root_lock); 197962306a36Sopenharmony_ci 198062306a36Sopenharmony_ci return r; 198162306a36Sopenharmony_ci} 198262306a36Sopenharmony_ci 198362306a36Sopenharmony_ciint dm_thin_get_mapped_count(struct dm_thin_device *td, dm_block_t *result) 198462306a36Sopenharmony_ci{ 198562306a36Sopenharmony_ci int r = -EINVAL; 198662306a36Sopenharmony_ci struct dm_pool_metadata *pmd = td->pmd; 198762306a36Sopenharmony_ci 198862306a36Sopenharmony_ci down_read(&pmd->root_lock); 198962306a36Sopenharmony_ci if (!pmd->fail_io) { 199062306a36Sopenharmony_ci *result = td->mapped_blocks; 199162306a36Sopenharmony_ci r = 0; 199262306a36Sopenharmony_ci } 199362306a36Sopenharmony_ci up_read(&pmd->root_lock); 199462306a36Sopenharmony_ci 199562306a36Sopenharmony_ci return r; 199662306a36Sopenharmony_ci} 199762306a36Sopenharmony_ci 199862306a36Sopenharmony_cistatic int __highest_block(struct dm_thin_device *td, dm_block_t *result) 199962306a36Sopenharmony_ci{ 200062306a36Sopenharmony_ci int r; 200162306a36Sopenharmony_ci __le64 value_le; 200262306a36Sopenharmony_ci dm_block_t thin_root; 200362306a36Sopenharmony_ci struct dm_pool_metadata *pmd = td->pmd; 200462306a36Sopenharmony_ci 200562306a36Sopenharmony_ci r = dm_btree_lookup(&pmd->tl_info, pmd->root, &td->id, &value_le); 200662306a36Sopenharmony_ci if (r) 200762306a36Sopenharmony_ci return r; 200862306a36Sopenharmony_ci 200962306a36Sopenharmony_ci thin_root = le64_to_cpu(value_le); 201062306a36Sopenharmony_ci 201162306a36Sopenharmony_ci return dm_btree_find_highest_key(&pmd->bl_info, thin_root, result); 201262306a36Sopenharmony_ci} 201362306a36Sopenharmony_ci 201462306a36Sopenharmony_ciint dm_thin_get_highest_mapped_block(struct dm_thin_device *td, 201562306a36Sopenharmony_ci dm_block_t *result) 201662306a36Sopenharmony_ci{ 201762306a36Sopenharmony_ci int r = -EINVAL; 201862306a36Sopenharmony_ci struct dm_pool_metadata *pmd = td->pmd; 201962306a36Sopenharmony_ci 202062306a36Sopenharmony_ci down_read(&pmd->root_lock); 202162306a36Sopenharmony_ci if (!pmd->fail_io) 202262306a36Sopenharmony_ci r = __highest_block(td, result); 202362306a36Sopenharmony_ci up_read(&pmd->root_lock); 202462306a36Sopenharmony_ci 202562306a36Sopenharmony_ci return r; 202662306a36Sopenharmony_ci} 202762306a36Sopenharmony_ci 202862306a36Sopenharmony_cistatic int __resize_space_map(struct dm_space_map *sm, dm_block_t new_count) 202962306a36Sopenharmony_ci{ 203062306a36Sopenharmony_ci int r; 203162306a36Sopenharmony_ci dm_block_t old_count; 203262306a36Sopenharmony_ci 203362306a36Sopenharmony_ci r = dm_sm_get_nr_blocks(sm, &old_count); 203462306a36Sopenharmony_ci if (r) 203562306a36Sopenharmony_ci return r; 203662306a36Sopenharmony_ci 203762306a36Sopenharmony_ci if (new_count == old_count) 203862306a36Sopenharmony_ci return 0; 203962306a36Sopenharmony_ci 204062306a36Sopenharmony_ci if (new_count < old_count) { 204162306a36Sopenharmony_ci DMERR("cannot reduce size of space map"); 204262306a36Sopenharmony_ci return -EINVAL; 204362306a36Sopenharmony_ci } 204462306a36Sopenharmony_ci 204562306a36Sopenharmony_ci return dm_sm_extend(sm, new_count - old_count); 204662306a36Sopenharmony_ci} 204762306a36Sopenharmony_ci 204862306a36Sopenharmony_ciint dm_pool_resize_data_dev(struct dm_pool_metadata *pmd, dm_block_t new_count) 204962306a36Sopenharmony_ci{ 205062306a36Sopenharmony_ci int r = -EINVAL; 205162306a36Sopenharmony_ci 205262306a36Sopenharmony_ci pmd_write_lock(pmd); 205362306a36Sopenharmony_ci if (!pmd->fail_io) 205462306a36Sopenharmony_ci r = __resize_space_map(pmd->data_sm, new_count); 205562306a36Sopenharmony_ci pmd_write_unlock(pmd); 205662306a36Sopenharmony_ci 205762306a36Sopenharmony_ci return r; 205862306a36Sopenharmony_ci} 205962306a36Sopenharmony_ci 206062306a36Sopenharmony_ciint dm_pool_resize_metadata_dev(struct dm_pool_metadata *pmd, dm_block_t new_count) 206162306a36Sopenharmony_ci{ 206262306a36Sopenharmony_ci int r = -EINVAL; 206362306a36Sopenharmony_ci 206462306a36Sopenharmony_ci pmd_write_lock(pmd); 206562306a36Sopenharmony_ci if (!pmd->fail_io) { 206662306a36Sopenharmony_ci r = __resize_space_map(pmd->metadata_sm, new_count); 206762306a36Sopenharmony_ci if (!r) 206862306a36Sopenharmony_ci __set_metadata_reserve(pmd); 206962306a36Sopenharmony_ci } 207062306a36Sopenharmony_ci pmd_write_unlock(pmd); 207162306a36Sopenharmony_ci 207262306a36Sopenharmony_ci return r; 207362306a36Sopenharmony_ci} 207462306a36Sopenharmony_ci 207562306a36Sopenharmony_civoid dm_pool_metadata_read_only(struct dm_pool_metadata *pmd) 207662306a36Sopenharmony_ci{ 207762306a36Sopenharmony_ci pmd_write_lock_in_core(pmd); 207862306a36Sopenharmony_ci dm_bm_set_read_only(pmd->bm); 207962306a36Sopenharmony_ci pmd_write_unlock(pmd); 208062306a36Sopenharmony_ci} 208162306a36Sopenharmony_ci 208262306a36Sopenharmony_civoid dm_pool_metadata_read_write(struct dm_pool_metadata *pmd) 208362306a36Sopenharmony_ci{ 208462306a36Sopenharmony_ci pmd_write_lock_in_core(pmd); 208562306a36Sopenharmony_ci dm_bm_set_read_write(pmd->bm); 208662306a36Sopenharmony_ci pmd_write_unlock(pmd); 208762306a36Sopenharmony_ci} 208862306a36Sopenharmony_ci 208962306a36Sopenharmony_ciint dm_pool_register_metadata_threshold(struct dm_pool_metadata *pmd, 209062306a36Sopenharmony_ci dm_block_t threshold, 209162306a36Sopenharmony_ci dm_sm_threshold_fn fn, 209262306a36Sopenharmony_ci void *context) 209362306a36Sopenharmony_ci{ 209462306a36Sopenharmony_ci int r = -EINVAL; 209562306a36Sopenharmony_ci 209662306a36Sopenharmony_ci pmd_write_lock_in_core(pmd); 209762306a36Sopenharmony_ci if (!pmd->fail_io) { 209862306a36Sopenharmony_ci r = dm_sm_register_threshold_callback(pmd->metadata_sm, 209962306a36Sopenharmony_ci threshold, fn, context); 210062306a36Sopenharmony_ci } 210162306a36Sopenharmony_ci pmd_write_unlock(pmd); 210262306a36Sopenharmony_ci 210362306a36Sopenharmony_ci return r; 210462306a36Sopenharmony_ci} 210562306a36Sopenharmony_ci 210662306a36Sopenharmony_civoid dm_pool_register_pre_commit_callback(struct dm_pool_metadata *pmd, 210762306a36Sopenharmony_ci dm_pool_pre_commit_fn fn, 210862306a36Sopenharmony_ci void *context) 210962306a36Sopenharmony_ci{ 211062306a36Sopenharmony_ci pmd_write_lock_in_core(pmd); 211162306a36Sopenharmony_ci pmd->pre_commit_fn = fn; 211262306a36Sopenharmony_ci pmd->pre_commit_context = context; 211362306a36Sopenharmony_ci pmd_write_unlock(pmd); 211462306a36Sopenharmony_ci} 211562306a36Sopenharmony_ci 211662306a36Sopenharmony_ciint dm_pool_metadata_set_needs_check(struct dm_pool_metadata *pmd) 211762306a36Sopenharmony_ci{ 211862306a36Sopenharmony_ci int r = -EINVAL; 211962306a36Sopenharmony_ci struct dm_block *sblock; 212062306a36Sopenharmony_ci struct thin_disk_superblock *disk_super; 212162306a36Sopenharmony_ci 212262306a36Sopenharmony_ci pmd_write_lock(pmd); 212362306a36Sopenharmony_ci if (pmd->fail_io) 212462306a36Sopenharmony_ci goto out; 212562306a36Sopenharmony_ci 212662306a36Sopenharmony_ci pmd->flags |= THIN_METADATA_NEEDS_CHECK_FLAG; 212762306a36Sopenharmony_ci 212862306a36Sopenharmony_ci r = superblock_lock(pmd, &sblock); 212962306a36Sopenharmony_ci if (r) { 213062306a36Sopenharmony_ci DMERR("couldn't lock superblock"); 213162306a36Sopenharmony_ci goto out; 213262306a36Sopenharmony_ci } 213362306a36Sopenharmony_ci 213462306a36Sopenharmony_ci disk_super = dm_block_data(sblock); 213562306a36Sopenharmony_ci disk_super->flags = cpu_to_le32(pmd->flags); 213662306a36Sopenharmony_ci 213762306a36Sopenharmony_ci dm_bm_unlock(sblock); 213862306a36Sopenharmony_ciout: 213962306a36Sopenharmony_ci pmd_write_unlock(pmd); 214062306a36Sopenharmony_ci return r; 214162306a36Sopenharmony_ci} 214262306a36Sopenharmony_ci 214362306a36Sopenharmony_cibool dm_pool_metadata_needs_check(struct dm_pool_metadata *pmd) 214462306a36Sopenharmony_ci{ 214562306a36Sopenharmony_ci bool needs_check; 214662306a36Sopenharmony_ci 214762306a36Sopenharmony_ci down_read(&pmd->root_lock); 214862306a36Sopenharmony_ci needs_check = pmd->flags & THIN_METADATA_NEEDS_CHECK_FLAG; 214962306a36Sopenharmony_ci up_read(&pmd->root_lock); 215062306a36Sopenharmony_ci 215162306a36Sopenharmony_ci return needs_check; 215262306a36Sopenharmony_ci} 215362306a36Sopenharmony_ci 215462306a36Sopenharmony_civoid dm_pool_issue_prefetches(struct dm_pool_metadata *pmd) 215562306a36Sopenharmony_ci{ 215662306a36Sopenharmony_ci down_read(&pmd->root_lock); 215762306a36Sopenharmony_ci if (!pmd->fail_io) 215862306a36Sopenharmony_ci dm_tm_issue_prefetches(pmd->tm); 215962306a36Sopenharmony_ci up_read(&pmd->root_lock); 216062306a36Sopenharmony_ci} 2161