18c2ecf20Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0 28c2ecf20Sopenharmony_ci/* 38c2ecf20Sopenharmony_ci * Copyright (C) 2018 Cambridge Greys Ltd 48c2ecf20Sopenharmony_ci * Copyright (C) 2015-2016 Anton Ivanov (aivanov@brocade.com) 58c2ecf20Sopenharmony_ci * Copyright (C) 2000 Jeff Dike (jdike@karaya.com) 68c2ecf20Sopenharmony_ci */ 78c2ecf20Sopenharmony_ci 88c2ecf20Sopenharmony_ci/* 2001-09-28...2002-04-17 98c2ecf20Sopenharmony_ci * Partition stuff by James_McMechan@hotmail.com 108c2ecf20Sopenharmony_ci * old style ubd by setting UBD_SHIFT to 0 118c2ecf20Sopenharmony_ci * 2002-09-27...2002-10-18 massive tinkering for 2.5 128c2ecf20Sopenharmony_ci * partitions have changed in 2.5 138c2ecf20Sopenharmony_ci * 2003-01-29 more tinkering for 2.5.59-1 148c2ecf20Sopenharmony_ci * This should now address the sysfs problems and has 158c2ecf20Sopenharmony_ci * the symlink for devfs to allow for booting with 168c2ecf20Sopenharmony_ci * the common /dev/ubd/discX/... names rather than 178c2ecf20Sopenharmony_ci * only /dev/ubdN/discN this version also has lots of 188c2ecf20Sopenharmony_ci * clean ups preparing for ubd-many. 198c2ecf20Sopenharmony_ci * James McMechan 208c2ecf20Sopenharmony_ci */ 218c2ecf20Sopenharmony_ci 228c2ecf20Sopenharmony_ci#define UBD_SHIFT 4 238c2ecf20Sopenharmony_ci 248c2ecf20Sopenharmony_ci#include <linux/module.h> 258c2ecf20Sopenharmony_ci#include <linux/init.h> 268c2ecf20Sopenharmony_ci#include <linux/blkdev.h> 278c2ecf20Sopenharmony_ci#include <linux/blk-mq.h> 288c2ecf20Sopenharmony_ci#include <linux/ata.h> 298c2ecf20Sopenharmony_ci#include <linux/hdreg.h> 308c2ecf20Sopenharmony_ci#include <linux/cdrom.h> 318c2ecf20Sopenharmony_ci#include <linux/proc_fs.h> 328c2ecf20Sopenharmony_ci#include <linux/seq_file.h> 338c2ecf20Sopenharmony_ci#include <linux/ctype.h> 348c2ecf20Sopenharmony_ci#include <linux/slab.h> 358c2ecf20Sopenharmony_ci#include <linux/vmalloc.h> 368c2ecf20Sopenharmony_ci#include <linux/platform_device.h> 378c2ecf20Sopenharmony_ci#include <linux/scatterlist.h> 388c2ecf20Sopenharmony_ci#include <asm/tlbflush.h> 398c2ecf20Sopenharmony_ci#include <kern_util.h> 408c2ecf20Sopenharmony_ci#include "mconsole_kern.h" 418c2ecf20Sopenharmony_ci#include <init.h> 428c2ecf20Sopenharmony_ci#include <irq_kern.h> 438c2ecf20Sopenharmony_ci#include "ubd.h" 448c2ecf20Sopenharmony_ci#include <os.h> 458c2ecf20Sopenharmony_ci#include "cow.h" 468c2ecf20Sopenharmony_ci 478c2ecf20Sopenharmony_ci/* Max request size is determined by sector mask - 32K */ 488c2ecf20Sopenharmony_ci#define UBD_MAX_REQUEST (8 * sizeof(long)) 498c2ecf20Sopenharmony_ci 508c2ecf20Sopenharmony_cistruct io_desc { 518c2ecf20Sopenharmony_ci char *buffer; 528c2ecf20Sopenharmony_ci unsigned long length; 538c2ecf20Sopenharmony_ci unsigned long sector_mask; 548c2ecf20Sopenharmony_ci unsigned long long cow_offset; 558c2ecf20Sopenharmony_ci unsigned long bitmap_words[2]; 568c2ecf20Sopenharmony_ci}; 578c2ecf20Sopenharmony_ci 588c2ecf20Sopenharmony_cistruct io_thread_req { 598c2ecf20Sopenharmony_ci struct request *req; 608c2ecf20Sopenharmony_ci int fds[2]; 618c2ecf20Sopenharmony_ci unsigned long offsets[2]; 628c2ecf20Sopenharmony_ci unsigned long long offset; 638c2ecf20Sopenharmony_ci int sectorsize; 648c2ecf20Sopenharmony_ci int error; 658c2ecf20Sopenharmony_ci 668c2ecf20Sopenharmony_ci int desc_cnt; 678c2ecf20Sopenharmony_ci /* io_desc has to be the last element of the struct */ 688c2ecf20Sopenharmony_ci struct io_desc io_desc[]; 698c2ecf20Sopenharmony_ci}; 708c2ecf20Sopenharmony_ci 718c2ecf20Sopenharmony_ci 728c2ecf20Sopenharmony_cistatic struct io_thread_req * (*irq_req_buffer)[]; 738c2ecf20Sopenharmony_cistatic struct io_thread_req *irq_remainder; 748c2ecf20Sopenharmony_cistatic int irq_remainder_size; 758c2ecf20Sopenharmony_ci 768c2ecf20Sopenharmony_cistatic struct io_thread_req * (*io_req_buffer)[]; 778c2ecf20Sopenharmony_cistatic struct io_thread_req *io_remainder; 788c2ecf20Sopenharmony_cistatic int io_remainder_size; 798c2ecf20Sopenharmony_ci 808c2ecf20Sopenharmony_ci 818c2ecf20Sopenharmony_ci 828c2ecf20Sopenharmony_cistatic inline int ubd_test_bit(__u64 bit, unsigned char *data) 838c2ecf20Sopenharmony_ci{ 848c2ecf20Sopenharmony_ci __u64 n; 858c2ecf20Sopenharmony_ci int bits, off; 868c2ecf20Sopenharmony_ci 878c2ecf20Sopenharmony_ci bits = sizeof(data[0]) * 8; 888c2ecf20Sopenharmony_ci n = bit / bits; 898c2ecf20Sopenharmony_ci off = bit % bits; 908c2ecf20Sopenharmony_ci return (data[n] & (1 << off)) != 0; 918c2ecf20Sopenharmony_ci} 928c2ecf20Sopenharmony_ci 938c2ecf20Sopenharmony_cistatic inline void ubd_set_bit(__u64 bit, unsigned char *data) 948c2ecf20Sopenharmony_ci{ 958c2ecf20Sopenharmony_ci __u64 n; 968c2ecf20Sopenharmony_ci int bits, off; 978c2ecf20Sopenharmony_ci 988c2ecf20Sopenharmony_ci bits = sizeof(data[0]) * 8; 998c2ecf20Sopenharmony_ci n = bit / bits; 1008c2ecf20Sopenharmony_ci off = bit % bits; 1018c2ecf20Sopenharmony_ci data[n] |= (1 << off); 1028c2ecf20Sopenharmony_ci} 1038c2ecf20Sopenharmony_ci/*End stuff from ubd_user.h*/ 1048c2ecf20Sopenharmony_ci 1058c2ecf20Sopenharmony_ci#define DRIVER_NAME "uml-blkdev" 1068c2ecf20Sopenharmony_ci 1078c2ecf20Sopenharmony_cistatic DEFINE_MUTEX(ubd_lock); 1088c2ecf20Sopenharmony_cistatic DEFINE_MUTEX(ubd_mutex); /* replaces BKL, might not be needed */ 1098c2ecf20Sopenharmony_ci 1108c2ecf20Sopenharmony_cistatic int ubd_open(struct block_device *bdev, fmode_t mode); 1118c2ecf20Sopenharmony_cistatic void ubd_release(struct gendisk *disk, fmode_t mode); 1128c2ecf20Sopenharmony_cistatic int ubd_ioctl(struct block_device *bdev, fmode_t mode, 1138c2ecf20Sopenharmony_ci unsigned int cmd, unsigned long arg); 1148c2ecf20Sopenharmony_cistatic int ubd_getgeo(struct block_device *bdev, struct hd_geometry *geo); 1158c2ecf20Sopenharmony_ci 1168c2ecf20Sopenharmony_ci#define MAX_DEV (16) 1178c2ecf20Sopenharmony_ci 1188c2ecf20Sopenharmony_cistatic const struct block_device_operations ubd_blops = { 1198c2ecf20Sopenharmony_ci .owner = THIS_MODULE, 1208c2ecf20Sopenharmony_ci .open = ubd_open, 1218c2ecf20Sopenharmony_ci .release = ubd_release, 1228c2ecf20Sopenharmony_ci .ioctl = ubd_ioctl, 1238c2ecf20Sopenharmony_ci .compat_ioctl = blkdev_compat_ptr_ioctl, 1248c2ecf20Sopenharmony_ci .getgeo = ubd_getgeo, 1258c2ecf20Sopenharmony_ci}; 1268c2ecf20Sopenharmony_ci 1278c2ecf20Sopenharmony_ci/* Protected by ubd_lock */ 1288c2ecf20Sopenharmony_cistatic int fake_major = UBD_MAJOR; 1298c2ecf20Sopenharmony_cistatic struct gendisk *ubd_gendisk[MAX_DEV]; 1308c2ecf20Sopenharmony_cistatic struct gendisk *fake_gendisk[MAX_DEV]; 1318c2ecf20Sopenharmony_ci 1328c2ecf20Sopenharmony_ci#ifdef CONFIG_BLK_DEV_UBD_SYNC 1338c2ecf20Sopenharmony_ci#define OPEN_FLAGS ((struct openflags) { .r = 1, .w = 1, .s = 1, .c = 0, \ 1348c2ecf20Sopenharmony_ci .cl = 1 }) 1358c2ecf20Sopenharmony_ci#else 1368c2ecf20Sopenharmony_ci#define OPEN_FLAGS ((struct openflags) { .r = 1, .w = 1, .s = 0, .c = 0, \ 1378c2ecf20Sopenharmony_ci .cl = 1 }) 1388c2ecf20Sopenharmony_ci#endif 1398c2ecf20Sopenharmony_cistatic struct openflags global_openflags = OPEN_FLAGS; 1408c2ecf20Sopenharmony_ci 1418c2ecf20Sopenharmony_cistruct cow { 1428c2ecf20Sopenharmony_ci /* backing file name */ 1438c2ecf20Sopenharmony_ci char *file; 1448c2ecf20Sopenharmony_ci /* backing file fd */ 1458c2ecf20Sopenharmony_ci int fd; 1468c2ecf20Sopenharmony_ci unsigned long *bitmap; 1478c2ecf20Sopenharmony_ci unsigned long bitmap_len; 1488c2ecf20Sopenharmony_ci int bitmap_offset; 1498c2ecf20Sopenharmony_ci int data_offset; 1508c2ecf20Sopenharmony_ci}; 1518c2ecf20Sopenharmony_ci 1528c2ecf20Sopenharmony_ci#define MAX_SG 64 1538c2ecf20Sopenharmony_ci 1548c2ecf20Sopenharmony_cistruct ubd { 1558c2ecf20Sopenharmony_ci /* name (and fd, below) of the file opened for writing, either the 1568c2ecf20Sopenharmony_ci * backing or the cow file. */ 1578c2ecf20Sopenharmony_ci char *file; 1588c2ecf20Sopenharmony_ci int count; 1598c2ecf20Sopenharmony_ci int fd; 1608c2ecf20Sopenharmony_ci __u64 size; 1618c2ecf20Sopenharmony_ci struct openflags boot_openflags; 1628c2ecf20Sopenharmony_ci struct openflags openflags; 1638c2ecf20Sopenharmony_ci unsigned shared:1; 1648c2ecf20Sopenharmony_ci unsigned no_cow:1; 1658c2ecf20Sopenharmony_ci unsigned no_trim:1; 1668c2ecf20Sopenharmony_ci struct cow cow; 1678c2ecf20Sopenharmony_ci struct platform_device pdev; 1688c2ecf20Sopenharmony_ci struct request_queue *queue; 1698c2ecf20Sopenharmony_ci struct blk_mq_tag_set tag_set; 1708c2ecf20Sopenharmony_ci spinlock_t lock; 1718c2ecf20Sopenharmony_ci}; 1728c2ecf20Sopenharmony_ci 1738c2ecf20Sopenharmony_ci#define DEFAULT_COW { \ 1748c2ecf20Sopenharmony_ci .file = NULL, \ 1758c2ecf20Sopenharmony_ci .fd = -1, \ 1768c2ecf20Sopenharmony_ci .bitmap = NULL, \ 1778c2ecf20Sopenharmony_ci .bitmap_offset = 0, \ 1788c2ecf20Sopenharmony_ci .data_offset = 0, \ 1798c2ecf20Sopenharmony_ci} 1808c2ecf20Sopenharmony_ci 1818c2ecf20Sopenharmony_ci#define DEFAULT_UBD { \ 1828c2ecf20Sopenharmony_ci .file = NULL, \ 1838c2ecf20Sopenharmony_ci .count = 0, \ 1848c2ecf20Sopenharmony_ci .fd = -1, \ 1858c2ecf20Sopenharmony_ci .size = -1, \ 1868c2ecf20Sopenharmony_ci .boot_openflags = OPEN_FLAGS, \ 1878c2ecf20Sopenharmony_ci .openflags = OPEN_FLAGS, \ 1888c2ecf20Sopenharmony_ci .no_cow = 0, \ 1898c2ecf20Sopenharmony_ci .no_trim = 0, \ 1908c2ecf20Sopenharmony_ci .shared = 0, \ 1918c2ecf20Sopenharmony_ci .cow = DEFAULT_COW, \ 1928c2ecf20Sopenharmony_ci .lock = __SPIN_LOCK_UNLOCKED(ubd_devs.lock), \ 1938c2ecf20Sopenharmony_ci} 1948c2ecf20Sopenharmony_ci 1958c2ecf20Sopenharmony_ci/* Protected by ubd_lock */ 1968c2ecf20Sopenharmony_cistatic struct ubd ubd_devs[MAX_DEV] = { [0 ... MAX_DEV - 1] = DEFAULT_UBD }; 1978c2ecf20Sopenharmony_ci 1988c2ecf20Sopenharmony_ci/* Only changed by fake_ide_setup which is a setup */ 1998c2ecf20Sopenharmony_cistatic int fake_ide = 0; 2008c2ecf20Sopenharmony_cistatic struct proc_dir_entry *proc_ide_root = NULL; 2018c2ecf20Sopenharmony_cistatic struct proc_dir_entry *proc_ide = NULL; 2028c2ecf20Sopenharmony_ci 2038c2ecf20Sopenharmony_cistatic blk_status_t ubd_queue_rq(struct blk_mq_hw_ctx *hctx, 2048c2ecf20Sopenharmony_ci const struct blk_mq_queue_data *bd); 2058c2ecf20Sopenharmony_ci 2068c2ecf20Sopenharmony_cistatic void make_proc_ide(void) 2078c2ecf20Sopenharmony_ci{ 2088c2ecf20Sopenharmony_ci proc_ide_root = proc_mkdir("ide", NULL); 2098c2ecf20Sopenharmony_ci proc_ide = proc_mkdir("ide0", proc_ide_root); 2108c2ecf20Sopenharmony_ci} 2118c2ecf20Sopenharmony_ci 2128c2ecf20Sopenharmony_cistatic int fake_ide_media_proc_show(struct seq_file *m, void *v) 2138c2ecf20Sopenharmony_ci{ 2148c2ecf20Sopenharmony_ci seq_puts(m, "disk\n"); 2158c2ecf20Sopenharmony_ci return 0; 2168c2ecf20Sopenharmony_ci} 2178c2ecf20Sopenharmony_ci 2188c2ecf20Sopenharmony_cistatic void make_ide_entries(const char *dev_name) 2198c2ecf20Sopenharmony_ci{ 2208c2ecf20Sopenharmony_ci struct proc_dir_entry *dir, *ent; 2218c2ecf20Sopenharmony_ci char name[64]; 2228c2ecf20Sopenharmony_ci 2238c2ecf20Sopenharmony_ci if(proc_ide_root == NULL) make_proc_ide(); 2248c2ecf20Sopenharmony_ci 2258c2ecf20Sopenharmony_ci dir = proc_mkdir(dev_name, proc_ide); 2268c2ecf20Sopenharmony_ci if(!dir) return; 2278c2ecf20Sopenharmony_ci 2288c2ecf20Sopenharmony_ci ent = proc_create_single("media", S_IRUGO, dir, 2298c2ecf20Sopenharmony_ci fake_ide_media_proc_show); 2308c2ecf20Sopenharmony_ci if(!ent) return; 2318c2ecf20Sopenharmony_ci snprintf(name, sizeof(name), "ide0/%s", dev_name); 2328c2ecf20Sopenharmony_ci proc_symlink(dev_name, proc_ide_root, name); 2338c2ecf20Sopenharmony_ci} 2348c2ecf20Sopenharmony_ci 2358c2ecf20Sopenharmony_cistatic int fake_ide_setup(char *str) 2368c2ecf20Sopenharmony_ci{ 2378c2ecf20Sopenharmony_ci fake_ide = 1; 2388c2ecf20Sopenharmony_ci return 1; 2398c2ecf20Sopenharmony_ci} 2408c2ecf20Sopenharmony_ci 2418c2ecf20Sopenharmony_ci__setup("fake_ide", fake_ide_setup); 2428c2ecf20Sopenharmony_ci 2438c2ecf20Sopenharmony_ci__uml_help(fake_ide_setup, 2448c2ecf20Sopenharmony_ci"fake_ide\n" 2458c2ecf20Sopenharmony_ci" Create ide0 entries that map onto ubd devices.\n\n" 2468c2ecf20Sopenharmony_ci); 2478c2ecf20Sopenharmony_ci 2488c2ecf20Sopenharmony_cistatic int parse_unit(char **ptr) 2498c2ecf20Sopenharmony_ci{ 2508c2ecf20Sopenharmony_ci char *str = *ptr, *end; 2518c2ecf20Sopenharmony_ci int n = -1; 2528c2ecf20Sopenharmony_ci 2538c2ecf20Sopenharmony_ci if(isdigit(*str)) { 2548c2ecf20Sopenharmony_ci n = simple_strtoul(str, &end, 0); 2558c2ecf20Sopenharmony_ci if(end == str) 2568c2ecf20Sopenharmony_ci return -1; 2578c2ecf20Sopenharmony_ci *ptr = end; 2588c2ecf20Sopenharmony_ci } 2598c2ecf20Sopenharmony_ci else if (('a' <= *str) && (*str <= 'z')) { 2608c2ecf20Sopenharmony_ci n = *str - 'a'; 2618c2ecf20Sopenharmony_ci str++; 2628c2ecf20Sopenharmony_ci *ptr = str; 2638c2ecf20Sopenharmony_ci } 2648c2ecf20Sopenharmony_ci return n; 2658c2ecf20Sopenharmony_ci} 2668c2ecf20Sopenharmony_ci 2678c2ecf20Sopenharmony_ci/* If *index_out == -1 at exit, the passed option was a general one; 2688c2ecf20Sopenharmony_ci * otherwise, the str pointer is used (and owned) inside ubd_devs array, so it 2698c2ecf20Sopenharmony_ci * should not be freed on exit. 2708c2ecf20Sopenharmony_ci */ 2718c2ecf20Sopenharmony_cistatic int ubd_setup_common(char *str, int *index_out, char **error_out) 2728c2ecf20Sopenharmony_ci{ 2738c2ecf20Sopenharmony_ci struct ubd *ubd_dev; 2748c2ecf20Sopenharmony_ci struct openflags flags = global_openflags; 2758c2ecf20Sopenharmony_ci char *backing_file; 2768c2ecf20Sopenharmony_ci int n, err = 0, i; 2778c2ecf20Sopenharmony_ci 2788c2ecf20Sopenharmony_ci if(index_out) *index_out = -1; 2798c2ecf20Sopenharmony_ci n = *str; 2808c2ecf20Sopenharmony_ci if(n == '='){ 2818c2ecf20Sopenharmony_ci char *end; 2828c2ecf20Sopenharmony_ci int major; 2838c2ecf20Sopenharmony_ci 2848c2ecf20Sopenharmony_ci str++; 2858c2ecf20Sopenharmony_ci if(!strcmp(str, "sync")){ 2868c2ecf20Sopenharmony_ci global_openflags = of_sync(global_openflags); 2878c2ecf20Sopenharmony_ci return err; 2888c2ecf20Sopenharmony_ci } 2898c2ecf20Sopenharmony_ci 2908c2ecf20Sopenharmony_ci err = -EINVAL; 2918c2ecf20Sopenharmony_ci major = simple_strtoul(str, &end, 0); 2928c2ecf20Sopenharmony_ci if((*end != '\0') || (end == str)){ 2938c2ecf20Sopenharmony_ci *error_out = "Didn't parse major number"; 2948c2ecf20Sopenharmony_ci return err; 2958c2ecf20Sopenharmony_ci } 2968c2ecf20Sopenharmony_ci 2978c2ecf20Sopenharmony_ci mutex_lock(&ubd_lock); 2988c2ecf20Sopenharmony_ci if (fake_major != UBD_MAJOR) { 2998c2ecf20Sopenharmony_ci *error_out = "Can't assign a fake major twice"; 3008c2ecf20Sopenharmony_ci goto out1; 3018c2ecf20Sopenharmony_ci } 3028c2ecf20Sopenharmony_ci 3038c2ecf20Sopenharmony_ci fake_major = major; 3048c2ecf20Sopenharmony_ci 3058c2ecf20Sopenharmony_ci printk(KERN_INFO "Setting extra ubd major number to %d\n", 3068c2ecf20Sopenharmony_ci major); 3078c2ecf20Sopenharmony_ci err = 0; 3088c2ecf20Sopenharmony_ci out1: 3098c2ecf20Sopenharmony_ci mutex_unlock(&ubd_lock); 3108c2ecf20Sopenharmony_ci return err; 3118c2ecf20Sopenharmony_ci } 3128c2ecf20Sopenharmony_ci 3138c2ecf20Sopenharmony_ci n = parse_unit(&str); 3148c2ecf20Sopenharmony_ci if(n < 0){ 3158c2ecf20Sopenharmony_ci *error_out = "Couldn't parse device number"; 3168c2ecf20Sopenharmony_ci return -EINVAL; 3178c2ecf20Sopenharmony_ci } 3188c2ecf20Sopenharmony_ci if(n >= MAX_DEV){ 3198c2ecf20Sopenharmony_ci *error_out = "Device number out of range"; 3208c2ecf20Sopenharmony_ci return 1; 3218c2ecf20Sopenharmony_ci } 3228c2ecf20Sopenharmony_ci 3238c2ecf20Sopenharmony_ci err = -EBUSY; 3248c2ecf20Sopenharmony_ci mutex_lock(&ubd_lock); 3258c2ecf20Sopenharmony_ci 3268c2ecf20Sopenharmony_ci ubd_dev = &ubd_devs[n]; 3278c2ecf20Sopenharmony_ci if(ubd_dev->file != NULL){ 3288c2ecf20Sopenharmony_ci *error_out = "Device is already configured"; 3298c2ecf20Sopenharmony_ci goto out; 3308c2ecf20Sopenharmony_ci } 3318c2ecf20Sopenharmony_ci 3328c2ecf20Sopenharmony_ci if (index_out) 3338c2ecf20Sopenharmony_ci *index_out = n; 3348c2ecf20Sopenharmony_ci 3358c2ecf20Sopenharmony_ci err = -EINVAL; 3368c2ecf20Sopenharmony_ci for (i = 0; i < sizeof("rscdt="); i++) { 3378c2ecf20Sopenharmony_ci switch (*str) { 3388c2ecf20Sopenharmony_ci case 'r': 3398c2ecf20Sopenharmony_ci flags.w = 0; 3408c2ecf20Sopenharmony_ci break; 3418c2ecf20Sopenharmony_ci case 's': 3428c2ecf20Sopenharmony_ci flags.s = 1; 3438c2ecf20Sopenharmony_ci break; 3448c2ecf20Sopenharmony_ci case 'd': 3458c2ecf20Sopenharmony_ci ubd_dev->no_cow = 1; 3468c2ecf20Sopenharmony_ci break; 3478c2ecf20Sopenharmony_ci case 'c': 3488c2ecf20Sopenharmony_ci ubd_dev->shared = 1; 3498c2ecf20Sopenharmony_ci break; 3508c2ecf20Sopenharmony_ci case 't': 3518c2ecf20Sopenharmony_ci ubd_dev->no_trim = 1; 3528c2ecf20Sopenharmony_ci break; 3538c2ecf20Sopenharmony_ci case '=': 3548c2ecf20Sopenharmony_ci str++; 3558c2ecf20Sopenharmony_ci goto break_loop; 3568c2ecf20Sopenharmony_ci default: 3578c2ecf20Sopenharmony_ci *error_out = "Expected '=' or flag letter " 3588c2ecf20Sopenharmony_ci "(r, s, c, t or d)"; 3598c2ecf20Sopenharmony_ci goto out; 3608c2ecf20Sopenharmony_ci } 3618c2ecf20Sopenharmony_ci str++; 3628c2ecf20Sopenharmony_ci } 3638c2ecf20Sopenharmony_ci 3648c2ecf20Sopenharmony_ci if (*str == '=') 3658c2ecf20Sopenharmony_ci *error_out = "Too many flags specified"; 3668c2ecf20Sopenharmony_ci else 3678c2ecf20Sopenharmony_ci *error_out = "Missing '='"; 3688c2ecf20Sopenharmony_ci goto out; 3698c2ecf20Sopenharmony_ci 3708c2ecf20Sopenharmony_cibreak_loop: 3718c2ecf20Sopenharmony_ci backing_file = strchr(str, ','); 3728c2ecf20Sopenharmony_ci 3738c2ecf20Sopenharmony_ci if (backing_file == NULL) 3748c2ecf20Sopenharmony_ci backing_file = strchr(str, ':'); 3758c2ecf20Sopenharmony_ci 3768c2ecf20Sopenharmony_ci if(backing_file != NULL){ 3778c2ecf20Sopenharmony_ci if(ubd_dev->no_cow){ 3788c2ecf20Sopenharmony_ci *error_out = "Can't specify both 'd' and a cow file"; 3798c2ecf20Sopenharmony_ci goto out; 3808c2ecf20Sopenharmony_ci } 3818c2ecf20Sopenharmony_ci else { 3828c2ecf20Sopenharmony_ci *backing_file = '\0'; 3838c2ecf20Sopenharmony_ci backing_file++; 3848c2ecf20Sopenharmony_ci } 3858c2ecf20Sopenharmony_ci } 3868c2ecf20Sopenharmony_ci err = 0; 3878c2ecf20Sopenharmony_ci ubd_dev->file = str; 3888c2ecf20Sopenharmony_ci ubd_dev->cow.file = backing_file; 3898c2ecf20Sopenharmony_ci ubd_dev->boot_openflags = flags; 3908c2ecf20Sopenharmony_ciout: 3918c2ecf20Sopenharmony_ci mutex_unlock(&ubd_lock); 3928c2ecf20Sopenharmony_ci return err; 3938c2ecf20Sopenharmony_ci} 3948c2ecf20Sopenharmony_ci 3958c2ecf20Sopenharmony_cistatic int ubd_setup(char *str) 3968c2ecf20Sopenharmony_ci{ 3978c2ecf20Sopenharmony_ci char *error; 3988c2ecf20Sopenharmony_ci int err; 3998c2ecf20Sopenharmony_ci 4008c2ecf20Sopenharmony_ci err = ubd_setup_common(str, NULL, &error); 4018c2ecf20Sopenharmony_ci if(err) 4028c2ecf20Sopenharmony_ci printk(KERN_ERR "Failed to initialize device with \"%s\" : " 4038c2ecf20Sopenharmony_ci "%s\n", str, error); 4048c2ecf20Sopenharmony_ci return 1; 4058c2ecf20Sopenharmony_ci} 4068c2ecf20Sopenharmony_ci 4078c2ecf20Sopenharmony_ci__setup("ubd", ubd_setup); 4088c2ecf20Sopenharmony_ci__uml_help(ubd_setup, 4098c2ecf20Sopenharmony_ci"ubd<n><flags>=<filename>[(:|,)<filename2>]\n" 4108c2ecf20Sopenharmony_ci" This is used to associate a device with a file in the underlying\n" 4118c2ecf20Sopenharmony_ci" filesystem. When specifying two filenames, the first one is the\n" 4128c2ecf20Sopenharmony_ci" COW name and the second is the backing file name. As separator you can\n" 4138c2ecf20Sopenharmony_ci" use either a ':' or a ',': the first one allows writing things like;\n" 4148c2ecf20Sopenharmony_ci" ubd0=~/Uml/root_cow:~/Uml/root_backing_file\n" 4158c2ecf20Sopenharmony_ci" while with a ',' the shell would not expand the 2nd '~'.\n" 4168c2ecf20Sopenharmony_ci" When using only one filename, UML will detect whether to treat it like\n" 4178c2ecf20Sopenharmony_ci" a COW file or a backing file. To override this detection, add the 'd'\n" 4188c2ecf20Sopenharmony_ci" flag:\n" 4198c2ecf20Sopenharmony_ci" ubd0d=BackingFile\n" 4208c2ecf20Sopenharmony_ci" Usually, there is a filesystem in the file, but \n" 4218c2ecf20Sopenharmony_ci" that's not required. Swap devices containing swap files can be\n" 4228c2ecf20Sopenharmony_ci" specified like this. Also, a file which doesn't contain a\n" 4238c2ecf20Sopenharmony_ci" filesystem can have its contents read in the virtual \n" 4248c2ecf20Sopenharmony_ci" machine by running 'dd' on the device. <n> must be in the range\n" 4258c2ecf20Sopenharmony_ci" 0 to 7. Appending an 'r' to the number will cause that device\n" 4268c2ecf20Sopenharmony_ci" to be mounted read-only. For example ubd1r=./ext_fs. Appending\n" 4278c2ecf20Sopenharmony_ci" an 's' will cause data to be written to disk on the host immediately.\n" 4288c2ecf20Sopenharmony_ci" 'c' will cause the device to be treated as being shared between multiple\n" 4298c2ecf20Sopenharmony_ci" UMLs and file locking will be turned off - this is appropriate for a\n" 4308c2ecf20Sopenharmony_ci" cluster filesystem and inappropriate at almost all other times.\n\n" 4318c2ecf20Sopenharmony_ci" 't' will disable trim/discard support on the device (enabled by default).\n\n" 4328c2ecf20Sopenharmony_ci); 4338c2ecf20Sopenharmony_ci 4348c2ecf20Sopenharmony_cistatic int udb_setup(char *str) 4358c2ecf20Sopenharmony_ci{ 4368c2ecf20Sopenharmony_ci printk("udb%s specified on command line is almost certainly a ubd -> " 4378c2ecf20Sopenharmony_ci "udb TYPO\n", str); 4388c2ecf20Sopenharmony_ci return 1; 4398c2ecf20Sopenharmony_ci} 4408c2ecf20Sopenharmony_ci 4418c2ecf20Sopenharmony_ci__setup("udb", udb_setup); 4428c2ecf20Sopenharmony_ci__uml_help(udb_setup, 4438c2ecf20Sopenharmony_ci"udb\n" 4448c2ecf20Sopenharmony_ci" This option is here solely to catch ubd -> udb typos, which can be\n" 4458c2ecf20Sopenharmony_ci" to impossible to catch visually unless you specifically look for\n" 4468c2ecf20Sopenharmony_ci" them. The only result of any option starting with 'udb' is an error\n" 4478c2ecf20Sopenharmony_ci" in the boot output.\n\n" 4488c2ecf20Sopenharmony_ci); 4498c2ecf20Sopenharmony_ci 4508c2ecf20Sopenharmony_ci/* Only changed by ubd_init, which is an initcall. */ 4518c2ecf20Sopenharmony_cistatic int thread_fd = -1; 4528c2ecf20Sopenharmony_ci 4538c2ecf20Sopenharmony_ci/* Function to read several request pointers at a time 4548c2ecf20Sopenharmony_ci* handling fractional reads if (and as) needed 4558c2ecf20Sopenharmony_ci*/ 4568c2ecf20Sopenharmony_ci 4578c2ecf20Sopenharmony_cistatic int bulk_req_safe_read( 4588c2ecf20Sopenharmony_ci int fd, 4598c2ecf20Sopenharmony_ci struct io_thread_req * (*request_buffer)[], 4608c2ecf20Sopenharmony_ci struct io_thread_req **remainder, 4618c2ecf20Sopenharmony_ci int *remainder_size, 4628c2ecf20Sopenharmony_ci int max_recs 4638c2ecf20Sopenharmony_ci ) 4648c2ecf20Sopenharmony_ci{ 4658c2ecf20Sopenharmony_ci int n = 0; 4668c2ecf20Sopenharmony_ci int res = 0; 4678c2ecf20Sopenharmony_ci 4688c2ecf20Sopenharmony_ci if (*remainder_size > 0) { 4698c2ecf20Sopenharmony_ci memmove( 4708c2ecf20Sopenharmony_ci (char *) request_buffer, 4718c2ecf20Sopenharmony_ci (char *) remainder, *remainder_size 4728c2ecf20Sopenharmony_ci ); 4738c2ecf20Sopenharmony_ci n = *remainder_size; 4748c2ecf20Sopenharmony_ci } 4758c2ecf20Sopenharmony_ci 4768c2ecf20Sopenharmony_ci res = os_read_file( 4778c2ecf20Sopenharmony_ci fd, 4788c2ecf20Sopenharmony_ci ((char *) request_buffer) + *remainder_size, 4798c2ecf20Sopenharmony_ci sizeof(struct io_thread_req *)*max_recs 4808c2ecf20Sopenharmony_ci - *remainder_size 4818c2ecf20Sopenharmony_ci ); 4828c2ecf20Sopenharmony_ci if (res > 0) { 4838c2ecf20Sopenharmony_ci n += res; 4848c2ecf20Sopenharmony_ci if ((n % sizeof(struct io_thread_req *)) > 0) { 4858c2ecf20Sopenharmony_ci /* 4868c2ecf20Sopenharmony_ci * Read somehow returned not a multiple of dword 4878c2ecf20Sopenharmony_ci * theoretically possible, but never observed in the 4888c2ecf20Sopenharmony_ci * wild, so read routine must be able to handle it 4898c2ecf20Sopenharmony_ci */ 4908c2ecf20Sopenharmony_ci *remainder_size = n % sizeof(struct io_thread_req *); 4918c2ecf20Sopenharmony_ci WARN(*remainder_size > 0, "UBD IPC read returned a partial result"); 4928c2ecf20Sopenharmony_ci memmove( 4938c2ecf20Sopenharmony_ci remainder, 4948c2ecf20Sopenharmony_ci ((char *) request_buffer) + 4958c2ecf20Sopenharmony_ci (n/sizeof(struct io_thread_req *))*sizeof(struct io_thread_req *), 4968c2ecf20Sopenharmony_ci *remainder_size 4978c2ecf20Sopenharmony_ci ); 4988c2ecf20Sopenharmony_ci n = n - *remainder_size; 4998c2ecf20Sopenharmony_ci } 5008c2ecf20Sopenharmony_ci } else { 5018c2ecf20Sopenharmony_ci n = res; 5028c2ecf20Sopenharmony_ci } 5038c2ecf20Sopenharmony_ci return n; 5048c2ecf20Sopenharmony_ci} 5058c2ecf20Sopenharmony_ci 5068c2ecf20Sopenharmony_ci/* Called without dev->lock held, and only in interrupt context. */ 5078c2ecf20Sopenharmony_cistatic void ubd_handler(void) 5088c2ecf20Sopenharmony_ci{ 5098c2ecf20Sopenharmony_ci int n; 5108c2ecf20Sopenharmony_ci int count; 5118c2ecf20Sopenharmony_ci 5128c2ecf20Sopenharmony_ci while(1){ 5138c2ecf20Sopenharmony_ci n = bulk_req_safe_read( 5148c2ecf20Sopenharmony_ci thread_fd, 5158c2ecf20Sopenharmony_ci irq_req_buffer, 5168c2ecf20Sopenharmony_ci &irq_remainder, 5178c2ecf20Sopenharmony_ci &irq_remainder_size, 5188c2ecf20Sopenharmony_ci UBD_REQ_BUFFER_SIZE 5198c2ecf20Sopenharmony_ci ); 5208c2ecf20Sopenharmony_ci if (n < 0) { 5218c2ecf20Sopenharmony_ci if(n == -EAGAIN) 5228c2ecf20Sopenharmony_ci break; 5238c2ecf20Sopenharmony_ci printk(KERN_ERR "spurious interrupt in ubd_handler, " 5248c2ecf20Sopenharmony_ci "err = %d\n", -n); 5258c2ecf20Sopenharmony_ci return; 5268c2ecf20Sopenharmony_ci } 5278c2ecf20Sopenharmony_ci for (count = 0; count < n/sizeof(struct io_thread_req *); count++) { 5288c2ecf20Sopenharmony_ci struct io_thread_req *io_req = (*irq_req_buffer)[count]; 5298c2ecf20Sopenharmony_ci 5308c2ecf20Sopenharmony_ci if ((io_req->error == BLK_STS_NOTSUPP) && (req_op(io_req->req) == REQ_OP_DISCARD)) { 5318c2ecf20Sopenharmony_ci blk_queue_max_discard_sectors(io_req->req->q, 0); 5328c2ecf20Sopenharmony_ci blk_queue_max_write_zeroes_sectors(io_req->req->q, 0); 5338c2ecf20Sopenharmony_ci blk_queue_flag_clear(QUEUE_FLAG_DISCARD, io_req->req->q); 5348c2ecf20Sopenharmony_ci } 5358c2ecf20Sopenharmony_ci blk_mq_end_request(io_req->req, io_req->error); 5368c2ecf20Sopenharmony_ci kfree(io_req); 5378c2ecf20Sopenharmony_ci } 5388c2ecf20Sopenharmony_ci } 5398c2ecf20Sopenharmony_ci} 5408c2ecf20Sopenharmony_ci 5418c2ecf20Sopenharmony_cistatic irqreturn_t ubd_intr(int irq, void *dev) 5428c2ecf20Sopenharmony_ci{ 5438c2ecf20Sopenharmony_ci ubd_handler(); 5448c2ecf20Sopenharmony_ci return IRQ_HANDLED; 5458c2ecf20Sopenharmony_ci} 5468c2ecf20Sopenharmony_ci 5478c2ecf20Sopenharmony_ci/* Only changed by ubd_init, which is an initcall. */ 5488c2ecf20Sopenharmony_cistatic int io_pid = -1; 5498c2ecf20Sopenharmony_ci 5508c2ecf20Sopenharmony_cistatic void kill_io_thread(void) 5518c2ecf20Sopenharmony_ci{ 5528c2ecf20Sopenharmony_ci if(io_pid != -1) 5538c2ecf20Sopenharmony_ci os_kill_process(io_pid, 1); 5548c2ecf20Sopenharmony_ci} 5558c2ecf20Sopenharmony_ci 5568c2ecf20Sopenharmony_ci__uml_exitcall(kill_io_thread); 5578c2ecf20Sopenharmony_ci 5588c2ecf20Sopenharmony_cistatic inline int ubd_file_size(struct ubd *ubd_dev, __u64 *size_out) 5598c2ecf20Sopenharmony_ci{ 5608c2ecf20Sopenharmony_ci char *file; 5618c2ecf20Sopenharmony_ci int fd; 5628c2ecf20Sopenharmony_ci int err; 5638c2ecf20Sopenharmony_ci 5648c2ecf20Sopenharmony_ci __u32 version; 5658c2ecf20Sopenharmony_ci __u32 align; 5668c2ecf20Sopenharmony_ci char *backing_file; 5678c2ecf20Sopenharmony_ci time64_t mtime; 5688c2ecf20Sopenharmony_ci unsigned long long size; 5698c2ecf20Sopenharmony_ci int sector_size; 5708c2ecf20Sopenharmony_ci int bitmap_offset; 5718c2ecf20Sopenharmony_ci 5728c2ecf20Sopenharmony_ci if (ubd_dev->file && ubd_dev->cow.file) { 5738c2ecf20Sopenharmony_ci file = ubd_dev->cow.file; 5748c2ecf20Sopenharmony_ci 5758c2ecf20Sopenharmony_ci goto out; 5768c2ecf20Sopenharmony_ci } 5778c2ecf20Sopenharmony_ci 5788c2ecf20Sopenharmony_ci fd = os_open_file(ubd_dev->file, of_read(OPENFLAGS()), 0); 5798c2ecf20Sopenharmony_ci if (fd < 0) 5808c2ecf20Sopenharmony_ci return fd; 5818c2ecf20Sopenharmony_ci 5828c2ecf20Sopenharmony_ci err = read_cow_header(file_reader, &fd, &version, &backing_file, \ 5838c2ecf20Sopenharmony_ci &mtime, &size, §or_size, &align, &bitmap_offset); 5848c2ecf20Sopenharmony_ci os_close_file(fd); 5858c2ecf20Sopenharmony_ci 5868c2ecf20Sopenharmony_ci if(err == -EINVAL) 5878c2ecf20Sopenharmony_ci file = ubd_dev->file; 5888c2ecf20Sopenharmony_ci else 5898c2ecf20Sopenharmony_ci file = backing_file; 5908c2ecf20Sopenharmony_ci 5918c2ecf20Sopenharmony_ciout: 5928c2ecf20Sopenharmony_ci return os_file_size(file, size_out); 5938c2ecf20Sopenharmony_ci} 5948c2ecf20Sopenharmony_ci 5958c2ecf20Sopenharmony_cistatic int read_cow_bitmap(int fd, void *buf, int offset, int len) 5968c2ecf20Sopenharmony_ci{ 5978c2ecf20Sopenharmony_ci int err; 5988c2ecf20Sopenharmony_ci 5998c2ecf20Sopenharmony_ci err = os_pread_file(fd, buf, len, offset); 6008c2ecf20Sopenharmony_ci if (err < 0) 6018c2ecf20Sopenharmony_ci return err; 6028c2ecf20Sopenharmony_ci 6038c2ecf20Sopenharmony_ci return 0; 6048c2ecf20Sopenharmony_ci} 6058c2ecf20Sopenharmony_ci 6068c2ecf20Sopenharmony_cistatic int backing_file_mismatch(char *file, __u64 size, time64_t mtime) 6078c2ecf20Sopenharmony_ci{ 6088c2ecf20Sopenharmony_ci time64_t modtime; 6098c2ecf20Sopenharmony_ci unsigned long long actual; 6108c2ecf20Sopenharmony_ci int err; 6118c2ecf20Sopenharmony_ci 6128c2ecf20Sopenharmony_ci err = os_file_modtime(file, &modtime); 6138c2ecf20Sopenharmony_ci if (err < 0) { 6148c2ecf20Sopenharmony_ci printk(KERN_ERR "Failed to get modification time of backing " 6158c2ecf20Sopenharmony_ci "file \"%s\", err = %d\n", file, -err); 6168c2ecf20Sopenharmony_ci return err; 6178c2ecf20Sopenharmony_ci } 6188c2ecf20Sopenharmony_ci 6198c2ecf20Sopenharmony_ci err = os_file_size(file, &actual); 6208c2ecf20Sopenharmony_ci if (err < 0) { 6218c2ecf20Sopenharmony_ci printk(KERN_ERR "Failed to get size of backing file \"%s\", " 6228c2ecf20Sopenharmony_ci "err = %d\n", file, -err); 6238c2ecf20Sopenharmony_ci return err; 6248c2ecf20Sopenharmony_ci } 6258c2ecf20Sopenharmony_ci 6268c2ecf20Sopenharmony_ci if (actual != size) { 6278c2ecf20Sopenharmony_ci /*__u64 can be a long on AMD64 and with %lu GCC complains; so 6288c2ecf20Sopenharmony_ci * the typecast.*/ 6298c2ecf20Sopenharmony_ci printk(KERN_ERR "Size mismatch (%llu vs %llu) of COW header " 6308c2ecf20Sopenharmony_ci "vs backing file\n", (unsigned long long) size, actual); 6318c2ecf20Sopenharmony_ci return -EINVAL; 6328c2ecf20Sopenharmony_ci } 6338c2ecf20Sopenharmony_ci if (modtime != mtime) { 6348c2ecf20Sopenharmony_ci printk(KERN_ERR "mtime mismatch (%lld vs %lld) of COW header vs " 6358c2ecf20Sopenharmony_ci "backing file\n", mtime, modtime); 6368c2ecf20Sopenharmony_ci return -EINVAL; 6378c2ecf20Sopenharmony_ci } 6388c2ecf20Sopenharmony_ci return 0; 6398c2ecf20Sopenharmony_ci} 6408c2ecf20Sopenharmony_ci 6418c2ecf20Sopenharmony_cistatic int path_requires_switch(char *from_cmdline, char *from_cow, char *cow) 6428c2ecf20Sopenharmony_ci{ 6438c2ecf20Sopenharmony_ci struct uml_stat buf1, buf2; 6448c2ecf20Sopenharmony_ci int err; 6458c2ecf20Sopenharmony_ci 6468c2ecf20Sopenharmony_ci if (from_cmdline == NULL) 6478c2ecf20Sopenharmony_ci return 0; 6488c2ecf20Sopenharmony_ci if (!strcmp(from_cmdline, from_cow)) 6498c2ecf20Sopenharmony_ci return 0; 6508c2ecf20Sopenharmony_ci 6518c2ecf20Sopenharmony_ci err = os_stat_file(from_cmdline, &buf1); 6528c2ecf20Sopenharmony_ci if (err < 0) { 6538c2ecf20Sopenharmony_ci printk(KERN_ERR "Couldn't stat '%s', err = %d\n", from_cmdline, 6548c2ecf20Sopenharmony_ci -err); 6558c2ecf20Sopenharmony_ci return 0; 6568c2ecf20Sopenharmony_ci } 6578c2ecf20Sopenharmony_ci err = os_stat_file(from_cow, &buf2); 6588c2ecf20Sopenharmony_ci if (err < 0) { 6598c2ecf20Sopenharmony_ci printk(KERN_ERR "Couldn't stat '%s', err = %d\n", from_cow, 6608c2ecf20Sopenharmony_ci -err); 6618c2ecf20Sopenharmony_ci return 1; 6628c2ecf20Sopenharmony_ci } 6638c2ecf20Sopenharmony_ci if ((buf1.ust_dev == buf2.ust_dev) && (buf1.ust_ino == buf2.ust_ino)) 6648c2ecf20Sopenharmony_ci return 0; 6658c2ecf20Sopenharmony_ci 6668c2ecf20Sopenharmony_ci printk(KERN_ERR "Backing file mismatch - \"%s\" requested, " 6678c2ecf20Sopenharmony_ci "\"%s\" specified in COW header of \"%s\"\n", 6688c2ecf20Sopenharmony_ci from_cmdline, from_cow, cow); 6698c2ecf20Sopenharmony_ci return 1; 6708c2ecf20Sopenharmony_ci} 6718c2ecf20Sopenharmony_ci 6728c2ecf20Sopenharmony_cistatic int open_ubd_file(char *file, struct openflags *openflags, int shared, 6738c2ecf20Sopenharmony_ci char **backing_file_out, int *bitmap_offset_out, 6748c2ecf20Sopenharmony_ci unsigned long *bitmap_len_out, int *data_offset_out, 6758c2ecf20Sopenharmony_ci int *create_cow_out) 6768c2ecf20Sopenharmony_ci{ 6778c2ecf20Sopenharmony_ci time64_t mtime; 6788c2ecf20Sopenharmony_ci unsigned long long size; 6798c2ecf20Sopenharmony_ci __u32 version, align; 6808c2ecf20Sopenharmony_ci char *backing_file; 6818c2ecf20Sopenharmony_ci int fd, err, sectorsize, asked_switch, mode = 0644; 6828c2ecf20Sopenharmony_ci 6838c2ecf20Sopenharmony_ci fd = os_open_file(file, *openflags, mode); 6848c2ecf20Sopenharmony_ci if (fd < 0) { 6858c2ecf20Sopenharmony_ci if ((fd == -ENOENT) && (create_cow_out != NULL)) 6868c2ecf20Sopenharmony_ci *create_cow_out = 1; 6878c2ecf20Sopenharmony_ci if (!openflags->w || 6888c2ecf20Sopenharmony_ci ((fd != -EROFS) && (fd != -EACCES))) 6898c2ecf20Sopenharmony_ci return fd; 6908c2ecf20Sopenharmony_ci openflags->w = 0; 6918c2ecf20Sopenharmony_ci fd = os_open_file(file, *openflags, mode); 6928c2ecf20Sopenharmony_ci if (fd < 0) 6938c2ecf20Sopenharmony_ci return fd; 6948c2ecf20Sopenharmony_ci } 6958c2ecf20Sopenharmony_ci 6968c2ecf20Sopenharmony_ci if (shared) 6978c2ecf20Sopenharmony_ci printk(KERN_INFO "Not locking \"%s\" on the host\n", file); 6988c2ecf20Sopenharmony_ci else { 6998c2ecf20Sopenharmony_ci err = os_lock_file(fd, openflags->w); 7008c2ecf20Sopenharmony_ci if (err < 0) { 7018c2ecf20Sopenharmony_ci printk(KERN_ERR "Failed to lock '%s', err = %d\n", 7028c2ecf20Sopenharmony_ci file, -err); 7038c2ecf20Sopenharmony_ci goto out_close; 7048c2ecf20Sopenharmony_ci } 7058c2ecf20Sopenharmony_ci } 7068c2ecf20Sopenharmony_ci 7078c2ecf20Sopenharmony_ci /* Successful return case! */ 7088c2ecf20Sopenharmony_ci if (backing_file_out == NULL) 7098c2ecf20Sopenharmony_ci return fd; 7108c2ecf20Sopenharmony_ci 7118c2ecf20Sopenharmony_ci err = read_cow_header(file_reader, &fd, &version, &backing_file, &mtime, 7128c2ecf20Sopenharmony_ci &size, §orsize, &align, bitmap_offset_out); 7138c2ecf20Sopenharmony_ci if (err && (*backing_file_out != NULL)) { 7148c2ecf20Sopenharmony_ci printk(KERN_ERR "Failed to read COW header from COW file " 7158c2ecf20Sopenharmony_ci "\"%s\", errno = %d\n", file, -err); 7168c2ecf20Sopenharmony_ci goto out_close; 7178c2ecf20Sopenharmony_ci } 7188c2ecf20Sopenharmony_ci if (err) 7198c2ecf20Sopenharmony_ci return fd; 7208c2ecf20Sopenharmony_ci 7218c2ecf20Sopenharmony_ci asked_switch = path_requires_switch(*backing_file_out, backing_file, 7228c2ecf20Sopenharmony_ci file); 7238c2ecf20Sopenharmony_ci 7248c2ecf20Sopenharmony_ci /* Allow switching only if no mismatch. */ 7258c2ecf20Sopenharmony_ci if (asked_switch && !backing_file_mismatch(*backing_file_out, size, 7268c2ecf20Sopenharmony_ci mtime)) { 7278c2ecf20Sopenharmony_ci printk(KERN_ERR "Switching backing file to '%s'\n", 7288c2ecf20Sopenharmony_ci *backing_file_out); 7298c2ecf20Sopenharmony_ci err = write_cow_header(file, fd, *backing_file_out, 7308c2ecf20Sopenharmony_ci sectorsize, align, &size); 7318c2ecf20Sopenharmony_ci if (err) { 7328c2ecf20Sopenharmony_ci printk(KERN_ERR "Switch failed, errno = %d\n", -err); 7338c2ecf20Sopenharmony_ci goto out_close; 7348c2ecf20Sopenharmony_ci } 7358c2ecf20Sopenharmony_ci } else { 7368c2ecf20Sopenharmony_ci *backing_file_out = backing_file; 7378c2ecf20Sopenharmony_ci err = backing_file_mismatch(*backing_file_out, size, mtime); 7388c2ecf20Sopenharmony_ci if (err) 7398c2ecf20Sopenharmony_ci goto out_close; 7408c2ecf20Sopenharmony_ci } 7418c2ecf20Sopenharmony_ci 7428c2ecf20Sopenharmony_ci cow_sizes(version, size, sectorsize, align, *bitmap_offset_out, 7438c2ecf20Sopenharmony_ci bitmap_len_out, data_offset_out); 7448c2ecf20Sopenharmony_ci 7458c2ecf20Sopenharmony_ci return fd; 7468c2ecf20Sopenharmony_ci out_close: 7478c2ecf20Sopenharmony_ci os_close_file(fd); 7488c2ecf20Sopenharmony_ci return err; 7498c2ecf20Sopenharmony_ci} 7508c2ecf20Sopenharmony_ci 7518c2ecf20Sopenharmony_cistatic int create_cow_file(char *cow_file, char *backing_file, 7528c2ecf20Sopenharmony_ci struct openflags flags, 7538c2ecf20Sopenharmony_ci int sectorsize, int alignment, int *bitmap_offset_out, 7548c2ecf20Sopenharmony_ci unsigned long *bitmap_len_out, int *data_offset_out) 7558c2ecf20Sopenharmony_ci{ 7568c2ecf20Sopenharmony_ci int err, fd; 7578c2ecf20Sopenharmony_ci 7588c2ecf20Sopenharmony_ci flags.c = 1; 7598c2ecf20Sopenharmony_ci fd = open_ubd_file(cow_file, &flags, 0, NULL, NULL, NULL, NULL, NULL); 7608c2ecf20Sopenharmony_ci if (fd < 0) { 7618c2ecf20Sopenharmony_ci err = fd; 7628c2ecf20Sopenharmony_ci printk(KERN_ERR "Open of COW file '%s' failed, errno = %d\n", 7638c2ecf20Sopenharmony_ci cow_file, -err); 7648c2ecf20Sopenharmony_ci goto out; 7658c2ecf20Sopenharmony_ci } 7668c2ecf20Sopenharmony_ci 7678c2ecf20Sopenharmony_ci err = init_cow_file(fd, cow_file, backing_file, sectorsize, alignment, 7688c2ecf20Sopenharmony_ci bitmap_offset_out, bitmap_len_out, 7698c2ecf20Sopenharmony_ci data_offset_out); 7708c2ecf20Sopenharmony_ci if (!err) 7718c2ecf20Sopenharmony_ci return fd; 7728c2ecf20Sopenharmony_ci os_close_file(fd); 7738c2ecf20Sopenharmony_ci out: 7748c2ecf20Sopenharmony_ci return err; 7758c2ecf20Sopenharmony_ci} 7768c2ecf20Sopenharmony_ci 7778c2ecf20Sopenharmony_cistatic void ubd_close_dev(struct ubd *ubd_dev) 7788c2ecf20Sopenharmony_ci{ 7798c2ecf20Sopenharmony_ci os_close_file(ubd_dev->fd); 7808c2ecf20Sopenharmony_ci if(ubd_dev->cow.file == NULL) 7818c2ecf20Sopenharmony_ci return; 7828c2ecf20Sopenharmony_ci 7838c2ecf20Sopenharmony_ci os_close_file(ubd_dev->cow.fd); 7848c2ecf20Sopenharmony_ci vfree(ubd_dev->cow.bitmap); 7858c2ecf20Sopenharmony_ci ubd_dev->cow.bitmap = NULL; 7868c2ecf20Sopenharmony_ci} 7878c2ecf20Sopenharmony_ci 7888c2ecf20Sopenharmony_cistatic int ubd_open_dev(struct ubd *ubd_dev) 7898c2ecf20Sopenharmony_ci{ 7908c2ecf20Sopenharmony_ci struct openflags flags; 7918c2ecf20Sopenharmony_ci char **back_ptr; 7928c2ecf20Sopenharmony_ci int err, create_cow, *create_ptr; 7938c2ecf20Sopenharmony_ci int fd; 7948c2ecf20Sopenharmony_ci 7958c2ecf20Sopenharmony_ci ubd_dev->openflags = ubd_dev->boot_openflags; 7968c2ecf20Sopenharmony_ci create_cow = 0; 7978c2ecf20Sopenharmony_ci create_ptr = (ubd_dev->cow.file != NULL) ? &create_cow : NULL; 7988c2ecf20Sopenharmony_ci back_ptr = ubd_dev->no_cow ? NULL : &ubd_dev->cow.file; 7998c2ecf20Sopenharmony_ci 8008c2ecf20Sopenharmony_ci fd = open_ubd_file(ubd_dev->file, &ubd_dev->openflags, ubd_dev->shared, 8018c2ecf20Sopenharmony_ci back_ptr, &ubd_dev->cow.bitmap_offset, 8028c2ecf20Sopenharmony_ci &ubd_dev->cow.bitmap_len, &ubd_dev->cow.data_offset, 8038c2ecf20Sopenharmony_ci create_ptr); 8048c2ecf20Sopenharmony_ci 8058c2ecf20Sopenharmony_ci if((fd == -ENOENT) && create_cow){ 8068c2ecf20Sopenharmony_ci fd = create_cow_file(ubd_dev->file, ubd_dev->cow.file, 8078c2ecf20Sopenharmony_ci ubd_dev->openflags, SECTOR_SIZE, PAGE_SIZE, 8088c2ecf20Sopenharmony_ci &ubd_dev->cow.bitmap_offset, 8098c2ecf20Sopenharmony_ci &ubd_dev->cow.bitmap_len, 8108c2ecf20Sopenharmony_ci &ubd_dev->cow.data_offset); 8118c2ecf20Sopenharmony_ci if(fd >= 0){ 8128c2ecf20Sopenharmony_ci printk(KERN_INFO "Creating \"%s\" as COW file for " 8138c2ecf20Sopenharmony_ci "\"%s\"\n", ubd_dev->file, ubd_dev->cow.file); 8148c2ecf20Sopenharmony_ci } 8158c2ecf20Sopenharmony_ci } 8168c2ecf20Sopenharmony_ci 8178c2ecf20Sopenharmony_ci if(fd < 0){ 8188c2ecf20Sopenharmony_ci printk("Failed to open '%s', errno = %d\n", ubd_dev->file, 8198c2ecf20Sopenharmony_ci -fd); 8208c2ecf20Sopenharmony_ci return fd; 8218c2ecf20Sopenharmony_ci } 8228c2ecf20Sopenharmony_ci ubd_dev->fd = fd; 8238c2ecf20Sopenharmony_ci 8248c2ecf20Sopenharmony_ci if(ubd_dev->cow.file != NULL){ 8258c2ecf20Sopenharmony_ci blk_queue_max_hw_sectors(ubd_dev->queue, 8 * sizeof(long)); 8268c2ecf20Sopenharmony_ci 8278c2ecf20Sopenharmony_ci err = -ENOMEM; 8288c2ecf20Sopenharmony_ci ubd_dev->cow.bitmap = vmalloc(ubd_dev->cow.bitmap_len); 8298c2ecf20Sopenharmony_ci if(ubd_dev->cow.bitmap == NULL){ 8308c2ecf20Sopenharmony_ci printk(KERN_ERR "Failed to vmalloc COW bitmap\n"); 8318c2ecf20Sopenharmony_ci goto error; 8328c2ecf20Sopenharmony_ci } 8338c2ecf20Sopenharmony_ci flush_tlb_kernel_vm(); 8348c2ecf20Sopenharmony_ci 8358c2ecf20Sopenharmony_ci err = read_cow_bitmap(ubd_dev->fd, ubd_dev->cow.bitmap, 8368c2ecf20Sopenharmony_ci ubd_dev->cow.bitmap_offset, 8378c2ecf20Sopenharmony_ci ubd_dev->cow.bitmap_len); 8388c2ecf20Sopenharmony_ci if(err < 0) 8398c2ecf20Sopenharmony_ci goto error; 8408c2ecf20Sopenharmony_ci 8418c2ecf20Sopenharmony_ci flags = ubd_dev->openflags; 8428c2ecf20Sopenharmony_ci flags.w = 0; 8438c2ecf20Sopenharmony_ci err = open_ubd_file(ubd_dev->cow.file, &flags, ubd_dev->shared, NULL, 8448c2ecf20Sopenharmony_ci NULL, NULL, NULL, NULL); 8458c2ecf20Sopenharmony_ci if(err < 0) goto error; 8468c2ecf20Sopenharmony_ci ubd_dev->cow.fd = err; 8478c2ecf20Sopenharmony_ci } 8488c2ecf20Sopenharmony_ci if (ubd_dev->no_trim == 0) { 8498c2ecf20Sopenharmony_ci ubd_dev->queue->limits.discard_granularity = SECTOR_SIZE; 8508c2ecf20Sopenharmony_ci ubd_dev->queue->limits.discard_alignment = SECTOR_SIZE; 8518c2ecf20Sopenharmony_ci blk_queue_max_discard_sectors(ubd_dev->queue, UBD_MAX_REQUEST); 8528c2ecf20Sopenharmony_ci blk_queue_max_write_zeroes_sectors(ubd_dev->queue, UBD_MAX_REQUEST); 8538c2ecf20Sopenharmony_ci blk_queue_flag_set(QUEUE_FLAG_DISCARD, ubd_dev->queue); 8548c2ecf20Sopenharmony_ci } 8558c2ecf20Sopenharmony_ci blk_queue_flag_set(QUEUE_FLAG_NONROT, ubd_dev->queue); 8568c2ecf20Sopenharmony_ci return 0; 8578c2ecf20Sopenharmony_ci error: 8588c2ecf20Sopenharmony_ci os_close_file(ubd_dev->fd); 8598c2ecf20Sopenharmony_ci return err; 8608c2ecf20Sopenharmony_ci} 8618c2ecf20Sopenharmony_ci 8628c2ecf20Sopenharmony_cistatic void ubd_device_release(struct device *dev) 8638c2ecf20Sopenharmony_ci{ 8648c2ecf20Sopenharmony_ci struct ubd *ubd_dev = dev_get_drvdata(dev); 8658c2ecf20Sopenharmony_ci 8668c2ecf20Sopenharmony_ci blk_cleanup_queue(ubd_dev->queue); 8678c2ecf20Sopenharmony_ci blk_mq_free_tag_set(&ubd_dev->tag_set); 8688c2ecf20Sopenharmony_ci *ubd_dev = ((struct ubd) DEFAULT_UBD); 8698c2ecf20Sopenharmony_ci} 8708c2ecf20Sopenharmony_ci 8718c2ecf20Sopenharmony_cistatic int ubd_disk_register(int major, u64 size, int unit, 8728c2ecf20Sopenharmony_ci struct gendisk **disk_out) 8738c2ecf20Sopenharmony_ci{ 8748c2ecf20Sopenharmony_ci struct device *parent = NULL; 8758c2ecf20Sopenharmony_ci struct gendisk *disk; 8768c2ecf20Sopenharmony_ci 8778c2ecf20Sopenharmony_ci disk = alloc_disk(1 << UBD_SHIFT); 8788c2ecf20Sopenharmony_ci if(disk == NULL) 8798c2ecf20Sopenharmony_ci return -ENOMEM; 8808c2ecf20Sopenharmony_ci 8818c2ecf20Sopenharmony_ci disk->major = major; 8828c2ecf20Sopenharmony_ci disk->first_minor = unit << UBD_SHIFT; 8838c2ecf20Sopenharmony_ci disk->fops = &ubd_blops; 8848c2ecf20Sopenharmony_ci set_capacity(disk, size / 512); 8858c2ecf20Sopenharmony_ci if (major == UBD_MAJOR) 8868c2ecf20Sopenharmony_ci sprintf(disk->disk_name, "ubd%c", 'a' + unit); 8878c2ecf20Sopenharmony_ci else 8888c2ecf20Sopenharmony_ci sprintf(disk->disk_name, "ubd_fake%d", unit); 8898c2ecf20Sopenharmony_ci 8908c2ecf20Sopenharmony_ci /* sysfs register (not for ide fake devices) */ 8918c2ecf20Sopenharmony_ci if (major == UBD_MAJOR) { 8928c2ecf20Sopenharmony_ci ubd_devs[unit].pdev.id = unit; 8938c2ecf20Sopenharmony_ci ubd_devs[unit].pdev.name = DRIVER_NAME; 8948c2ecf20Sopenharmony_ci ubd_devs[unit].pdev.dev.release = ubd_device_release; 8958c2ecf20Sopenharmony_ci dev_set_drvdata(&ubd_devs[unit].pdev.dev, &ubd_devs[unit]); 8968c2ecf20Sopenharmony_ci platform_device_register(&ubd_devs[unit].pdev); 8978c2ecf20Sopenharmony_ci parent = &ubd_devs[unit].pdev.dev; 8988c2ecf20Sopenharmony_ci } 8998c2ecf20Sopenharmony_ci 9008c2ecf20Sopenharmony_ci disk->private_data = &ubd_devs[unit]; 9018c2ecf20Sopenharmony_ci disk->queue = ubd_devs[unit].queue; 9028c2ecf20Sopenharmony_ci device_add_disk(parent, disk, NULL); 9038c2ecf20Sopenharmony_ci 9048c2ecf20Sopenharmony_ci *disk_out = disk; 9058c2ecf20Sopenharmony_ci return 0; 9068c2ecf20Sopenharmony_ci} 9078c2ecf20Sopenharmony_ci 9088c2ecf20Sopenharmony_ci#define ROUND_BLOCK(n) ((n + (SECTOR_SIZE - 1)) & (-SECTOR_SIZE)) 9098c2ecf20Sopenharmony_ci 9108c2ecf20Sopenharmony_cistatic const struct blk_mq_ops ubd_mq_ops = { 9118c2ecf20Sopenharmony_ci .queue_rq = ubd_queue_rq, 9128c2ecf20Sopenharmony_ci}; 9138c2ecf20Sopenharmony_ci 9148c2ecf20Sopenharmony_cistatic int ubd_add(int n, char **error_out) 9158c2ecf20Sopenharmony_ci{ 9168c2ecf20Sopenharmony_ci struct ubd *ubd_dev = &ubd_devs[n]; 9178c2ecf20Sopenharmony_ci int err = 0; 9188c2ecf20Sopenharmony_ci 9198c2ecf20Sopenharmony_ci if(ubd_dev->file == NULL) 9208c2ecf20Sopenharmony_ci goto out; 9218c2ecf20Sopenharmony_ci 9228c2ecf20Sopenharmony_ci err = ubd_file_size(ubd_dev, &ubd_dev->size); 9238c2ecf20Sopenharmony_ci if(err < 0){ 9248c2ecf20Sopenharmony_ci *error_out = "Couldn't determine size of device's file"; 9258c2ecf20Sopenharmony_ci goto out; 9268c2ecf20Sopenharmony_ci } 9278c2ecf20Sopenharmony_ci 9288c2ecf20Sopenharmony_ci ubd_dev->size = ROUND_BLOCK(ubd_dev->size); 9298c2ecf20Sopenharmony_ci 9308c2ecf20Sopenharmony_ci ubd_dev->tag_set.ops = &ubd_mq_ops; 9318c2ecf20Sopenharmony_ci ubd_dev->tag_set.queue_depth = 64; 9328c2ecf20Sopenharmony_ci ubd_dev->tag_set.numa_node = NUMA_NO_NODE; 9338c2ecf20Sopenharmony_ci ubd_dev->tag_set.flags = BLK_MQ_F_SHOULD_MERGE; 9348c2ecf20Sopenharmony_ci ubd_dev->tag_set.driver_data = ubd_dev; 9358c2ecf20Sopenharmony_ci ubd_dev->tag_set.nr_hw_queues = 1; 9368c2ecf20Sopenharmony_ci 9378c2ecf20Sopenharmony_ci err = blk_mq_alloc_tag_set(&ubd_dev->tag_set); 9388c2ecf20Sopenharmony_ci if (err) 9398c2ecf20Sopenharmony_ci goto out; 9408c2ecf20Sopenharmony_ci 9418c2ecf20Sopenharmony_ci ubd_dev->queue = blk_mq_init_queue(&ubd_dev->tag_set); 9428c2ecf20Sopenharmony_ci if (IS_ERR(ubd_dev->queue)) { 9438c2ecf20Sopenharmony_ci err = PTR_ERR(ubd_dev->queue); 9448c2ecf20Sopenharmony_ci goto out_cleanup_tags; 9458c2ecf20Sopenharmony_ci } 9468c2ecf20Sopenharmony_ci 9478c2ecf20Sopenharmony_ci ubd_dev->queue->queuedata = ubd_dev; 9488c2ecf20Sopenharmony_ci blk_queue_write_cache(ubd_dev->queue, true, false); 9498c2ecf20Sopenharmony_ci 9508c2ecf20Sopenharmony_ci blk_queue_max_segments(ubd_dev->queue, MAX_SG); 9518c2ecf20Sopenharmony_ci blk_queue_segment_boundary(ubd_dev->queue, PAGE_SIZE - 1); 9528c2ecf20Sopenharmony_ci err = ubd_disk_register(UBD_MAJOR, ubd_dev->size, n, &ubd_gendisk[n]); 9538c2ecf20Sopenharmony_ci if(err){ 9548c2ecf20Sopenharmony_ci *error_out = "Failed to register device"; 9558c2ecf20Sopenharmony_ci goto out_cleanup_tags; 9568c2ecf20Sopenharmony_ci } 9578c2ecf20Sopenharmony_ci 9588c2ecf20Sopenharmony_ci if (fake_major != UBD_MAJOR) 9598c2ecf20Sopenharmony_ci ubd_disk_register(fake_major, ubd_dev->size, n, 9608c2ecf20Sopenharmony_ci &fake_gendisk[n]); 9618c2ecf20Sopenharmony_ci 9628c2ecf20Sopenharmony_ci /* 9638c2ecf20Sopenharmony_ci * Perhaps this should also be under the "if (fake_major)" above 9648c2ecf20Sopenharmony_ci * using the fake_disk->disk_name 9658c2ecf20Sopenharmony_ci */ 9668c2ecf20Sopenharmony_ci if (fake_ide) 9678c2ecf20Sopenharmony_ci make_ide_entries(ubd_gendisk[n]->disk_name); 9688c2ecf20Sopenharmony_ci 9698c2ecf20Sopenharmony_ci err = 0; 9708c2ecf20Sopenharmony_ciout: 9718c2ecf20Sopenharmony_ci return err; 9728c2ecf20Sopenharmony_ci 9738c2ecf20Sopenharmony_ciout_cleanup_tags: 9748c2ecf20Sopenharmony_ci blk_mq_free_tag_set(&ubd_dev->tag_set); 9758c2ecf20Sopenharmony_ci if (!(IS_ERR(ubd_dev->queue))) 9768c2ecf20Sopenharmony_ci blk_cleanup_queue(ubd_dev->queue); 9778c2ecf20Sopenharmony_ci goto out; 9788c2ecf20Sopenharmony_ci} 9798c2ecf20Sopenharmony_ci 9808c2ecf20Sopenharmony_cistatic int ubd_config(char *str, char **error_out) 9818c2ecf20Sopenharmony_ci{ 9828c2ecf20Sopenharmony_ci int n, ret; 9838c2ecf20Sopenharmony_ci 9848c2ecf20Sopenharmony_ci /* This string is possibly broken up and stored, so it's only 9858c2ecf20Sopenharmony_ci * freed if ubd_setup_common fails, or if only general options 9868c2ecf20Sopenharmony_ci * were set. 9878c2ecf20Sopenharmony_ci */ 9888c2ecf20Sopenharmony_ci str = kstrdup(str, GFP_KERNEL); 9898c2ecf20Sopenharmony_ci if (str == NULL) { 9908c2ecf20Sopenharmony_ci *error_out = "Failed to allocate memory"; 9918c2ecf20Sopenharmony_ci return -ENOMEM; 9928c2ecf20Sopenharmony_ci } 9938c2ecf20Sopenharmony_ci 9948c2ecf20Sopenharmony_ci ret = ubd_setup_common(str, &n, error_out); 9958c2ecf20Sopenharmony_ci if (ret) 9968c2ecf20Sopenharmony_ci goto err_free; 9978c2ecf20Sopenharmony_ci 9988c2ecf20Sopenharmony_ci if (n == -1) { 9998c2ecf20Sopenharmony_ci ret = 0; 10008c2ecf20Sopenharmony_ci goto err_free; 10018c2ecf20Sopenharmony_ci } 10028c2ecf20Sopenharmony_ci 10038c2ecf20Sopenharmony_ci mutex_lock(&ubd_lock); 10048c2ecf20Sopenharmony_ci ret = ubd_add(n, error_out); 10058c2ecf20Sopenharmony_ci if (ret) 10068c2ecf20Sopenharmony_ci ubd_devs[n].file = NULL; 10078c2ecf20Sopenharmony_ci mutex_unlock(&ubd_lock); 10088c2ecf20Sopenharmony_ci 10098c2ecf20Sopenharmony_ciout: 10108c2ecf20Sopenharmony_ci return ret; 10118c2ecf20Sopenharmony_ci 10128c2ecf20Sopenharmony_cierr_free: 10138c2ecf20Sopenharmony_ci kfree(str); 10148c2ecf20Sopenharmony_ci goto out; 10158c2ecf20Sopenharmony_ci} 10168c2ecf20Sopenharmony_ci 10178c2ecf20Sopenharmony_cistatic int ubd_get_config(char *name, char *str, int size, char **error_out) 10188c2ecf20Sopenharmony_ci{ 10198c2ecf20Sopenharmony_ci struct ubd *ubd_dev; 10208c2ecf20Sopenharmony_ci int n, len = 0; 10218c2ecf20Sopenharmony_ci 10228c2ecf20Sopenharmony_ci n = parse_unit(&name); 10238c2ecf20Sopenharmony_ci if((n >= MAX_DEV) || (n < 0)){ 10248c2ecf20Sopenharmony_ci *error_out = "ubd_get_config : device number out of range"; 10258c2ecf20Sopenharmony_ci return -1; 10268c2ecf20Sopenharmony_ci } 10278c2ecf20Sopenharmony_ci 10288c2ecf20Sopenharmony_ci ubd_dev = &ubd_devs[n]; 10298c2ecf20Sopenharmony_ci mutex_lock(&ubd_lock); 10308c2ecf20Sopenharmony_ci 10318c2ecf20Sopenharmony_ci if(ubd_dev->file == NULL){ 10328c2ecf20Sopenharmony_ci CONFIG_CHUNK(str, size, len, "", 1); 10338c2ecf20Sopenharmony_ci goto out; 10348c2ecf20Sopenharmony_ci } 10358c2ecf20Sopenharmony_ci 10368c2ecf20Sopenharmony_ci CONFIG_CHUNK(str, size, len, ubd_dev->file, 0); 10378c2ecf20Sopenharmony_ci 10388c2ecf20Sopenharmony_ci if(ubd_dev->cow.file != NULL){ 10398c2ecf20Sopenharmony_ci CONFIG_CHUNK(str, size, len, ",", 0); 10408c2ecf20Sopenharmony_ci CONFIG_CHUNK(str, size, len, ubd_dev->cow.file, 1); 10418c2ecf20Sopenharmony_ci } 10428c2ecf20Sopenharmony_ci else CONFIG_CHUNK(str, size, len, "", 1); 10438c2ecf20Sopenharmony_ci 10448c2ecf20Sopenharmony_ci out: 10458c2ecf20Sopenharmony_ci mutex_unlock(&ubd_lock); 10468c2ecf20Sopenharmony_ci return len; 10478c2ecf20Sopenharmony_ci} 10488c2ecf20Sopenharmony_ci 10498c2ecf20Sopenharmony_cistatic int ubd_id(char **str, int *start_out, int *end_out) 10508c2ecf20Sopenharmony_ci{ 10518c2ecf20Sopenharmony_ci int n; 10528c2ecf20Sopenharmony_ci 10538c2ecf20Sopenharmony_ci n = parse_unit(str); 10548c2ecf20Sopenharmony_ci *start_out = 0; 10558c2ecf20Sopenharmony_ci *end_out = MAX_DEV - 1; 10568c2ecf20Sopenharmony_ci return n; 10578c2ecf20Sopenharmony_ci} 10588c2ecf20Sopenharmony_ci 10598c2ecf20Sopenharmony_cistatic int ubd_remove(int n, char **error_out) 10608c2ecf20Sopenharmony_ci{ 10618c2ecf20Sopenharmony_ci struct gendisk *disk = ubd_gendisk[n]; 10628c2ecf20Sopenharmony_ci struct ubd *ubd_dev; 10638c2ecf20Sopenharmony_ci int err = -ENODEV; 10648c2ecf20Sopenharmony_ci 10658c2ecf20Sopenharmony_ci mutex_lock(&ubd_lock); 10668c2ecf20Sopenharmony_ci 10678c2ecf20Sopenharmony_ci ubd_dev = &ubd_devs[n]; 10688c2ecf20Sopenharmony_ci 10698c2ecf20Sopenharmony_ci if(ubd_dev->file == NULL) 10708c2ecf20Sopenharmony_ci goto out; 10718c2ecf20Sopenharmony_ci 10728c2ecf20Sopenharmony_ci /* you cannot remove a open disk */ 10738c2ecf20Sopenharmony_ci err = -EBUSY; 10748c2ecf20Sopenharmony_ci if(ubd_dev->count > 0) 10758c2ecf20Sopenharmony_ci goto out; 10768c2ecf20Sopenharmony_ci 10778c2ecf20Sopenharmony_ci ubd_gendisk[n] = NULL; 10788c2ecf20Sopenharmony_ci if(disk != NULL){ 10798c2ecf20Sopenharmony_ci del_gendisk(disk); 10808c2ecf20Sopenharmony_ci put_disk(disk); 10818c2ecf20Sopenharmony_ci } 10828c2ecf20Sopenharmony_ci 10838c2ecf20Sopenharmony_ci if(fake_gendisk[n] != NULL){ 10848c2ecf20Sopenharmony_ci del_gendisk(fake_gendisk[n]); 10858c2ecf20Sopenharmony_ci put_disk(fake_gendisk[n]); 10868c2ecf20Sopenharmony_ci fake_gendisk[n] = NULL; 10878c2ecf20Sopenharmony_ci } 10888c2ecf20Sopenharmony_ci 10898c2ecf20Sopenharmony_ci err = 0; 10908c2ecf20Sopenharmony_ci platform_device_unregister(&ubd_dev->pdev); 10918c2ecf20Sopenharmony_ciout: 10928c2ecf20Sopenharmony_ci mutex_unlock(&ubd_lock); 10938c2ecf20Sopenharmony_ci return err; 10948c2ecf20Sopenharmony_ci} 10958c2ecf20Sopenharmony_ci 10968c2ecf20Sopenharmony_ci/* All these are called by mconsole in process context and without 10978c2ecf20Sopenharmony_ci * ubd-specific locks. The structure itself is const except for .list. 10988c2ecf20Sopenharmony_ci */ 10998c2ecf20Sopenharmony_cistatic struct mc_device ubd_mc = { 11008c2ecf20Sopenharmony_ci .list = LIST_HEAD_INIT(ubd_mc.list), 11018c2ecf20Sopenharmony_ci .name = "ubd", 11028c2ecf20Sopenharmony_ci .config = ubd_config, 11038c2ecf20Sopenharmony_ci .get_config = ubd_get_config, 11048c2ecf20Sopenharmony_ci .id = ubd_id, 11058c2ecf20Sopenharmony_ci .remove = ubd_remove, 11068c2ecf20Sopenharmony_ci}; 11078c2ecf20Sopenharmony_ci 11088c2ecf20Sopenharmony_cistatic int __init ubd_mc_init(void) 11098c2ecf20Sopenharmony_ci{ 11108c2ecf20Sopenharmony_ci mconsole_register_dev(&ubd_mc); 11118c2ecf20Sopenharmony_ci return 0; 11128c2ecf20Sopenharmony_ci} 11138c2ecf20Sopenharmony_ci 11148c2ecf20Sopenharmony_ci__initcall(ubd_mc_init); 11158c2ecf20Sopenharmony_ci 11168c2ecf20Sopenharmony_cistatic int __init ubd0_init(void) 11178c2ecf20Sopenharmony_ci{ 11188c2ecf20Sopenharmony_ci struct ubd *ubd_dev = &ubd_devs[0]; 11198c2ecf20Sopenharmony_ci 11208c2ecf20Sopenharmony_ci mutex_lock(&ubd_lock); 11218c2ecf20Sopenharmony_ci if(ubd_dev->file == NULL) 11228c2ecf20Sopenharmony_ci ubd_dev->file = "root_fs"; 11238c2ecf20Sopenharmony_ci mutex_unlock(&ubd_lock); 11248c2ecf20Sopenharmony_ci 11258c2ecf20Sopenharmony_ci return 0; 11268c2ecf20Sopenharmony_ci} 11278c2ecf20Sopenharmony_ci 11288c2ecf20Sopenharmony_ci__initcall(ubd0_init); 11298c2ecf20Sopenharmony_ci 11308c2ecf20Sopenharmony_ci/* Used in ubd_init, which is an initcall */ 11318c2ecf20Sopenharmony_cistatic struct platform_driver ubd_driver = { 11328c2ecf20Sopenharmony_ci .driver = { 11338c2ecf20Sopenharmony_ci .name = DRIVER_NAME, 11348c2ecf20Sopenharmony_ci }, 11358c2ecf20Sopenharmony_ci}; 11368c2ecf20Sopenharmony_ci 11378c2ecf20Sopenharmony_cistatic int __init ubd_init(void) 11388c2ecf20Sopenharmony_ci{ 11398c2ecf20Sopenharmony_ci char *error; 11408c2ecf20Sopenharmony_ci int i, err; 11418c2ecf20Sopenharmony_ci 11428c2ecf20Sopenharmony_ci if (register_blkdev(UBD_MAJOR, "ubd")) 11438c2ecf20Sopenharmony_ci return -1; 11448c2ecf20Sopenharmony_ci 11458c2ecf20Sopenharmony_ci if (fake_major != UBD_MAJOR) { 11468c2ecf20Sopenharmony_ci char name[sizeof("ubd_nnn\0")]; 11478c2ecf20Sopenharmony_ci 11488c2ecf20Sopenharmony_ci snprintf(name, sizeof(name), "ubd_%d", fake_major); 11498c2ecf20Sopenharmony_ci if (register_blkdev(fake_major, "ubd")) 11508c2ecf20Sopenharmony_ci return -1; 11518c2ecf20Sopenharmony_ci } 11528c2ecf20Sopenharmony_ci 11538c2ecf20Sopenharmony_ci irq_req_buffer = kmalloc_array(UBD_REQ_BUFFER_SIZE, 11548c2ecf20Sopenharmony_ci sizeof(struct io_thread_req *), 11558c2ecf20Sopenharmony_ci GFP_KERNEL 11568c2ecf20Sopenharmony_ci ); 11578c2ecf20Sopenharmony_ci irq_remainder = 0; 11588c2ecf20Sopenharmony_ci 11598c2ecf20Sopenharmony_ci if (irq_req_buffer == NULL) { 11608c2ecf20Sopenharmony_ci printk(KERN_ERR "Failed to initialize ubd buffering\n"); 11618c2ecf20Sopenharmony_ci return -1; 11628c2ecf20Sopenharmony_ci } 11638c2ecf20Sopenharmony_ci io_req_buffer = kmalloc_array(UBD_REQ_BUFFER_SIZE, 11648c2ecf20Sopenharmony_ci sizeof(struct io_thread_req *), 11658c2ecf20Sopenharmony_ci GFP_KERNEL 11668c2ecf20Sopenharmony_ci ); 11678c2ecf20Sopenharmony_ci 11688c2ecf20Sopenharmony_ci io_remainder = 0; 11698c2ecf20Sopenharmony_ci 11708c2ecf20Sopenharmony_ci if (io_req_buffer == NULL) { 11718c2ecf20Sopenharmony_ci printk(KERN_ERR "Failed to initialize ubd buffering\n"); 11728c2ecf20Sopenharmony_ci return -1; 11738c2ecf20Sopenharmony_ci } 11748c2ecf20Sopenharmony_ci platform_driver_register(&ubd_driver); 11758c2ecf20Sopenharmony_ci mutex_lock(&ubd_lock); 11768c2ecf20Sopenharmony_ci for (i = 0; i < MAX_DEV; i++){ 11778c2ecf20Sopenharmony_ci err = ubd_add(i, &error); 11788c2ecf20Sopenharmony_ci if(err) 11798c2ecf20Sopenharmony_ci printk(KERN_ERR "Failed to initialize ubd device %d :" 11808c2ecf20Sopenharmony_ci "%s\n", i, error); 11818c2ecf20Sopenharmony_ci } 11828c2ecf20Sopenharmony_ci mutex_unlock(&ubd_lock); 11838c2ecf20Sopenharmony_ci return 0; 11848c2ecf20Sopenharmony_ci} 11858c2ecf20Sopenharmony_ci 11868c2ecf20Sopenharmony_cilate_initcall(ubd_init); 11878c2ecf20Sopenharmony_ci 11888c2ecf20Sopenharmony_cistatic int __init ubd_driver_init(void){ 11898c2ecf20Sopenharmony_ci unsigned long stack; 11908c2ecf20Sopenharmony_ci int err; 11918c2ecf20Sopenharmony_ci 11928c2ecf20Sopenharmony_ci /* Set by CONFIG_BLK_DEV_UBD_SYNC or ubd=sync.*/ 11938c2ecf20Sopenharmony_ci if(global_openflags.s){ 11948c2ecf20Sopenharmony_ci printk(KERN_INFO "ubd: Synchronous mode\n"); 11958c2ecf20Sopenharmony_ci /* Letting ubd=sync be like using ubd#s= instead of ubd#= is 11968c2ecf20Sopenharmony_ci * enough. So use anyway the io thread. */ 11978c2ecf20Sopenharmony_ci } 11988c2ecf20Sopenharmony_ci stack = alloc_stack(0, 0); 11998c2ecf20Sopenharmony_ci io_pid = start_io_thread(stack + PAGE_SIZE - sizeof(void *), 12008c2ecf20Sopenharmony_ci &thread_fd); 12018c2ecf20Sopenharmony_ci if(io_pid < 0){ 12028c2ecf20Sopenharmony_ci printk(KERN_ERR 12038c2ecf20Sopenharmony_ci "ubd : Failed to start I/O thread (errno = %d) - " 12048c2ecf20Sopenharmony_ci "falling back to synchronous I/O\n", -io_pid); 12058c2ecf20Sopenharmony_ci io_pid = -1; 12068c2ecf20Sopenharmony_ci return 0; 12078c2ecf20Sopenharmony_ci } 12088c2ecf20Sopenharmony_ci err = um_request_irq(UBD_IRQ, thread_fd, IRQ_READ, ubd_intr, 12098c2ecf20Sopenharmony_ci 0, "ubd", ubd_devs); 12108c2ecf20Sopenharmony_ci if(err != 0) 12118c2ecf20Sopenharmony_ci printk(KERN_ERR "um_request_irq failed - errno = %d\n", -err); 12128c2ecf20Sopenharmony_ci return 0; 12138c2ecf20Sopenharmony_ci} 12148c2ecf20Sopenharmony_ci 12158c2ecf20Sopenharmony_cidevice_initcall(ubd_driver_init); 12168c2ecf20Sopenharmony_ci 12178c2ecf20Sopenharmony_cistatic int ubd_open(struct block_device *bdev, fmode_t mode) 12188c2ecf20Sopenharmony_ci{ 12198c2ecf20Sopenharmony_ci struct gendisk *disk = bdev->bd_disk; 12208c2ecf20Sopenharmony_ci struct ubd *ubd_dev = disk->private_data; 12218c2ecf20Sopenharmony_ci int err = 0; 12228c2ecf20Sopenharmony_ci 12238c2ecf20Sopenharmony_ci mutex_lock(&ubd_mutex); 12248c2ecf20Sopenharmony_ci if(ubd_dev->count == 0){ 12258c2ecf20Sopenharmony_ci err = ubd_open_dev(ubd_dev); 12268c2ecf20Sopenharmony_ci if(err){ 12278c2ecf20Sopenharmony_ci printk(KERN_ERR "%s: Can't open \"%s\": errno = %d\n", 12288c2ecf20Sopenharmony_ci disk->disk_name, ubd_dev->file, -err); 12298c2ecf20Sopenharmony_ci goto out; 12308c2ecf20Sopenharmony_ci } 12318c2ecf20Sopenharmony_ci } 12328c2ecf20Sopenharmony_ci ubd_dev->count++; 12338c2ecf20Sopenharmony_ci set_disk_ro(disk, !ubd_dev->openflags.w); 12348c2ecf20Sopenharmony_ci 12358c2ecf20Sopenharmony_ci /* This should no more be needed. And it didn't work anyway to exclude 12368c2ecf20Sopenharmony_ci * read-write remounting of filesystems.*/ 12378c2ecf20Sopenharmony_ci /*if((mode & FMODE_WRITE) && !ubd_dev->openflags.w){ 12388c2ecf20Sopenharmony_ci if(--ubd_dev->count == 0) ubd_close_dev(ubd_dev); 12398c2ecf20Sopenharmony_ci err = -EROFS; 12408c2ecf20Sopenharmony_ci }*/ 12418c2ecf20Sopenharmony_ciout: 12428c2ecf20Sopenharmony_ci mutex_unlock(&ubd_mutex); 12438c2ecf20Sopenharmony_ci return err; 12448c2ecf20Sopenharmony_ci} 12458c2ecf20Sopenharmony_ci 12468c2ecf20Sopenharmony_cistatic void ubd_release(struct gendisk *disk, fmode_t mode) 12478c2ecf20Sopenharmony_ci{ 12488c2ecf20Sopenharmony_ci struct ubd *ubd_dev = disk->private_data; 12498c2ecf20Sopenharmony_ci 12508c2ecf20Sopenharmony_ci mutex_lock(&ubd_mutex); 12518c2ecf20Sopenharmony_ci if(--ubd_dev->count == 0) 12528c2ecf20Sopenharmony_ci ubd_close_dev(ubd_dev); 12538c2ecf20Sopenharmony_ci mutex_unlock(&ubd_mutex); 12548c2ecf20Sopenharmony_ci} 12558c2ecf20Sopenharmony_ci 12568c2ecf20Sopenharmony_cistatic void cowify_bitmap(__u64 io_offset, int length, unsigned long *cow_mask, 12578c2ecf20Sopenharmony_ci __u64 *cow_offset, unsigned long *bitmap, 12588c2ecf20Sopenharmony_ci __u64 bitmap_offset, unsigned long *bitmap_words, 12598c2ecf20Sopenharmony_ci __u64 bitmap_len) 12608c2ecf20Sopenharmony_ci{ 12618c2ecf20Sopenharmony_ci __u64 sector = io_offset >> SECTOR_SHIFT; 12628c2ecf20Sopenharmony_ci int i, update_bitmap = 0; 12638c2ecf20Sopenharmony_ci 12648c2ecf20Sopenharmony_ci for (i = 0; i < length >> SECTOR_SHIFT; i++) { 12658c2ecf20Sopenharmony_ci if(cow_mask != NULL) 12668c2ecf20Sopenharmony_ci ubd_set_bit(i, (unsigned char *) cow_mask); 12678c2ecf20Sopenharmony_ci if(ubd_test_bit(sector + i, (unsigned char *) bitmap)) 12688c2ecf20Sopenharmony_ci continue; 12698c2ecf20Sopenharmony_ci 12708c2ecf20Sopenharmony_ci update_bitmap = 1; 12718c2ecf20Sopenharmony_ci ubd_set_bit(sector + i, (unsigned char *) bitmap); 12728c2ecf20Sopenharmony_ci } 12738c2ecf20Sopenharmony_ci 12748c2ecf20Sopenharmony_ci if(!update_bitmap) 12758c2ecf20Sopenharmony_ci return; 12768c2ecf20Sopenharmony_ci 12778c2ecf20Sopenharmony_ci *cow_offset = sector / (sizeof(unsigned long) * 8); 12788c2ecf20Sopenharmony_ci 12798c2ecf20Sopenharmony_ci /* This takes care of the case where we're exactly at the end of the 12808c2ecf20Sopenharmony_ci * device, and *cow_offset + 1 is off the end. So, just back it up 12818c2ecf20Sopenharmony_ci * by one word. Thanks to Lynn Kerby for the fix and James McMechan 12828c2ecf20Sopenharmony_ci * for the original diagnosis. 12838c2ecf20Sopenharmony_ci */ 12848c2ecf20Sopenharmony_ci if (*cow_offset == (DIV_ROUND_UP(bitmap_len, 12858c2ecf20Sopenharmony_ci sizeof(unsigned long)) - 1)) 12868c2ecf20Sopenharmony_ci (*cow_offset)--; 12878c2ecf20Sopenharmony_ci 12888c2ecf20Sopenharmony_ci bitmap_words[0] = bitmap[*cow_offset]; 12898c2ecf20Sopenharmony_ci bitmap_words[1] = bitmap[*cow_offset + 1]; 12908c2ecf20Sopenharmony_ci 12918c2ecf20Sopenharmony_ci *cow_offset *= sizeof(unsigned long); 12928c2ecf20Sopenharmony_ci *cow_offset += bitmap_offset; 12938c2ecf20Sopenharmony_ci} 12948c2ecf20Sopenharmony_ci 12958c2ecf20Sopenharmony_cistatic void cowify_req(struct io_thread_req *req, struct io_desc *segment, 12968c2ecf20Sopenharmony_ci unsigned long offset, unsigned long *bitmap, 12978c2ecf20Sopenharmony_ci __u64 bitmap_offset, __u64 bitmap_len) 12988c2ecf20Sopenharmony_ci{ 12998c2ecf20Sopenharmony_ci __u64 sector = offset >> SECTOR_SHIFT; 13008c2ecf20Sopenharmony_ci int i; 13018c2ecf20Sopenharmony_ci 13028c2ecf20Sopenharmony_ci if (segment->length > (sizeof(segment->sector_mask) * 8) << SECTOR_SHIFT) 13038c2ecf20Sopenharmony_ci panic("Operation too long"); 13048c2ecf20Sopenharmony_ci 13058c2ecf20Sopenharmony_ci if (req_op(req->req) == REQ_OP_READ) { 13068c2ecf20Sopenharmony_ci for (i = 0; i < segment->length >> SECTOR_SHIFT; i++) { 13078c2ecf20Sopenharmony_ci if(ubd_test_bit(sector + i, (unsigned char *) bitmap)) 13088c2ecf20Sopenharmony_ci ubd_set_bit(i, (unsigned char *) 13098c2ecf20Sopenharmony_ci &segment->sector_mask); 13108c2ecf20Sopenharmony_ci } 13118c2ecf20Sopenharmony_ci } else { 13128c2ecf20Sopenharmony_ci cowify_bitmap(offset, segment->length, &segment->sector_mask, 13138c2ecf20Sopenharmony_ci &segment->cow_offset, bitmap, bitmap_offset, 13148c2ecf20Sopenharmony_ci segment->bitmap_words, bitmap_len); 13158c2ecf20Sopenharmony_ci } 13168c2ecf20Sopenharmony_ci} 13178c2ecf20Sopenharmony_ci 13188c2ecf20Sopenharmony_cistatic void ubd_map_req(struct ubd *dev, struct io_thread_req *io_req, 13198c2ecf20Sopenharmony_ci struct request *req) 13208c2ecf20Sopenharmony_ci{ 13218c2ecf20Sopenharmony_ci struct bio_vec bvec; 13228c2ecf20Sopenharmony_ci struct req_iterator iter; 13238c2ecf20Sopenharmony_ci int i = 0; 13248c2ecf20Sopenharmony_ci unsigned long byte_offset = io_req->offset; 13258c2ecf20Sopenharmony_ci int op = req_op(req); 13268c2ecf20Sopenharmony_ci 13278c2ecf20Sopenharmony_ci if (op == REQ_OP_WRITE_ZEROES || op == REQ_OP_DISCARD) { 13288c2ecf20Sopenharmony_ci io_req->io_desc[0].buffer = NULL; 13298c2ecf20Sopenharmony_ci io_req->io_desc[0].length = blk_rq_bytes(req); 13308c2ecf20Sopenharmony_ci } else { 13318c2ecf20Sopenharmony_ci rq_for_each_segment(bvec, req, iter) { 13328c2ecf20Sopenharmony_ci BUG_ON(i >= io_req->desc_cnt); 13338c2ecf20Sopenharmony_ci 13348c2ecf20Sopenharmony_ci io_req->io_desc[i].buffer = 13358c2ecf20Sopenharmony_ci page_address(bvec.bv_page) + bvec.bv_offset; 13368c2ecf20Sopenharmony_ci io_req->io_desc[i].length = bvec.bv_len; 13378c2ecf20Sopenharmony_ci i++; 13388c2ecf20Sopenharmony_ci } 13398c2ecf20Sopenharmony_ci } 13408c2ecf20Sopenharmony_ci 13418c2ecf20Sopenharmony_ci if (dev->cow.file) { 13428c2ecf20Sopenharmony_ci for (i = 0; i < io_req->desc_cnt; i++) { 13438c2ecf20Sopenharmony_ci cowify_req(io_req, &io_req->io_desc[i], byte_offset, 13448c2ecf20Sopenharmony_ci dev->cow.bitmap, dev->cow.bitmap_offset, 13458c2ecf20Sopenharmony_ci dev->cow.bitmap_len); 13468c2ecf20Sopenharmony_ci byte_offset += io_req->io_desc[i].length; 13478c2ecf20Sopenharmony_ci } 13488c2ecf20Sopenharmony_ci 13498c2ecf20Sopenharmony_ci } 13508c2ecf20Sopenharmony_ci} 13518c2ecf20Sopenharmony_ci 13528c2ecf20Sopenharmony_cistatic struct io_thread_req *ubd_alloc_req(struct ubd *dev, struct request *req, 13538c2ecf20Sopenharmony_ci int desc_cnt) 13548c2ecf20Sopenharmony_ci{ 13558c2ecf20Sopenharmony_ci struct io_thread_req *io_req; 13568c2ecf20Sopenharmony_ci int i; 13578c2ecf20Sopenharmony_ci 13588c2ecf20Sopenharmony_ci io_req = kmalloc(sizeof(*io_req) + 13598c2ecf20Sopenharmony_ci (desc_cnt * sizeof(struct io_desc)), 13608c2ecf20Sopenharmony_ci GFP_ATOMIC); 13618c2ecf20Sopenharmony_ci if (!io_req) 13628c2ecf20Sopenharmony_ci return NULL; 13638c2ecf20Sopenharmony_ci 13648c2ecf20Sopenharmony_ci io_req->req = req; 13658c2ecf20Sopenharmony_ci if (dev->cow.file) 13668c2ecf20Sopenharmony_ci io_req->fds[0] = dev->cow.fd; 13678c2ecf20Sopenharmony_ci else 13688c2ecf20Sopenharmony_ci io_req->fds[0] = dev->fd; 13698c2ecf20Sopenharmony_ci io_req->error = 0; 13708c2ecf20Sopenharmony_ci io_req->sectorsize = SECTOR_SIZE; 13718c2ecf20Sopenharmony_ci io_req->fds[1] = dev->fd; 13728c2ecf20Sopenharmony_ci io_req->offset = (u64) blk_rq_pos(req) << SECTOR_SHIFT; 13738c2ecf20Sopenharmony_ci io_req->offsets[0] = 0; 13748c2ecf20Sopenharmony_ci io_req->offsets[1] = dev->cow.data_offset; 13758c2ecf20Sopenharmony_ci 13768c2ecf20Sopenharmony_ci for (i = 0 ; i < desc_cnt; i++) { 13778c2ecf20Sopenharmony_ci io_req->io_desc[i].sector_mask = 0; 13788c2ecf20Sopenharmony_ci io_req->io_desc[i].cow_offset = -1; 13798c2ecf20Sopenharmony_ci } 13808c2ecf20Sopenharmony_ci 13818c2ecf20Sopenharmony_ci return io_req; 13828c2ecf20Sopenharmony_ci} 13838c2ecf20Sopenharmony_ci 13848c2ecf20Sopenharmony_cistatic int ubd_submit_request(struct ubd *dev, struct request *req) 13858c2ecf20Sopenharmony_ci{ 13868c2ecf20Sopenharmony_ci int segs = 0; 13878c2ecf20Sopenharmony_ci struct io_thread_req *io_req; 13888c2ecf20Sopenharmony_ci int ret; 13898c2ecf20Sopenharmony_ci int op = req_op(req); 13908c2ecf20Sopenharmony_ci 13918c2ecf20Sopenharmony_ci if (op == REQ_OP_FLUSH) 13928c2ecf20Sopenharmony_ci segs = 0; 13938c2ecf20Sopenharmony_ci else if (op == REQ_OP_WRITE_ZEROES || op == REQ_OP_DISCARD) 13948c2ecf20Sopenharmony_ci segs = 1; 13958c2ecf20Sopenharmony_ci else 13968c2ecf20Sopenharmony_ci segs = blk_rq_nr_phys_segments(req); 13978c2ecf20Sopenharmony_ci 13988c2ecf20Sopenharmony_ci io_req = ubd_alloc_req(dev, req, segs); 13998c2ecf20Sopenharmony_ci if (!io_req) 14008c2ecf20Sopenharmony_ci return -ENOMEM; 14018c2ecf20Sopenharmony_ci 14028c2ecf20Sopenharmony_ci io_req->desc_cnt = segs; 14038c2ecf20Sopenharmony_ci if (segs) 14048c2ecf20Sopenharmony_ci ubd_map_req(dev, io_req, req); 14058c2ecf20Sopenharmony_ci 14068c2ecf20Sopenharmony_ci ret = os_write_file(thread_fd, &io_req, sizeof(io_req)); 14078c2ecf20Sopenharmony_ci if (ret != sizeof(io_req)) { 14088c2ecf20Sopenharmony_ci if (ret != -EAGAIN) 14098c2ecf20Sopenharmony_ci pr_err("write to io thread failed: %d\n", -ret); 14108c2ecf20Sopenharmony_ci kfree(io_req); 14118c2ecf20Sopenharmony_ci } 14128c2ecf20Sopenharmony_ci return ret; 14138c2ecf20Sopenharmony_ci} 14148c2ecf20Sopenharmony_ci 14158c2ecf20Sopenharmony_cistatic blk_status_t ubd_queue_rq(struct blk_mq_hw_ctx *hctx, 14168c2ecf20Sopenharmony_ci const struct blk_mq_queue_data *bd) 14178c2ecf20Sopenharmony_ci{ 14188c2ecf20Sopenharmony_ci struct ubd *ubd_dev = hctx->queue->queuedata; 14198c2ecf20Sopenharmony_ci struct request *req = bd->rq; 14208c2ecf20Sopenharmony_ci int ret = 0, res = BLK_STS_OK; 14218c2ecf20Sopenharmony_ci 14228c2ecf20Sopenharmony_ci blk_mq_start_request(req); 14238c2ecf20Sopenharmony_ci 14248c2ecf20Sopenharmony_ci spin_lock_irq(&ubd_dev->lock); 14258c2ecf20Sopenharmony_ci 14268c2ecf20Sopenharmony_ci switch (req_op(req)) { 14278c2ecf20Sopenharmony_ci case REQ_OP_FLUSH: 14288c2ecf20Sopenharmony_ci case REQ_OP_READ: 14298c2ecf20Sopenharmony_ci case REQ_OP_WRITE: 14308c2ecf20Sopenharmony_ci case REQ_OP_DISCARD: 14318c2ecf20Sopenharmony_ci case REQ_OP_WRITE_ZEROES: 14328c2ecf20Sopenharmony_ci ret = ubd_submit_request(ubd_dev, req); 14338c2ecf20Sopenharmony_ci break; 14348c2ecf20Sopenharmony_ci default: 14358c2ecf20Sopenharmony_ci WARN_ON_ONCE(1); 14368c2ecf20Sopenharmony_ci res = BLK_STS_NOTSUPP; 14378c2ecf20Sopenharmony_ci } 14388c2ecf20Sopenharmony_ci 14398c2ecf20Sopenharmony_ci spin_unlock_irq(&ubd_dev->lock); 14408c2ecf20Sopenharmony_ci 14418c2ecf20Sopenharmony_ci if (ret < 0) { 14428c2ecf20Sopenharmony_ci if (ret == -ENOMEM) 14438c2ecf20Sopenharmony_ci res = BLK_STS_RESOURCE; 14448c2ecf20Sopenharmony_ci else 14458c2ecf20Sopenharmony_ci res = BLK_STS_DEV_RESOURCE; 14468c2ecf20Sopenharmony_ci } 14478c2ecf20Sopenharmony_ci 14488c2ecf20Sopenharmony_ci return res; 14498c2ecf20Sopenharmony_ci} 14508c2ecf20Sopenharmony_ci 14518c2ecf20Sopenharmony_cistatic int ubd_getgeo(struct block_device *bdev, struct hd_geometry *geo) 14528c2ecf20Sopenharmony_ci{ 14538c2ecf20Sopenharmony_ci struct ubd *ubd_dev = bdev->bd_disk->private_data; 14548c2ecf20Sopenharmony_ci 14558c2ecf20Sopenharmony_ci geo->heads = 128; 14568c2ecf20Sopenharmony_ci geo->sectors = 32; 14578c2ecf20Sopenharmony_ci geo->cylinders = ubd_dev->size / (128 * 32 * 512); 14588c2ecf20Sopenharmony_ci return 0; 14598c2ecf20Sopenharmony_ci} 14608c2ecf20Sopenharmony_ci 14618c2ecf20Sopenharmony_cistatic int ubd_ioctl(struct block_device *bdev, fmode_t mode, 14628c2ecf20Sopenharmony_ci unsigned int cmd, unsigned long arg) 14638c2ecf20Sopenharmony_ci{ 14648c2ecf20Sopenharmony_ci struct ubd *ubd_dev = bdev->bd_disk->private_data; 14658c2ecf20Sopenharmony_ci u16 ubd_id[ATA_ID_WORDS]; 14668c2ecf20Sopenharmony_ci 14678c2ecf20Sopenharmony_ci switch (cmd) { 14688c2ecf20Sopenharmony_ci struct cdrom_volctrl volume; 14698c2ecf20Sopenharmony_ci case HDIO_GET_IDENTITY: 14708c2ecf20Sopenharmony_ci memset(&ubd_id, 0, ATA_ID_WORDS * 2); 14718c2ecf20Sopenharmony_ci ubd_id[ATA_ID_CYLS] = ubd_dev->size / (128 * 32 * 512); 14728c2ecf20Sopenharmony_ci ubd_id[ATA_ID_HEADS] = 128; 14738c2ecf20Sopenharmony_ci ubd_id[ATA_ID_SECTORS] = 32; 14748c2ecf20Sopenharmony_ci if(copy_to_user((char __user *) arg, (char *) &ubd_id, 14758c2ecf20Sopenharmony_ci sizeof(ubd_id))) 14768c2ecf20Sopenharmony_ci return -EFAULT; 14778c2ecf20Sopenharmony_ci return 0; 14788c2ecf20Sopenharmony_ci 14798c2ecf20Sopenharmony_ci case CDROMVOLREAD: 14808c2ecf20Sopenharmony_ci if(copy_from_user(&volume, (char __user *) arg, sizeof(volume))) 14818c2ecf20Sopenharmony_ci return -EFAULT; 14828c2ecf20Sopenharmony_ci volume.channel0 = 255; 14838c2ecf20Sopenharmony_ci volume.channel1 = 255; 14848c2ecf20Sopenharmony_ci volume.channel2 = 255; 14858c2ecf20Sopenharmony_ci volume.channel3 = 255; 14868c2ecf20Sopenharmony_ci if(copy_to_user((char __user *) arg, &volume, sizeof(volume))) 14878c2ecf20Sopenharmony_ci return -EFAULT; 14888c2ecf20Sopenharmony_ci return 0; 14898c2ecf20Sopenharmony_ci } 14908c2ecf20Sopenharmony_ci return -EINVAL; 14918c2ecf20Sopenharmony_ci} 14928c2ecf20Sopenharmony_ci 14938c2ecf20Sopenharmony_cistatic int map_error(int error_code) 14948c2ecf20Sopenharmony_ci{ 14958c2ecf20Sopenharmony_ci switch (error_code) { 14968c2ecf20Sopenharmony_ci case 0: 14978c2ecf20Sopenharmony_ci return BLK_STS_OK; 14988c2ecf20Sopenharmony_ci case ENOSYS: 14998c2ecf20Sopenharmony_ci case EOPNOTSUPP: 15008c2ecf20Sopenharmony_ci return BLK_STS_NOTSUPP; 15018c2ecf20Sopenharmony_ci case ENOSPC: 15028c2ecf20Sopenharmony_ci return BLK_STS_NOSPC; 15038c2ecf20Sopenharmony_ci } 15048c2ecf20Sopenharmony_ci return BLK_STS_IOERR; 15058c2ecf20Sopenharmony_ci} 15068c2ecf20Sopenharmony_ci 15078c2ecf20Sopenharmony_ci/* 15088c2ecf20Sopenharmony_ci * Everything from here onwards *IS NOT PART OF THE KERNEL* 15098c2ecf20Sopenharmony_ci * 15108c2ecf20Sopenharmony_ci * The following functions are part of UML hypervisor code. 15118c2ecf20Sopenharmony_ci * All functions from here onwards are executed as a helper 15128c2ecf20Sopenharmony_ci * thread and are not allowed to execute any kernel functions. 15138c2ecf20Sopenharmony_ci * 15148c2ecf20Sopenharmony_ci * Any communication must occur strictly via shared memory and IPC. 15158c2ecf20Sopenharmony_ci * 15168c2ecf20Sopenharmony_ci * Do not add printks, locks, kernel memory operations, etc - it 15178c2ecf20Sopenharmony_ci * will result in unpredictable behaviour and/or crashes. 15188c2ecf20Sopenharmony_ci */ 15198c2ecf20Sopenharmony_ci 15208c2ecf20Sopenharmony_cistatic int update_bitmap(struct io_thread_req *req, struct io_desc *segment) 15218c2ecf20Sopenharmony_ci{ 15228c2ecf20Sopenharmony_ci int n; 15238c2ecf20Sopenharmony_ci 15248c2ecf20Sopenharmony_ci if (segment->cow_offset == -1) 15258c2ecf20Sopenharmony_ci return map_error(0); 15268c2ecf20Sopenharmony_ci 15278c2ecf20Sopenharmony_ci n = os_pwrite_file(req->fds[1], &segment->bitmap_words, 15288c2ecf20Sopenharmony_ci sizeof(segment->bitmap_words), segment->cow_offset); 15298c2ecf20Sopenharmony_ci if (n != sizeof(segment->bitmap_words)) 15308c2ecf20Sopenharmony_ci return map_error(-n); 15318c2ecf20Sopenharmony_ci 15328c2ecf20Sopenharmony_ci return map_error(0); 15338c2ecf20Sopenharmony_ci} 15348c2ecf20Sopenharmony_ci 15358c2ecf20Sopenharmony_cistatic void do_io(struct io_thread_req *req, struct io_desc *desc) 15368c2ecf20Sopenharmony_ci{ 15378c2ecf20Sopenharmony_ci char *buf = NULL; 15388c2ecf20Sopenharmony_ci unsigned long len; 15398c2ecf20Sopenharmony_ci int n, nsectors, start, end, bit; 15408c2ecf20Sopenharmony_ci __u64 off; 15418c2ecf20Sopenharmony_ci 15428c2ecf20Sopenharmony_ci /* FLUSH is really a special case, we cannot "case" it with others */ 15438c2ecf20Sopenharmony_ci 15448c2ecf20Sopenharmony_ci if (req_op(req->req) == REQ_OP_FLUSH) { 15458c2ecf20Sopenharmony_ci /* fds[0] is always either the rw image or our cow file */ 15468c2ecf20Sopenharmony_ci req->error = map_error(-os_sync_file(req->fds[0])); 15478c2ecf20Sopenharmony_ci return; 15488c2ecf20Sopenharmony_ci } 15498c2ecf20Sopenharmony_ci 15508c2ecf20Sopenharmony_ci nsectors = desc->length / req->sectorsize; 15518c2ecf20Sopenharmony_ci start = 0; 15528c2ecf20Sopenharmony_ci do { 15538c2ecf20Sopenharmony_ci bit = ubd_test_bit(start, (unsigned char *) &desc->sector_mask); 15548c2ecf20Sopenharmony_ci end = start; 15558c2ecf20Sopenharmony_ci while((end < nsectors) && 15568c2ecf20Sopenharmony_ci (ubd_test_bit(end, (unsigned char *) &desc->sector_mask) == bit)) 15578c2ecf20Sopenharmony_ci end++; 15588c2ecf20Sopenharmony_ci 15598c2ecf20Sopenharmony_ci off = req->offset + req->offsets[bit] + 15608c2ecf20Sopenharmony_ci start * req->sectorsize; 15618c2ecf20Sopenharmony_ci len = (end - start) * req->sectorsize; 15628c2ecf20Sopenharmony_ci if (desc->buffer != NULL) 15638c2ecf20Sopenharmony_ci buf = &desc->buffer[start * req->sectorsize]; 15648c2ecf20Sopenharmony_ci 15658c2ecf20Sopenharmony_ci switch (req_op(req->req)) { 15668c2ecf20Sopenharmony_ci case REQ_OP_READ: 15678c2ecf20Sopenharmony_ci n = 0; 15688c2ecf20Sopenharmony_ci do { 15698c2ecf20Sopenharmony_ci buf = &buf[n]; 15708c2ecf20Sopenharmony_ci len -= n; 15718c2ecf20Sopenharmony_ci n = os_pread_file(req->fds[bit], buf, len, off); 15728c2ecf20Sopenharmony_ci if (n < 0) { 15738c2ecf20Sopenharmony_ci req->error = map_error(-n); 15748c2ecf20Sopenharmony_ci return; 15758c2ecf20Sopenharmony_ci } 15768c2ecf20Sopenharmony_ci } while((n < len) && (n != 0)); 15778c2ecf20Sopenharmony_ci if (n < len) memset(&buf[n], 0, len - n); 15788c2ecf20Sopenharmony_ci break; 15798c2ecf20Sopenharmony_ci case REQ_OP_WRITE: 15808c2ecf20Sopenharmony_ci n = os_pwrite_file(req->fds[bit], buf, len, off); 15818c2ecf20Sopenharmony_ci if(n != len){ 15828c2ecf20Sopenharmony_ci req->error = map_error(-n); 15838c2ecf20Sopenharmony_ci return; 15848c2ecf20Sopenharmony_ci } 15858c2ecf20Sopenharmony_ci break; 15868c2ecf20Sopenharmony_ci case REQ_OP_DISCARD: 15878c2ecf20Sopenharmony_ci case REQ_OP_WRITE_ZEROES: 15888c2ecf20Sopenharmony_ci n = os_falloc_punch(req->fds[bit], off, len); 15898c2ecf20Sopenharmony_ci if (n) { 15908c2ecf20Sopenharmony_ci req->error = map_error(-n); 15918c2ecf20Sopenharmony_ci return; 15928c2ecf20Sopenharmony_ci } 15938c2ecf20Sopenharmony_ci break; 15948c2ecf20Sopenharmony_ci default: 15958c2ecf20Sopenharmony_ci WARN_ON_ONCE(1); 15968c2ecf20Sopenharmony_ci req->error = BLK_STS_NOTSUPP; 15978c2ecf20Sopenharmony_ci return; 15988c2ecf20Sopenharmony_ci } 15998c2ecf20Sopenharmony_ci 16008c2ecf20Sopenharmony_ci start = end; 16018c2ecf20Sopenharmony_ci } while(start < nsectors); 16028c2ecf20Sopenharmony_ci 16038c2ecf20Sopenharmony_ci req->offset += len; 16048c2ecf20Sopenharmony_ci req->error = update_bitmap(req, desc); 16058c2ecf20Sopenharmony_ci} 16068c2ecf20Sopenharmony_ci 16078c2ecf20Sopenharmony_ci/* Changed in start_io_thread, which is serialized by being called only 16088c2ecf20Sopenharmony_ci * from ubd_init, which is an initcall. 16098c2ecf20Sopenharmony_ci */ 16108c2ecf20Sopenharmony_ciint kernel_fd = -1; 16118c2ecf20Sopenharmony_ci 16128c2ecf20Sopenharmony_ci/* Only changed by the io thread. XXX: currently unused. */ 16138c2ecf20Sopenharmony_cistatic int io_count = 0; 16148c2ecf20Sopenharmony_ci 16158c2ecf20Sopenharmony_ciint io_thread(void *arg) 16168c2ecf20Sopenharmony_ci{ 16178c2ecf20Sopenharmony_ci int n, count, written, res; 16188c2ecf20Sopenharmony_ci 16198c2ecf20Sopenharmony_ci os_fix_helper_signals(); 16208c2ecf20Sopenharmony_ci 16218c2ecf20Sopenharmony_ci while(1){ 16228c2ecf20Sopenharmony_ci n = bulk_req_safe_read( 16238c2ecf20Sopenharmony_ci kernel_fd, 16248c2ecf20Sopenharmony_ci io_req_buffer, 16258c2ecf20Sopenharmony_ci &io_remainder, 16268c2ecf20Sopenharmony_ci &io_remainder_size, 16278c2ecf20Sopenharmony_ci UBD_REQ_BUFFER_SIZE 16288c2ecf20Sopenharmony_ci ); 16298c2ecf20Sopenharmony_ci if (n <= 0) { 16308c2ecf20Sopenharmony_ci if (n == -EAGAIN) 16318c2ecf20Sopenharmony_ci ubd_read_poll(-1); 16328c2ecf20Sopenharmony_ci 16338c2ecf20Sopenharmony_ci continue; 16348c2ecf20Sopenharmony_ci } 16358c2ecf20Sopenharmony_ci 16368c2ecf20Sopenharmony_ci for (count = 0; count < n/sizeof(struct io_thread_req *); count++) { 16378c2ecf20Sopenharmony_ci struct io_thread_req *req = (*io_req_buffer)[count]; 16388c2ecf20Sopenharmony_ci int i; 16398c2ecf20Sopenharmony_ci 16408c2ecf20Sopenharmony_ci io_count++; 16418c2ecf20Sopenharmony_ci for (i = 0; !req->error && i < req->desc_cnt; i++) 16428c2ecf20Sopenharmony_ci do_io(req, &(req->io_desc[i])); 16438c2ecf20Sopenharmony_ci 16448c2ecf20Sopenharmony_ci } 16458c2ecf20Sopenharmony_ci 16468c2ecf20Sopenharmony_ci written = 0; 16478c2ecf20Sopenharmony_ci 16488c2ecf20Sopenharmony_ci do { 16498c2ecf20Sopenharmony_ci res = os_write_file(kernel_fd, 16508c2ecf20Sopenharmony_ci ((char *) io_req_buffer) + written, 16518c2ecf20Sopenharmony_ci n - written); 16528c2ecf20Sopenharmony_ci if (res >= 0) { 16538c2ecf20Sopenharmony_ci written += res; 16548c2ecf20Sopenharmony_ci } 16558c2ecf20Sopenharmony_ci if (written < n) { 16568c2ecf20Sopenharmony_ci ubd_write_poll(-1); 16578c2ecf20Sopenharmony_ci } 16588c2ecf20Sopenharmony_ci } while (written < n); 16598c2ecf20Sopenharmony_ci } 16608c2ecf20Sopenharmony_ci 16618c2ecf20Sopenharmony_ci return 0; 16628c2ecf20Sopenharmony_ci} 1663