18c2ecf20Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0
28c2ecf20Sopenharmony_ci/*
38c2ecf20Sopenharmony_ci * Copyright (C) 2018 Cambridge Greys Ltd
48c2ecf20Sopenharmony_ci * Copyright (C) 2015-2016 Anton Ivanov (aivanov@brocade.com)
58c2ecf20Sopenharmony_ci * Copyright (C) 2000 Jeff Dike (jdike@karaya.com)
68c2ecf20Sopenharmony_ci */
78c2ecf20Sopenharmony_ci
88c2ecf20Sopenharmony_ci/* 2001-09-28...2002-04-17
98c2ecf20Sopenharmony_ci * Partition stuff by James_McMechan@hotmail.com
108c2ecf20Sopenharmony_ci * old style ubd by setting UBD_SHIFT to 0
118c2ecf20Sopenharmony_ci * 2002-09-27...2002-10-18 massive tinkering for 2.5
128c2ecf20Sopenharmony_ci * partitions have changed in 2.5
138c2ecf20Sopenharmony_ci * 2003-01-29 more tinkering for 2.5.59-1
148c2ecf20Sopenharmony_ci * This should now address the sysfs problems and has
158c2ecf20Sopenharmony_ci * the symlink for devfs to allow for booting with
168c2ecf20Sopenharmony_ci * the common /dev/ubd/discX/... names rather than
178c2ecf20Sopenharmony_ci * only /dev/ubdN/discN this version also has lots of
188c2ecf20Sopenharmony_ci * clean ups preparing for ubd-many.
198c2ecf20Sopenharmony_ci * James McMechan
208c2ecf20Sopenharmony_ci */
218c2ecf20Sopenharmony_ci
/*
 * Per the history note at the top of this file, a value of 0 selects the
 * old-style ubd layout.
 * NOTE(review): presumably the number of minor-number bits reserved per
 * unit for partitions - confirm against the disk registration code.
 */
#define UBD_SHIFT 4
238c2ecf20Sopenharmony_ci
248c2ecf20Sopenharmony_ci#include <linux/module.h>
258c2ecf20Sopenharmony_ci#include <linux/init.h>
268c2ecf20Sopenharmony_ci#include <linux/blkdev.h>
278c2ecf20Sopenharmony_ci#include <linux/blk-mq.h>
288c2ecf20Sopenharmony_ci#include <linux/ata.h>
298c2ecf20Sopenharmony_ci#include <linux/hdreg.h>
308c2ecf20Sopenharmony_ci#include <linux/cdrom.h>
318c2ecf20Sopenharmony_ci#include <linux/proc_fs.h>
328c2ecf20Sopenharmony_ci#include <linux/seq_file.h>
338c2ecf20Sopenharmony_ci#include <linux/ctype.h>
348c2ecf20Sopenharmony_ci#include <linux/slab.h>
358c2ecf20Sopenharmony_ci#include <linux/vmalloc.h>
368c2ecf20Sopenharmony_ci#include <linux/platform_device.h>
378c2ecf20Sopenharmony_ci#include <linux/scatterlist.h>
388c2ecf20Sopenharmony_ci#include <asm/tlbflush.h>
398c2ecf20Sopenharmony_ci#include <kern_util.h>
408c2ecf20Sopenharmony_ci#include "mconsole_kern.h"
418c2ecf20Sopenharmony_ci#include <init.h>
428c2ecf20Sopenharmony_ci#include <irq_kern.h>
438c2ecf20Sopenharmony_ci#include "ubd.h"
448c2ecf20Sopenharmony_ci#include <os.h>
458c2ecf20Sopenharmony_ci#include "cow.h"
468c2ecf20Sopenharmony_ci
/*
 * Max request size is determined by the sector mask (an unsigned long, so
 * one bit per sector gives 8 * sizeof(long) sectors) - 32K.
 */
#define UBD_MAX_REQUEST (8 * sizeof(long))
498c2ecf20Sopenharmony_ci
/*
 * One piece of an I/O request; io_thread_req carries an array of these.
 * NOTE(review): the per-field notes below are inferred from the names, the
 * code that fills them in is not in this part of the file - confirm there.
 */
struct io_desc {
	char *buffer;			/* data buffer of this piece */
	unsigned long length;		/* presumably bytes in buffer */
	unsigned long sector_mask;	/* presumably one bit per sector */
	unsigned long long cow_offset;	/* presumably offset in the COW file */
	unsigned long bitmap_words[2];	/* presumably COW bitmap words to write */
};
578c2ecf20Sopenharmony_ci
588c2ecf20Sopenharmony_cistruct io_thread_req {
598c2ecf20Sopenharmony_ci	struct request *req;
608c2ecf20Sopenharmony_ci	int fds[2];
618c2ecf20Sopenharmony_ci	unsigned long offsets[2];
628c2ecf20Sopenharmony_ci	unsigned long long offset;
638c2ecf20Sopenharmony_ci	int sectorsize;
648c2ecf20Sopenharmony_ci	int error;
658c2ecf20Sopenharmony_ci
668c2ecf20Sopenharmony_ci	int desc_cnt;
678c2ecf20Sopenharmony_ci	/* io_desc has to be the last element of the struct */
688c2ecf20Sopenharmony_ci	struct io_desc io_desc[];
698c2ecf20Sopenharmony_ci};
708c2ecf20Sopenharmony_ci
718c2ecf20Sopenharmony_ci
/*
 * Buffer of completed request pointers read by ubd_handler(), plus the
 * storage and byte count for a pointer that was only partially read.
 */
static struct io_thread_req * (*irq_req_buffer)[];
static struct io_thread_req *irq_remainder;
static int irq_remainder_size;

/*
 * Same trio as above.
 * NOTE(review): presumably used by the I/O thread side - its user is not in
 * this part of the file.
 */
static struct io_thread_req * (*io_req_buffer)[];
static struct io_thread_req *io_remainder;
static int io_remainder_size;
798c2ecf20Sopenharmony_ci
808c2ecf20Sopenharmony_ci
818c2ecf20Sopenharmony_ci
/*
 * Test bit number @bit in the byte array @data. Bits are counted from the
 * least significant bit of data[0] upwards.
 *
 * Returns 1 if the bit is set, 0 otherwise.
 */
static inline int ubd_test_bit(__u64 bit, unsigned char *data)
{
	const int bits_per_byte = sizeof(data[0]) * 8;
	__u64 index = bit / bits_per_byte;
	int shift = bit % bits_per_byte;

	return ((data[index] >> shift) & 1) != 0;
}
928c2ecf20Sopenharmony_ci
/*
 * Set bit number @bit in the byte array @data. Bits are counted from the
 * least significant bit of data[0] upwards; other bits are left untouched.
 */
static inline void ubd_set_bit(__u64 bit, unsigned char *data)
{
	const int bits_per_byte = sizeof(data[0]) * 8;
	unsigned char *byte = &data[bit / bits_per_byte];

	*byte |= (1 << (bit % bits_per_byte));
}
1038c2ecf20Sopenharmony_ci/*End stuff from ubd_user.h*/
1048c2ecf20Sopenharmony_ci
1058c2ecf20Sopenharmony_ci#define DRIVER_NAME "uml-blkdev"
1068c2ecf20Sopenharmony_ci
1078c2ecf20Sopenharmony_cistatic DEFINE_MUTEX(ubd_lock);
1088c2ecf20Sopenharmony_cistatic DEFINE_MUTEX(ubd_mutex); /* replaces BKL, might not be needed */
1098c2ecf20Sopenharmony_ci
1108c2ecf20Sopenharmony_cistatic int ubd_open(struct block_device *bdev, fmode_t mode);
1118c2ecf20Sopenharmony_cistatic void ubd_release(struct gendisk *disk, fmode_t mode);
1128c2ecf20Sopenharmony_cistatic int ubd_ioctl(struct block_device *bdev, fmode_t mode,
1138c2ecf20Sopenharmony_ci		     unsigned int cmd, unsigned long arg);
1148c2ecf20Sopenharmony_cistatic int ubd_getgeo(struct block_device *bdev, struct hd_geometry *geo);
1158c2ecf20Sopenharmony_ci
1168c2ecf20Sopenharmony_ci#define MAX_DEV (16)
1178c2ecf20Sopenharmony_ci
1188c2ecf20Sopenharmony_cistatic const struct block_device_operations ubd_blops = {
1198c2ecf20Sopenharmony_ci        .owner		= THIS_MODULE,
1208c2ecf20Sopenharmony_ci        .open		= ubd_open,
1218c2ecf20Sopenharmony_ci        .release	= ubd_release,
1228c2ecf20Sopenharmony_ci        .ioctl		= ubd_ioctl,
1238c2ecf20Sopenharmony_ci        .compat_ioctl	= blkdev_compat_ptr_ioctl,
1248c2ecf20Sopenharmony_ci	.getgeo		= ubd_getgeo,
1258c2ecf20Sopenharmony_ci};
1268c2ecf20Sopenharmony_ci
1278c2ecf20Sopenharmony_ci/* Protected by ubd_lock */
1288c2ecf20Sopenharmony_cistatic int fake_major = UBD_MAJOR;
1298c2ecf20Sopenharmony_cistatic struct gendisk *ubd_gendisk[MAX_DEV];
1308c2ecf20Sopenharmony_cistatic struct gendisk *fake_gendisk[MAX_DEV];
1318c2ecf20Sopenharmony_ci
1328c2ecf20Sopenharmony_ci#ifdef CONFIG_BLK_DEV_UBD_SYNC
1338c2ecf20Sopenharmony_ci#define OPEN_FLAGS ((struct openflags) { .r = 1, .w = 1, .s = 1, .c = 0, \
1348c2ecf20Sopenharmony_ci					 .cl = 1 })
1358c2ecf20Sopenharmony_ci#else
1368c2ecf20Sopenharmony_ci#define OPEN_FLAGS ((struct openflags) { .r = 1, .w = 1, .s = 0, .c = 0, \
1378c2ecf20Sopenharmony_ci					 .cl = 1 })
1388c2ecf20Sopenharmony_ci#endif
1398c2ecf20Sopenharmony_cistatic struct openflags global_openflags = OPEN_FLAGS;
1408c2ecf20Sopenharmony_ci
/* Copy-on-write state of a device: the backing file and its bitmap. */
struct cow {
	char *file;			/* backing file name */
	int fd;				/* backing file fd */
	unsigned long *bitmap;
	unsigned long bitmap_len;
	int bitmap_offset;
	int data_offset;
};
1518c2ecf20Sopenharmony_ci
1528c2ecf20Sopenharmony_ci#define MAX_SG 64
1538c2ecf20Sopenharmony_ci
1548c2ecf20Sopenharmony_cistruct ubd {
1558c2ecf20Sopenharmony_ci	/* name (and fd, below) of the file opened for writing, either the
1568c2ecf20Sopenharmony_ci	 * backing or the cow file. */
1578c2ecf20Sopenharmony_ci	char *file;
1588c2ecf20Sopenharmony_ci	int count;
1598c2ecf20Sopenharmony_ci	int fd;
1608c2ecf20Sopenharmony_ci	__u64 size;
1618c2ecf20Sopenharmony_ci	struct openflags boot_openflags;
1628c2ecf20Sopenharmony_ci	struct openflags openflags;
1638c2ecf20Sopenharmony_ci	unsigned shared:1;
1648c2ecf20Sopenharmony_ci	unsigned no_cow:1;
1658c2ecf20Sopenharmony_ci	unsigned no_trim:1;
1668c2ecf20Sopenharmony_ci	struct cow cow;
1678c2ecf20Sopenharmony_ci	struct platform_device pdev;
1688c2ecf20Sopenharmony_ci	struct request_queue *queue;
1698c2ecf20Sopenharmony_ci	struct blk_mq_tag_set tag_set;
1708c2ecf20Sopenharmony_ci	spinlock_t lock;
1718c2ecf20Sopenharmony_ci};
1728c2ecf20Sopenharmony_ci
1738c2ecf20Sopenharmony_ci#define DEFAULT_COW { \
1748c2ecf20Sopenharmony_ci	.file =			NULL, \
1758c2ecf20Sopenharmony_ci	.fd =			-1,	\
1768c2ecf20Sopenharmony_ci	.bitmap =		NULL, \
1778c2ecf20Sopenharmony_ci	.bitmap_offset =	0, \
1788c2ecf20Sopenharmony_ci	.data_offset =		0, \
1798c2ecf20Sopenharmony_ci}
1808c2ecf20Sopenharmony_ci
1818c2ecf20Sopenharmony_ci#define DEFAULT_UBD { \
1828c2ecf20Sopenharmony_ci	.file = 		NULL, \
1838c2ecf20Sopenharmony_ci	.count =		0, \
1848c2ecf20Sopenharmony_ci	.fd =			-1, \
1858c2ecf20Sopenharmony_ci	.size =			-1, \
1868c2ecf20Sopenharmony_ci	.boot_openflags =	OPEN_FLAGS, \
1878c2ecf20Sopenharmony_ci	.openflags =		OPEN_FLAGS, \
1888c2ecf20Sopenharmony_ci	.no_cow =               0, \
1898c2ecf20Sopenharmony_ci	.no_trim =		0, \
1908c2ecf20Sopenharmony_ci	.shared =		0, \
1918c2ecf20Sopenharmony_ci	.cow =			DEFAULT_COW, \
1928c2ecf20Sopenharmony_ci	.lock =			__SPIN_LOCK_UNLOCKED(ubd_devs.lock), \
1938c2ecf20Sopenharmony_ci}
1948c2ecf20Sopenharmony_ci
1958c2ecf20Sopenharmony_ci/* Protected by ubd_lock */
1968c2ecf20Sopenharmony_cistatic struct ubd ubd_devs[MAX_DEV] = { [0 ... MAX_DEV - 1] = DEFAULT_UBD };
1978c2ecf20Sopenharmony_ci
1988c2ecf20Sopenharmony_ci/* Only changed by fake_ide_setup which is a setup */
1998c2ecf20Sopenharmony_cistatic int fake_ide = 0;
2008c2ecf20Sopenharmony_cistatic struct proc_dir_entry *proc_ide_root = NULL;
2018c2ecf20Sopenharmony_cistatic struct proc_dir_entry *proc_ide = NULL;
2028c2ecf20Sopenharmony_ci
2038c2ecf20Sopenharmony_cistatic blk_status_t ubd_queue_rq(struct blk_mq_hw_ctx *hctx,
2048c2ecf20Sopenharmony_ci				 const struct blk_mq_queue_data *bd);
2058c2ecf20Sopenharmony_ci
2068c2ecf20Sopenharmony_cistatic void make_proc_ide(void)
2078c2ecf20Sopenharmony_ci{
2088c2ecf20Sopenharmony_ci	proc_ide_root = proc_mkdir("ide", NULL);
2098c2ecf20Sopenharmony_ci	proc_ide = proc_mkdir("ide0", proc_ide_root);
2108c2ecf20Sopenharmony_ci}
2118c2ecf20Sopenharmony_ci
/* seq_file show callback of the fake "media" entry: always reports "disk". */
static int fake_ide_media_proc_show(struct seq_file *m, void *v)
{
	seq_puts(m, "disk\n");
	return 0;
}
2178c2ecf20Sopenharmony_ci
2188c2ecf20Sopenharmony_cistatic void make_ide_entries(const char *dev_name)
2198c2ecf20Sopenharmony_ci{
2208c2ecf20Sopenharmony_ci	struct proc_dir_entry *dir, *ent;
2218c2ecf20Sopenharmony_ci	char name[64];
2228c2ecf20Sopenharmony_ci
2238c2ecf20Sopenharmony_ci	if(proc_ide_root == NULL) make_proc_ide();
2248c2ecf20Sopenharmony_ci
2258c2ecf20Sopenharmony_ci	dir = proc_mkdir(dev_name, proc_ide);
2268c2ecf20Sopenharmony_ci	if(!dir) return;
2278c2ecf20Sopenharmony_ci
2288c2ecf20Sopenharmony_ci	ent = proc_create_single("media", S_IRUGO, dir,
2298c2ecf20Sopenharmony_ci			fake_ide_media_proc_show);
2308c2ecf20Sopenharmony_ci	if(!ent) return;
2318c2ecf20Sopenharmony_ci	snprintf(name, sizeof(name), "ide0/%s", dev_name);
2328c2ecf20Sopenharmony_ci	proc_symlink(dev_name, proc_ide_root, name);
2338c2ecf20Sopenharmony_ci}
2348c2ecf20Sopenharmony_ci
2358c2ecf20Sopenharmony_cistatic int fake_ide_setup(char *str)
2368c2ecf20Sopenharmony_ci{
2378c2ecf20Sopenharmony_ci	fake_ide = 1;
2388c2ecf20Sopenharmony_ci	return 1;
2398c2ecf20Sopenharmony_ci}
2408c2ecf20Sopenharmony_ci
2418c2ecf20Sopenharmony_ci__setup("fake_ide", fake_ide_setup);
2428c2ecf20Sopenharmony_ci
2438c2ecf20Sopenharmony_ci__uml_help(fake_ide_setup,
2448c2ecf20Sopenharmony_ci"fake_ide\n"
2458c2ecf20Sopenharmony_ci"    Create ide0 entries that map onto ubd devices.\n\n"
2468c2ecf20Sopenharmony_ci);
2478c2ecf20Sopenharmony_ci
/*
 * Parse a unit designator at *ptr: either a number (base auto-detected by
 * simple_strtoul) or a single lowercase letter, 'a' meaning unit 0.
 *
 * On success *ptr is advanced past the designator and the unit number is
 * returned; otherwise *ptr is left alone and -1 is returned.
 */
static int parse_unit(char **ptr)
{
	char *cur = *ptr;
	char *stop;
	int unit;

	if (isdigit(*cur)) {
		unit = simple_strtoul(cur, &stop, 0);
		if (stop == cur)
			return -1;
		*ptr = stop;
		return unit;
	}

	if ((*cur >= 'a') && (*cur <= 'z')) {
		*ptr = cur + 1;
		return *cur - 'a';
	}

	return -1;
}
2668c2ecf20Sopenharmony_ci
2678c2ecf20Sopenharmony_ci/* If *index_out == -1 at exit, the passed option was a general one;
2688c2ecf20Sopenharmony_ci * otherwise, the str pointer is used (and owned) inside ubd_devs array, so it
2698c2ecf20Sopenharmony_ci * should not be freed on exit.
2708c2ecf20Sopenharmony_ci */
2718c2ecf20Sopenharmony_cistatic int ubd_setup_common(char *str, int *index_out, char **error_out)
2728c2ecf20Sopenharmony_ci{
2738c2ecf20Sopenharmony_ci	struct ubd *ubd_dev;
2748c2ecf20Sopenharmony_ci	struct openflags flags = global_openflags;
2758c2ecf20Sopenharmony_ci	char *backing_file;
2768c2ecf20Sopenharmony_ci	int n, err = 0, i;
2778c2ecf20Sopenharmony_ci
2788c2ecf20Sopenharmony_ci	if(index_out) *index_out = -1;
2798c2ecf20Sopenharmony_ci	n = *str;
2808c2ecf20Sopenharmony_ci	if(n == '='){
2818c2ecf20Sopenharmony_ci		char *end;
2828c2ecf20Sopenharmony_ci		int major;
2838c2ecf20Sopenharmony_ci
2848c2ecf20Sopenharmony_ci		str++;
2858c2ecf20Sopenharmony_ci		if(!strcmp(str, "sync")){
2868c2ecf20Sopenharmony_ci			global_openflags = of_sync(global_openflags);
2878c2ecf20Sopenharmony_ci			return err;
2888c2ecf20Sopenharmony_ci		}
2898c2ecf20Sopenharmony_ci
2908c2ecf20Sopenharmony_ci		err = -EINVAL;
2918c2ecf20Sopenharmony_ci		major = simple_strtoul(str, &end, 0);
2928c2ecf20Sopenharmony_ci		if((*end != '\0') || (end == str)){
2938c2ecf20Sopenharmony_ci			*error_out = "Didn't parse major number";
2948c2ecf20Sopenharmony_ci			return err;
2958c2ecf20Sopenharmony_ci		}
2968c2ecf20Sopenharmony_ci
2978c2ecf20Sopenharmony_ci		mutex_lock(&ubd_lock);
2988c2ecf20Sopenharmony_ci		if (fake_major != UBD_MAJOR) {
2998c2ecf20Sopenharmony_ci			*error_out = "Can't assign a fake major twice";
3008c2ecf20Sopenharmony_ci			goto out1;
3018c2ecf20Sopenharmony_ci		}
3028c2ecf20Sopenharmony_ci
3038c2ecf20Sopenharmony_ci		fake_major = major;
3048c2ecf20Sopenharmony_ci
3058c2ecf20Sopenharmony_ci		printk(KERN_INFO "Setting extra ubd major number to %d\n",
3068c2ecf20Sopenharmony_ci		       major);
3078c2ecf20Sopenharmony_ci		err = 0;
3088c2ecf20Sopenharmony_ci	out1:
3098c2ecf20Sopenharmony_ci		mutex_unlock(&ubd_lock);
3108c2ecf20Sopenharmony_ci		return err;
3118c2ecf20Sopenharmony_ci	}
3128c2ecf20Sopenharmony_ci
3138c2ecf20Sopenharmony_ci	n = parse_unit(&str);
3148c2ecf20Sopenharmony_ci	if(n < 0){
3158c2ecf20Sopenharmony_ci		*error_out = "Couldn't parse device number";
3168c2ecf20Sopenharmony_ci		return -EINVAL;
3178c2ecf20Sopenharmony_ci	}
3188c2ecf20Sopenharmony_ci	if(n >= MAX_DEV){
3198c2ecf20Sopenharmony_ci		*error_out = "Device number out of range";
3208c2ecf20Sopenharmony_ci		return 1;
3218c2ecf20Sopenharmony_ci	}
3228c2ecf20Sopenharmony_ci
3238c2ecf20Sopenharmony_ci	err = -EBUSY;
3248c2ecf20Sopenharmony_ci	mutex_lock(&ubd_lock);
3258c2ecf20Sopenharmony_ci
3268c2ecf20Sopenharmony_ci	ubd_dev = &ubd_devs[n];
3278c2ecf20Sopenharmony_ci	if(ubd_dev->file != NULL){
3288c2ecf20Sopenharmony_ci		*error_out = "Device is already configured";
3298c2ecf20Sopenharmony_ci		goto out;
3308c2ecf20Sopenharmony_ci	}
3318c2ecf20Sopenharmony_ci
3328c2ecf20Sopenharmony_ci	if (index_out)
3338c2ecf20Sopenharmony_ci		*index_out = n;
3348c2ecf20Sopenharmony_ci
3358c2ecf20Sopenharmony_ci	err = -EINVAL;
3368c2ecf20Sopenharmony_ci	for (i = 0; i < sizeof("rscdt="); i++) {
3378c2ecf20Sopenharmony_ci		switch (*str) {
3388c2ecf20Sopenharmony_ci		case 'r':
3398c2ecf20Sopenharmony_ci			flags.w = 0;
3408c2ecf20Sopenharmony_ci			break;
3418c2ecf20Sopenharmony_ci		case 's':
3428c2ecf20Sopenharmony_ci			flags.s = 1;
3438c2ecf20Sopenharmony_ci			break;
3448c2ecf20Sopenharmony_ci		case 'd':
3458c2ecf20Sopenharmony_ci			ubd_dev->no_cow = 1;
3468c2ecf20Sopenharmony_ci			break;
3478c2ecf20Sopenharmony_ci		case 'c':
3488c2ecf20Sopenharmony_ci			ubd_dev->shared = 1;
3498c2ecf20Sopenharmony_ci			break;
3508c2ecf20Sopenharmony_ci		case 't':
3518c2ecf20Sopenharmony_ci			ubd_dev->no_trim = 1;
3528c2ecf20Sopenharmony_ci			break;
3538c2ecf20Sopenharmony_ci		case '=':
3548c2ecf20Sopenharmony_ci			str++;
3558c2ecf20Sopenharmony_ci			goto break_loop;
3568c2ecf20Sopenharmony_ci		default:
3578c2ecf20Sopenharmony_ci			*error_out = "Expected '=' or flag letter "
3588c2ecf20Sopenharmony_ci				"(r, s, c, t or d)";
3598c2ecf20Sopenharmony_ci			goto out;
3608c2ecf20Sopenharmony_ci		}
3618c2ecf20Sopenharmony_ci		str++;
3628c2ecf20Sopenharmony_ci	}
3638c2ecf20Sopenharmony_ci
3648c2ecf20Sopenharmony_ci	if (*str == '=')
3658c2ecf20Sopenharmony_ci		*error_out = "Too many flags specified";
3668c2ecf20Sopenharmony_ci	else
3678c2ecf20Sopenharmony_ci		*error_out = "Missing '='";
3688c2ecf20Sopenharmony_ci	goto out;
3698c2ecf20Sopenharmony_ci
3708c2ecf20Sopenharmony_cibreak_loop:
3718c2ecf20Sopenharmony_ci	backing_file = strchr(str, ',');
3728c2ecf20Sopenharmony_ci
3738c2ecf20Sopenharmony_ci	if (backing_file == NULL)
3748c2ecf20Sopenharmony_ci		backing_file = strchr(str, ':');
3758c2ecf20Sopenharmony_ci
3768c2ecf20Sopenharmony_ci	if(backing_file != NULL){
3778c2ecf20Sopenharmony_ci		if(ubd_dev->no_cow){
3788c2ecf20Sopenharmony_ci			*error_out = "Can't specify both 'd' and a cow file";
3798c2ecf20Sopenharmony_ci			goto out;
3808c2ecf20Sopenharmony_ci		}
3818c2ecf20Sopenharmony_ci		else {
3828c2ecf20Sopenharmony_ci			*backing_file = '\0';
3838c2ecf20Sopenharmony_ci			backing_file++;
3848c2ecf20Sopenharmony_ci		}
3858c2ecf20Sopenharmony_ci	}
3868c2ecf20Sopenharmony_ci	err = 0;
3878c2ecf20Sopenharmony_ci	ubd_dev->file = str;
3888c2ecf20Sopenharmony_ci	ubd_dev->cow.file = backing_file;
3898c2ecf20Sopenharmony_ci	ubd_dev->boot_openflags = flags;
3908c2ecf20Sopenharmony_ciout:
3918c2ecf20Sopenharmony_ci	mutex_unlock(&ubd_lock);
3928c2ecf20Sopenharmony_ci	return err;
3938c2ecf20Sopenharmony_ci}
3948c2ecf20Sopenharmony_ci
3958c2ecf20Sopenharmony_cistatic int ubd_setup(char *str)
3968c2ecf20Sopenharmony_ci{
3978c2ecf20Sopenharmony_ci	char *error;
3988c2ecf20Sopenharmony_ci	int err;
3998c2ecf20Sopenharmony_ci
4008c2ecf20Sopenharmony_ci	err = ubd_setup_common(str, NULL, &error);
4018c2ecf20Sopenharmony_ci	if(err)
4028c2ecf20Sopenharmony_ci		printk(KERN_ERR "Failed to initialize device with \"%s\" : "
4038c2ecf20Sopenharmony_ci		       "%s\n", str, error);
4048c2ecf20Sopenharmony_ci	return 1;
4058c2ecf20Sopenharmony_ci}
4068c2ecf20Sopenharmony_ci
4078c2ecf20Sopenharmony_ci__setup("ubd", ubd_setup);
4088c2ecf20Sopenharmony_ci__uml_help(ubd_setup,
4098c2ecf20Sopenharmony_ci"ubd<n><flags>=<filename>[(:|,)<filename2>]\n"
4108c2ecf20Sopenharmony_ci"    This is used to associate a device with a file in the underlying\n"
4118c2ecf20Sopenharmony_ci"    filesystem. When specifying two filenames, the first one is the\n"
4128c2ecf20Sopenharmony_ci"    COW name and the second is the backing file name. As separator you can\n"
4138c2ecf20Sopenharmony_ci"    use either a ':' or a ',': the first one allows writing things like;\n"
4148c2ecf20Sopenharmony_ci"	ubd0=~/Uml/root_cow:~/Uml/root_backing_file\n"
4158c2ecf20Sopenharmony_ci"    while with a ',' the shell would not expand the 2nd '~'.\n"
4168c2ecf20Sopenharmony_ci"    When using only one filename, UML will detect whether to treat it like\n"
4178c2ecf20Sopenharmony_ci"    a COW file or a backing file. To override this detection, add the 'd'\n"
4188c2ecf20Sopenharmony_ci"    flag:\n"
4198c2ecf20Sopenharmony_ci"	ubd0d=BackingFile\n"
4208c2ecf20Sopenharmony_ci"    Usually, there is a filesystem in the file, but \n"
4218c2ecf20Sopenharmony_ci"    that's not required. Swap devices containing swap files can be\n"
4228c2ecf20Sopenharmony_ci"    specified like this. Also, a file which doesn't contain a\n"
4238c2ecf20Sopenharmony_ci"    filesystem can have its contents read in the virtual \n"
4248c2ecf20Sopenharmony_ci"    machine by running 'dd' on the device. <n> must be in the range\n"
4258c2ecf20Sopenharmony_ci"    0 to 7. Appending an 'r' to the number will cause that device\n"
4268c2ecf20Sopenharmony_ci"    to be mounted read-only. For example ubd1r=./ext_fs. Appending\n"
4278c2ecf20Sopenharmony_ci"    an 's' will cause data to be written to disk on the host immediately.\n"
4288c2ecf20Sopenharmony_ci"    'c' will cause the device to be treated as being shared between multiple\n"
4298c2ecf20Sopenharmony_ci"    UMLs and file locking will be turned off - this is appropriate for a\n"
4308c2ecf20Sopenharmony_ci"    cluster filesystem and inappropriate at almost all other times.\n\n"
4318c2ecf20Sopenharmony_ci"    't' will disable trim/discard support on the device (enabled by default).\n\n"
4328c2ecf20Sopenharmony_ci);
4338c2ecf20Sopenharmony_ci
4348c2ecf20Sopenharmony_cistatic int udb_setup(char *str)
4358c2ecf20Sopenharmony_ci{
4368c2ecf20Sopenharmony_ci	printk("udb%s specified on command line is almost certainly a ubd -> "
4378c2ecf20Sopenharmony_ci	       "udb TYPO\n", str);
4388c2ecf20Sopenharmony_ci	return 1;
4398c2ecf20Sopenharmony_ci}
4408c2ecf20Sopenharmony_ci
4418c2ecf20Sopenharmony_ci__setup("udb", udb_setup);
4428c2ecf20Sopenharmony_ci__uml_help(udb_setup,
4438c2ecf20Sopenharmony_ci"udb\n"
4448c2ecf20Sopenharmony_ci"    This option is here solely to catch ubd -> udb typos, which can be\n"
4458c2ecf20Sopenharmony_ci"    to impossible to catch visually unless you specifically look for\n"
4468c2ecf20Sopenharmony_ci"    them.  The only result of any option starting with 'udb' is an error\n"
4478c2ecf20Sopenharmony_ci"    in the boot output.\n\n"
4488c2ecf20Sopenharmony_ci);
4498c2ecf20Sopenharmony_ci
/*
 * Descriptor ubd_handler() reads completed requests from.
 * Only changed by ubd_init, which is an initcall.
 */
static int thread_fd = -1;
4528c2ecf20Sopenharmony_ci
/*
 * Read several request pointers at a time from @fd, handling fractional
 * reads if (and as) needed.
 *
 * @fd:             descriptor to read from.
 * @request_buffer: destination with room for @max_recs pointers.
 * @remainder:      storage for the leading bytes of a pointer that was only
 *                  partially read; the bytes are kept in the object that
 *                  @remainder points at.
 * @remainder_size: number of valid bytes held in @remainder; updated here.
 * @max_recs:       capacity of @request_buffer, in pointers.
 *
 * Returns the number of bytes of complete pointers now stored at the start
 * of @request_buffer (this may be 0), or the non-positive result of
 * os_read_file() when nothing was read. In the latter case a pending
 * fragment is kept for the next call.
 */
static int bulk_req_safe_read(
	int fd,
	struct io_thread_req * (*request_buffer)[],
	struct io_thread_req **remainder,
	int *remainder_size,
	int max_recs
	)
{
	const size_t ptr_size = sizeof(struct io_thread_req *);
	int n = 0;
	int res = 0;

	/* Put the fragment saved by the previous call in front of new data. */
	if (*remainder_size > 0) {
		memmove(
			(char *) request_buffer,
			(char *) remainder, *remainder_size
		);
		n = *remainder_size;
	}

	res = os_read_file(
			fd,
			((char *) request_buffer) + *remainder_size,
			ptr_size * max_recs - *remainder_size
		);
	if (res <= 0)
		return res;

	n += res;

	/*
	 * Record the new fragment length even when it is zero. Leaving the old
	 * value behind once a fragment has been completed would prepend the
	 * same stale bytes again on every following call.
	 */
	*remainder_size = n % ptr_size;
	if (*remainder_size > 0) {
		/*
		 * Read somehow returned not a multiple of dword
		 * theoretically possible, but never observed in the
		 * wild, so read routine must be able to handle it
		 */
		WARN(1, "UBD IPC read returned a partial result");
		memmove(
			remainder,
			((char *) request_buffer) + (n - *remainder_size),
			*remainder_size
		);
		n -= *remainder_size;
	}
	return n;
}
5058c2ecf20Sopenharmony_ci
5068c2ecf20Sopenharmony_ci/* Called without dev->lock held, and only in interrupt context. */
5078c2ecf20Sopenharmony_cistatic void ubd_handler(void)
5088c2ecf20Sopenharmony_ci{
5098c2ecf20Sopenharmony_ci	int n;
5108c2ecf20Sopenharmony_ci	int count;
5118c2ecf20Sopenharmony_ci
5128c2ecf20Sopenharmony_ci	while(1){
5138c2ecf20Sopenharmony_ci		n = bulk_req_safe_read(
5148c2ecf20Sopenharmony_ci			thread_fd,
5158c2ecf20Sopenharmony_ci			irq_req_buffer,
5168c2ecf20Sopenharmony_ci			&irq_remainder,
5178c2ecf20Sopenharmony_ci			&irq_remainder_size,
5188c2ecf20Sopenharmony_ci			UBD_REQ_BUFFER_SIZE
5198c2ecf20Sopenharmony_ci		);
5208c2ecf20Sopenharmony_ci		if (n < 0) {
5218c2ecf20Sopenharmony_ci			if(n == -EAGAIN)
5228c2ecf20Sopenharmony_ci				break;
5238c2ecf20Sopenharmony_ci			printk(KERN_ERR "spurious interrupt in ubd_handler, "
5248c2ecf20Sopenharmony_ci			       "err = %d\n", -n);
5258c2ecf20Sopenharmony_ci			return;
5268c2ecf20Sopenharmony_ci		}
5278c2ecf20Sopenharmony_ci		for (count = 0; count < n/sizeof(struct io_thread_req *); count++) {
5288c2ecf20Sopenharmony_ci			struct io_thread_req *io_req = (*irq_req_buffer)[count];
5298c2ecf20Sopenharmony_ci
5308c2ecf20Sopenharmony_ci			if ((io_req->error == BLK_STS_NOTSUPP) && (req_op(io_req->req) == REQ_OP_DISCARD)) {
5318c2ecf20Sopenharmony_ci				blk_queue_max_discard_sectors(io_req->req->q, 0);
5328c2ecf20Sopenharmony_ci				blk_queue_max_write_zeroes_sectors(io_req->req->q, 0);
5338c2ecf20Sopenharmony_ci				blk_queue_flag_clear(QUEUE_FLAG_DISCARD, io_req->req->q);
5348c2ecf20Sopenharmony_ci			}
5358c2ecf20Sopenharmony_ci			blk_mq_end_request(io_req->req, io_req->error);
5368c2ecf20Sopenharmony_ci			kfree(io_req);
5378c2ecf20Sopenharmony_ci		}
5388c2ecf20Sopenharmony_ci	}
5398c2ecf20Sopenharmony_ci}
5408c2ecf20Sopenharmony_ci
5418c2ecf20Sopenharmony_cistatic irqreturn_t ubd_intr(int irq, void *dev)
5428c2ecf20Sopenharmony_ci{
5438c2ecf20Sopenharmony_ci	ubd_handler();
5448c2ecf20Sopenharmony_ci	return IRQ_HANDLED;
5458c2ecf20Sopenharmony_ci}
5468c2ecf20Sopenharmony_ci
/* Only changed by ubd_init, which is an initcall. */
static int io_pid = -1;

/* Exit hook: kill the I/O thread if one was recorded in io_pid. */
static void kill_io_thread(void)
{
	if (io_pid == -1)
		return;

	os_kill_process(io_pid, 1);
}

__uml_exitcall(kill_io_thread);
5578c2ecf20Sopenharmony_ci
5588c2ecf20Sopenharmony_cistatic inline int ubd_file_size(struct ubd *ubd_dev, __u64 *size_out)
5598c2ecf20Sopenharmony_ci{
5608c2ecf20Sopenharmony_ci	char *file;
5618c2ecf20Sopenharmony_ci	int fd;
5628c2ecf20Sopenharmony_ci	int err;
5638c2ecf20Sopenharmony_ci
5648c2ecf20Sopenharmony_ci	__u32 version;
5658c2ecf20Sopenharmony_ci	__u32 align;
5668c2ecf20Sopenharmony_ci	char *backing_file;
5678c2ecf20Sopenharmony_ci	time64_t mtime;
5688c2ecf20Sopenharmony_ci	unsigned long long size;
5698c2ecf20Sopenharmony_ci	int sector_size;
5708c2ecf20Sopenharmony_ci	int bitmap_offset;
5718c2ecf20Sopenharmony_ci
5728c2ecf20Sopenharmony_ci	if (ubd_dev->file && ubd_dev->cow.file) {
5738c2ecf20Sopenharmony_ci		file = ubd_dev->cow.file;
5748c2ecf20Sopenharmony_ci
5758c2ecf20Sopenharmony_ci		goto out;
5768c2ecf20Sopenharmony_ci	}
5778c2ecf20Sopenharmony_ci
5788c2ecf20Sopenharmony_ci	fd = os_open_file(ubd_dev->file, of_read(OPENFLAGS()), 0);
5798c2ecf20Sopenharmony_ci	if (fd < 0)
5808c2ecf20Sopenharmony_ci		return fd;
5818c2ecf20Sopenharmony_ci
5828c2ecf20Sopenharmony_ci	err = read_cow_header(file_reader, &fd, &version, &backing_file, \
5838c2ecf20Sopenharmony_ci		&mtime, &size, &sector_size, &align, &bitmap_offset);
5848c2ecf20Sopenharmony_ci	os_close_file(fd);
5858c2ecf20Sopenharmony_ci
5868c2ecf20Sopenharmony_ci	if(err == -EINVAL)
5878c2ecf20Sopenharmony_ci		file = ubd_dev->file;
5888c2ecf20Sopenharmony_ci	else
5898c2ecf20Sopenharmony_ci		file = backing_file;
5908c2ecf20Sopenharmony_ci
5918c2ecf20Sopenharmony_ciout:
5928c2ecf20Sopenharmony_ci	return os_file_size(file, size_out);
5938c2ecf20Sopenharmony_ci}
5948c2ecf20Sopenharmony_ci
/*
 * Read @len bytes at @offset of @fd into @buf.
 *
 * Returns 0 unless os_pread_file() reports a negative error, which is
 * passed through; the number of bytes actually read is not checked.
 */
static int read_cow_bitmap(int fd, void *buf, int offset, int len)
{
	int ret = os_pread_file(fd, buf, len, offset);

	return (ret < 0) ? ret : 0;
}
6058c2ecf20Sopenharmony_ci
6068c2ecf20Sopenharmony_cistatic int backing_file_mismatch(char *file, __u64 size, time64_t mtime)
6078c2ecf20Sopenharmony_ci{
6088c2ecf20Sopenharmony_ci	time64_t modtime;
6098c2ecf20Sopenharmony_ci	unsigned long long actual;
6108c2ecf20Sopenharmony_ci	int err;
6118c2ecf20Sopenharmony_ci
6128c2ecf20Sopenharmony_ci	err = os_file_modtime(file, &modtime);
6138c2ecf20Sopenharmony_ci	if (err < 0) {
6148c2ecf20Sopenharmony_ci		printk(KERN_ERR "Failed to get modification time of backing "
6158c2ecf20Sopenharmony_ci		       "file \"%s\", err = %d\n", file, -err);
6168c2ecf20Sopenharmony_ci		return err;
6178c2ecf20Sopenharmony_ci	}
6188c2ecf20Sopenharmony_ci
6198c2ecf20Sopenharmony_ci	err = os_file_size(file, &actual);
6208c2ecf20Sopenharmony_ci	if (err < 0) {
6218c2ecf20Sopenharmony_ci		printk(KERN_ERR "Failed to get size of backing file \"%s\", "
6228c2ecf20Sopenharmony_ci		       "err = %d\n", file, -err);
6238c2ecf20Sopenharmony_ci		return err;
6248c2ecf20Sopenharmony_ci	}
6258c2ecf20Sopenharmony_ci
6268c2ecf20Sopenharmony_ci	if (actual != size) {
6278c2ecf20Sopenharmony_ci		/*__u64 can be a long on AMD64 and with %lu GCC complains; so
6288c2ecf20Sopenharmony_ci		 * the typecast.*/
6298c2ecf20Sopenharmony_ci		printk(KERN_ERR "Size mismatch (%llu vs %llu) of COW header "
6308c2ecf20Sopenharmony_ci		       "vs backing file\n", (unsigned long long) size, actual);
6318c2ecf20Sopenharmony_ci		return -EINVAL;
6328c2ecf20Sopenharmony_ci	}
6338c2ecf20Sopenharmony_ci	if (modtime != mtime) {
6348c2ecf20Sopenharmony_ci		printk(KERN_ERR "mtime mismatch (%lld vs %lld) of COW header vs "
6358c2ecf20Sopenharmony_ci		       "backing file\n", mtime, modtime);
6368c2ecf20Sopenharmony_ci		return -EINVAL;
6378c2ecf20Sopenharmony_ci	}
6388c2ecf20Sopenharmony_ci	return 0;
6398c2ecf20Sopenharmony_ci}
6408c2ecf20Sopenharmony_ci
6418c2ecf20Sopenharmony_cistatic int path_requires_switch(char *from_cmdline, char *from_cow, char *cow)
6428c2ecf20Sopenharmony_ci{
6438c2ecf20Sopenharmony_ci	struct uml_stat buf1, buf2;
6448c2ecf20Sopenharmony_ci	int err;
6458c2ecf20Sopenharmony_ci
6468c2ecf20Sopenharmony_ci	if (from_cmdline == NULL)
6478c2ecf20Sopenharmony_ci		return 0;
6488c2ecf20Sopenharmony_ci	if (!strcmp(from_cmdline, from_cow))
6498c2ecf20Sopenharmony_ci		return 0;
6508c2ecf20Sopenharmony_ci
6518c2ecf20Sopenharmony_ci	err = os_stat_file(from_cmdline, &buf1);
6528c2ecf20Sopenharmony_ci	if (err < 0) {
6538c2ecf20Sopenharmony_ci		printk(KERN_ERR "Couldn't stat '%s', err = %d\n", from_cmdline,
6548c2ecf20Sopenharmony_ci		       -err);
6558c2ecf20Sopenharmony_ci		return 0;
6568c2ecf20Sopenharmony_ci	}
6578c2ecf20Sopenharmony_ci	err = os_stat_file(from_cow, &buf2);
6588c2ecf20Sopenharmony_ci	if (err < 0) {
6598c2ecf20Sopenharmony_ci		printk(KERN_ERR "Couldn't stat '%s', err = %d\n", from_cow,
6608c2ecf20Sopenharmony_ci		       -err);
6618c2ecf20Sopenharmony_ci		return 1;
6628c2ecf20Sopenharmony_ci	}
6638c2ecf20Sopenharmony_ci	if ((buf1.ust_dev == buf2.ust_dev) && (buf1.ust_ino == buf2.ust_ino))
6648c2ecf20Sopenharmony_ci		return 0;
6658c2ecf20Sopenharmony_ci
6668c2ecf20Sopenharmony_ci	printk(KERN_ERR "Backing file mismatch - \"%s\" requested, "
6678c2ecf20Sopenharmony_ci	       "\"%s\" specified in COW header of \"%s\"\n",
6688c2ecf20Sopenharmony_ci	       from_cmdline, from_cow, cow);
6698c2ecf20Sopenharmony_ci	return 1;
6708c2ecf20Sopenharmony_ci}
6718c2ecf20Sopenharmony_ci
6728c2ecf20Sopenharmony_cistatic int open_ubd_file(char *file, struct openflags *openflags, int shared,
6738c2ecf20Sopenharmony_ci		  char **backing_file_out, int *bitmap_offset_out,
6748c2ecf20Sopenharmony_ci		  unsigned long *bitmap_len_out, int *data_offset_out,
6758c2ecf20Sopenharmony_ci		  int *create_cow_out)
6768c2ecf20Sopenharmony_ci{
6778c2ecf20Sopenharmony_ci	time64_t mtime;
6788c2ecf20Sopenharmony_ci	unsigned long long size;
6798c2ecf20Sopenharmony_ci	__u32 version, align;
6808c2ecf20Sopenharmony_ci	char *backing_file;
6818c2ecf20Sopenharmony_ci	int fd, err, sectorsize, asked_switch, mode = 0644;
6828c2ecf20Sopenharmony_ci
6838c2ecf20Sopenharmony_ci	fd = os_open_file(file, *openflags, mode);
6848c2ecf20Sopenharmony_ci	if (fd < 0) {
6858c2ecf20Sopenharmony_ci		if ((fd == -ENOENT) && (create_cow_out != NULL))
6868c2ecf20Sopenharmony_ci			*create_cow_out = 1;
6878c2ecf20Sopenharmony_ci		if (!openflags->w ||
6888c2ecf20Sopenharmony_ci		    ((fd != -EROFS) && (fd != -EACCES)))
6898c2ecf20Sopenharmony_ci			return fd;
6908c2ecf20Sopenharmony_ci		openflags->w = 0;
6918c2ecf20Sopenharmony_ci		fd = os_open_file(file, *openflags, mode);
6928c2ecf20Sopenharmony_ci		if (fd < 0)
6938c2ecf20Sopenharmony_ci			return fd;
6948c2ecf20Sopenharmony_ci	}
6958c2ecf20Sopenharmony_ci
6968c2ecf20Sopenharmony_ci	if (shared)
6978c2ecf20Sopenharmony_ci		printk(KERN_INFO "Not locking \"%s\" on the host\n", file);
6988c2ecf20Sopenharmony_ci	else {
6998c2ecf20Sopenharmony_ci		err = os_lock_file(fd, openflags->w);
7008c2ecf20Sopenharmony_ci		if (err < 0) {
7018c2ecf20Sopenharmony_ci			printk(KERN_ERR "Failed to lock '%s', err = %d\n",
7028c2ecf20Sopenharmony_ci			       file, -err);
7038c2ecf20Sopenharmony_ci			goto out_close;
7048c2ecf20Sopenharmony_ci		}
7058c2ecf20Sopenharmony_ci	}
7068c2ecf20Sopenharmony_ci
7078c2ecf20Sopenharmony_ci	/* Successful return case! */
7088c2ecf20Sopenharmony_ci	if (backing_file_out == NULL)
7098c2ecf20Sopenharmony_ci		return fd;
7108c2ecf20Sopenharmony_ci
7118c2ecf20Sopenharmony_ci	err = read_cow_header(file_reader, &fd, &version, &backing_file, &mtime,
7128c2ecf20Sopenharmony_ci			      &size, &sectorsize, &align, bitmap_offset_out);
7138c2ecf20Sopenharmony_ci	if (err && (*backing_file_out != NULL)) {
7148c2ecf20Sopenharmony_ci		printk(KERN_ERR "Failed to read COW header from COW file "
7158c2ecf20Sopenharmony_ci		       "\"%s\", errno = %d\n", file, -err);
7168c2ecf20Sopenharmony_ci		goto out_close;
7178c2ecf20Sopenharmony_ci	}
7188c2ecf20Sopenharmony_ci	if (err)
7198c2ecf20Sopenharmony_ci		return fd;
7208c2ecf20Sopenharmony_ci
7218c2ecf20Sopenharmony_ci	asked_switch = path_requires_switch(*backing_file_out, backing_file,
7228c2ecf20Sopenharmony_ci					    file);
7238c2ecf20Sopenharmony_ci
7248c2ecf20Sopenharmony_ci	/* Allow switching only if no mismatch. */
7258c2ecf20Sopenharmony_ci	if (asked_switch && !backing_file_mismatch(*backing_file_out, size,
7268c2ecf20Sopenharmony_ci						   mtime)) {
7278c2ecf20Sopenharmony_ci		printk(KERN_ERR "Switching backing file to '%s'\n",
7288c2ecf20Sopenharmony_ci		       *backing_file_out);
7298c2ecf20Sopenharmony_ci		err = write_cow_header(file, fd, *backing_file_out,
7308c2ecf20Sopenharmony_ci				       sectorsize, align, &size);
7318c2ecf20Sopenharmony_ci		if (err) {
7328c2ecf20Sopenharmony_ci			printk(KERN_ERR "Switch failed, errno = %d\n", -err);
7338c2ecf20Sopenharmony_ci			goto out_close;
7348c2ecf20Sopenharmony_ci		}
7358c2ecf20Sopenharmony_ci	} else {
7368c2ecf20Sopenharmony_ci		*backing_file_out = backing_file;
7378c2ecf20Sopenharmony_ci		err = backing_file_mismatch(*backing_file_out, size, mtime);
7388c2ecf20Sopenharmony_ci		if (err)
7398c2ecf20Sopenharmony_ci			goto out_close;
7408c2ecf20Sopenharmony_ci	}
7418c2ecf20Sopenharmony_ci
7428c2ecf20Sopenharmony_ci	cow_sizes(version, size, sectorsize, align, *bitmap_offset_out,
7438c2ecf20Sopenharmony_ci		  bitmap_len_out, data_offset_out);
7448c2ecf20Sopenharmony_ci
7458c2ecf20Sopenharmony_ci	return fd;
7468c2ecf20Sopenharmony_ci out_close:
7478c2ecf20Sopenharmony_ci	os_close_file(fd);
7488c2ecf20Sopenharmony_ci	return err;
7498c2ecf20Sopenharmony_ci}
7508c2ecf20Sopenharmony_ci
7518c2ecf20Sopenharmony_cistatic int create_cow_file(char *cow_file, char *backing_file,
7528c2ecf20Sopenharmony_ci		    struct openflags flags,
7538c2ecf20Sopenharmony_ci		    int sectorsize, int alignment, int *bitmap_offset_out,
7548c2ecf20Sopenharmony_ci		    unsigned long *bitmap_len_out, int *data_offset_out)
7558c2ecf20Sopenharmony_ci{
7568c2ecf20Sopenharmony_ci	int err, fd;
7578c2ecf20Sopenharmony_ci
7588c2ecf20Sopenharmony_ci	flags.c = 1;
7598c2ecf20Sopenharmony_ci	fd = open_ubd_file(cow_file, &flags, 0, NULL, NULL, NULL, NULL, NULL);
7608c2ecf20Sopenharmony_ci	if (fd < 0) {
7618c2ecf20Sopenharmony_ci		err = fd;
7628c2ecf20Sopenharmony_ci		printk(KERN_ERR "Open of COW file '%s' failed, errno = %d\n",
7638c2ecf20Sopenharmony_ci		       cow_file, -err);
7648c2ecf20Sopenharmony_ci		goto out;
7658c2ecf20Sopenharmony_ci	}
7668c2ecf20Sopenharmony_ci
7678c2ecf20Sopenharmony_ci	err = init_cow_file(fd, cow_file, backing_file, sectorsize, alignment,
7688c2ecf20Sopenharmony_ci			    bitmap_offset_out, bitmap_len_out,
7698c2ecf20Sopenharmony_ci			    data_offset_out);
7708c2ecf20Sopenharmony_ci	if (!err)
7718c2ecf20Sopenharmony_ci		return fd;
7728c2ecf20Sopenharmony_ci	os_close_file(fd);
7738c2ecf20Sopenharmony_ci out:
7748c2ecf20Sopenharmony_ci	return err;
7758c2ecf20Sopenharmony_ci}
7768c2ecf20Sopenharmony_ci
7778c2ecf20Sopenharmony_cistatic void ubd_close_dev(struct ubd *ubd_dev)
7788c2ecf20Sopenharmony_ci{
7798c2ecf20Sopenharmony_ci	os_close_file(ubd_dev->fd);
7808c2ecf20Sopenharmony_ci	if(ubd_dev->cow.file == NULL)
7818c2ecf20Sopenharmony_ci		return;
7828c2ecf20Sopenharmony_ci
7838c2ecf20Sopenharmony_ci	os_close_file(ubd_dev->cow.fd);
7848c2ecf20Sopenharmony_ci	vfree(ubd_dev->cow.bitmap);
7858c2ecf20Sopenharmony_ci	ubd_dev->cow.bitmap = NULL;
7868c2ecf20Sopenharmony_ci}
7878c2ecf20Sopenharmony_ci
7888c2ecf20Sopenharmony_cistatic int ubd_open_dev(struct ubd *ubd_dev)
7898c2ecf20Sopenharmony_ci{
7908c2ecf20Sopenharmony_ci	struct openflags flags;
7918c2ecf20Sopenharmony_ci	char **back_ptr;
7928c2ecf20Sopenharmony_ci	int err, create_cow, *create_ptr;
7938c2ecf20Sopenharmony_ci	int fd;
7948c2ecf20Sopenharmony_ci
7958c2ecf20Sopenharmony_ci	ubd_dev->openflags = ubd_dev->boot_openflags;
7968c2ecf20Sopenharmony_ci	create_cow = 0;
7978c2ecf20Sopenharmony_ci	create_ptr = (ubd_dev->cow.file != NULL) ? &create_cow : NULL;
7988c2ecf20Sopenharmony_ci	back_ptr = ubd_dev->no_cow ? NULL : &ubd_dev->cow.file;
7998c2ecf20Sopenharmony_ci
8008c2ecf20Sopenharmony_ci	fd = open_ubd_file(ubd_dev->file, &ubd_dev->openflags, ubd_dev->shared,
8018c2ecf20Sopenharmony_ci				back_ptr, &ubd_dev->cow.bitmap_offset,
8028c2ecf20Sopenharmony_ci				&ubd_dev->cow.bitmap_len, &ubd_dev->cow.data_offset,
8038c2ecf20Sopenharmony_ci				create_ptr);
8048c2ecf20Sopenharmony_ci
8058c2ecf20Sopenharmony_ci	if((fd == -ENOENT) && create_cow){
8068c2ecf20Sopenharmony_ci		fd = create_cow_file(ubd_dev->file, ubd_dev->cow.file,
8078c2ecf20Sopenharmony_ci					  ubd_dev->openflags, SECTOR_SIZE, PAGE_SIZE,
8088c2ecf20Sopenharmony_ci					  &ubd_dev->cow.bitmap_offset,
8098c2ecf20Sopenharmony_ci					  &ubd_dev->cow.bitmap_len,
8108c2ecf20Sopenharmony_ci					  &ubd_dev->cow.data_offset);
8118c2ecf20Sopenharmony_ci		if(fd >= 0){
8128c2ecf20Sopenharmony_ci			printk(KERN_INFO "Creating \"%s\" as COW file for "
8138c2ecf20Sopenharmony_ci			       "\"%s\"\n", ubd_dev->file, ubd_dev->cow.file);
8148c2ecf20Sopenharmony_ci		}
8158c2ecf20Sopenharmony_ci	}
8168c2ecf20Sopenharmony_ci
8178c2ecf20Sopenharmony_ci	if(fd < 0){
8188c2ecf20Sopenharmony_ci		printk("Failed to open '%s', errno = %d\n", ubd_dev->file,
8198c2ecf20Sopenharmony_ci		       -fd);
8208c2ecf20Sopenharmony_ci		return fd;
8218c2ecf20Sopenharmony_ci	}
8228c2ecf20Sopenharmony_ci	ubd_dev->fd = fd;
8238c2ecf20Sopenharmony_ci
8248c2ecf20Sopenharmony_ci	if(ubd_dev->cow.file != NULL){
8258c2ecf20Sopenharmony_ci		blk_queue_max_hw_sectors(ubd_dev->queue, 8 * sizeof(long));
8268c2ecf20Sopenharmony_ci
8278c2ecf20Sopenharmony_ci		err = -ENOMEM;
8288c2ecf20Sopenharmony_ci		ubd_dev->cow.bitmap = vmalloc(ubd_dev->cow.bitmap_len);
8298c2ecf20Sopenharmony_ci		if(ubd_dev->cow.bitmap == NULL){
8308c2ecf20Sopenharmony_ci			printk(KERN_ERR "Failed to vmalloc COW bitmap\n");
8318c2ecf20Sopenharmony_ci			goto error;
8328c2ecf20Sopenharmony_ci		}
8338c2ecf20Sopenharmony_ci		flush_tlb_kernel_vm();
8348c2ecf20Sopenharmony_ci
8358c2ecf20Sopenharmony_ci		err = read_cow_bitmap(ubd_dev->fd, ubd_dev->cow.bitmap,
8368c2ecf20Sopenharmony_ci				      ubd_dev->cow.bitmap_offset,
8378c2ecf20Sopenharmony_ci				      ubd_dev->cow.bitmap_len);
8388c2ecf20Sopenharmony_ci		if(err < 0)
8398c2ecf20Sopenharmony_ci			goto error;
8408c2ecf20Sopenharmony_ci
8418c2ecf20Sopenharmony_ci		flags = ubd_dev->openflags;
8428c2ecf20Sopenharmony_ci		flags.w = 0;
8438c2ecf20Sopenharmony_ci		err = open_ubd_file(ubd_dev->cow.file, &flags, ubd_dev->shared, NULL,
8448c2ecf20Sopenharmony_ci				    NULL, NULL, NULL, NULL);
8458c2ecf20Sopenharmony_ci		if(err < 0) goto error;
8468c2ecf20Sopenharmony_ci		ubd_dev->cow.fd = err;
8478c2ecf20Sopenharmony_ci	}
8488c2ecf20Sopenharmony_ci	if (ubd_dev->no_trim == 0) {
8498c2ecf20Sopenharmony_ci		ubd_dev->queue->limits.discard_granularity = SECTOR_SIZE;
8508c2ecf20Sopenharmony_ci		ubd_dev->queue->limits.discard_alignment = SECTOR_SIZE;
8518c2ecf20Sopenharmony_ci		blk_queue_max_discard_sectors(ubd_dev->queue, UBD_MAX_REQUEST);
8528c2ecf20Sopenharmony_ci		blk_queue_max_write_zeroes_sectors(ubd_dev->queue, UBD_MAX_REQUEST);
8538c2ecf20Sopenharmony_ci		blk_queue_flag_set(QUEUE_FLAG_DISCARD, ubd_dev->queue);
8548c2ecf20Sopenharmony_ci	}
8558c2ecf20Sopenharmony_ci	blk_queue_flag_set(QUEUE_FLAG_NONROT, ubd_dev->queue);
8568c2ecf20Sopenharmony_ci	return 0;
8578c2ecf20Sopenharmony_ci error:
8588c2ecf20Sopenharmony_ci	os_close_file(ubd_dev->fd);
8598c2ecf20Sopenharmony_ci	return err;
8608c2ecf20Sopenharmony_ci}
8618c2ecf20Sopenharmony_ci
8628c2ecf20Sopenharmony_cistatic void ubd_device_release(struct device *dev)
8638c2ecf20Sopenharmony_ci{
8648c2ecf20Sopenharmony_ci	struct ubd *ubd_dev = dev_get_drvdata(dev);
8658c2ecf20Sopenharmony_ci
8668c2ecf20Sopenharmony_ci	blk_cleanup_queue(ubd_dev->queue);
8678c2ecf20Sopenharmony_ci	blk_mq_free_tag_set(&ubd_dev->tag_set);
8688c2ecf20Sopenharmony_ci	*ubd_dev = ((struct ubd) DEFAULT_UBD);
8698c2ecf20Sopenharmony_ci}
8708c2ecf20Sopenharmony_ci
8718c2ecf20Sopenharmony_cistatic int ubd_disk_register(int major, u64 size, int unit,
8728c2ecf20Sopenharmony_ci			     struct gendisk **disk_out)
8738c2ecf20Sopenharmony_ci{
8748c2ecf20Sopenharmony_ci	struct device *parent = NULL;
8758c2ecf20Sopenharmony_ci	struct gendisk *disk;
8768c2ecf20Sopenharmony_ci
8778c2ecf20Sopenharmony_ci	disk = alloc_disk(1 << UBD_SHIFT);
8788c2ecf20Sopenharmony_ci	if(disk == NULL)
8798c2ecf20Sopenharmony_ci		return -ENOMEM;
8808c2ecf20Sopenharmony_ci
8818c2ecf20Sopenharmony_ci	disk->major = major;
8828c2ecf20Sopenharmony_ci	disk->first_minor = unit << UBD_SHIFT;
8838c2ecf20Sopenharmony_ci	disk->fops = &ubd_blops;
8848c2ecf20Sopenharmony_ci	set_capacity(disk, size / 512);
8858c2ecf20Sopenharmony_ci	if (major == UBD_MAJOR)
8868c2ecf20Sopenharmony_ci		sprintf(disk->disk_name, "ubd%c", 'a' + unit);
8878c2ecf20Sopenharmony_ci	else
8888c2ecf20Sopenharmony_ci		sprintf(disk->disk_name, "ubd_fake%d", unit);
8898c2ecf20Sopenharmony_ci
8908c2ecf20Sopenharmony_ci	/* sysfs register (not for ide fake devices) */
8918c2ecf20Sopenharmony_ci	if (major == UBD_MAJOR) {
8928c2ecf20Sopenharmony_ci		ubd_devs[unit].pdev.id   = unit;
8938c2ecf20Sopenharmony_ci		ubd_devs[unit].pdev.name = DRIVER_NAME;
8948c2ecf20Sopenharmony_ci		ubd_devs[unit].pdev.dev.release = ubd_device_release;
8958c2ecf20Sopenharmony_ci		dev_set_drvdata(&ubd_devs[unit].pdev.dev, &ubd_devs[unit]);
8968c2ecf20Sopenharmony_ci		platform_device_register(&ubd_devs[unit].pdev);
8978c2ecf20Sopenharmony_ci		parent = &ubd_devs[unit].pdev.dev;
8988c2ecf20Sopenharmony_ci	}
8998c2ecf20Sopenharmony_ci
9008c2ecf20Sopenharmony_ci	disk->private_data = &ubd_devs[unit];
9018c2ecf20Sopenharmony_ci	disk->queue = ubd_devs[unit].queue;
9028c2ecf20Sopenharmony_ci	device_add_disk(parent, disk, NULL);
9038c2ecf20Sopenharmony_ci
9048c2ecf20Sopenharmony_ci	*disk_out = disk;
9058c2ecf20Sopenharmony_ci	return 0;
9068c2ecf20Sopenharmony_ci}
9078c2ecf20Sopenharmony_ci
/*
 * Round n up to the next multiple of SECTOR_SIZE.  The mask arithmetic relies
 * on SECTOR_SIZE being a power of two.  The argument is parenthesized so that
 * expression arguments (e.g. "a | b") are rounded as a whole.
 */
#define ROUND_BLOCK(n) (((n) + (SECTOR_SIZE - 1)) & (-SECTOR_SIZE))
9098c2ecf20Sopenharmony_ci
9108c2ecf20Sopenharmony_cistatic const struct blk_mq_ops ubd_mq_ops = {
9118c2ecf20Sopenharmony_ci	.queue_rq = ubd_queue_rq,
9128c2ecf20Sopenharmony_ci};
9138c2ecf20Sopenharmony_ci
9148c2ecf20Sopenharmony_cistatic int ubd_add(int n, char **error_out)
9158c2ecf20Sopenharmony_ci{
9168c2ecf20Sopenharmony_ci	struct ubd *ubd_dev = &ubd_devs[n];
9178c2ecf20Sopenharmony_ci	int err = 0;
9188c2ecf20Sopenharmony_ci
9198c2ecf20Sopenharmony_ci	if(ubd_dev->file == NULL)
9208c2ecf20Sopenharmony_ci		goto out;
9218c2ecf20Sopenharmony_ci
9228c2ecf20Sopenharmony_ci	err = ubd_file_size(ubd_dev, &ubd_dev->size);
9238c2ecf20Sopenharmony_ci	if(err < 0){
9248c2ecf20Sopenharmony_ci		*error_out = "Couldn't determine size of device's file";
9258c2ecf20Sopenharmony_ci		goto out;
9268c2ecf20Sopenharmony_ci	}
9278c2ecf20Sopenharmony_ci
9288c2ecf20Sopenharmony_ci	ubd_dev->size = ROUND_BLOCK(ubd_dev->size);
9298c2ecf20Sopenharmony_ci
9308c2ecf20Sopenharmony_ci	ubd_dev->tag_set.ops = &ubd_mq_ops;
9318c2ecf20Sopenharmony_ci	ubd_dev->tag_set.queue_depth = 64;
9328c2ecf20Sopenharmony_ci	ubd_dev->tag_set.numa_node = NUMA_NO_NODE;
9338c2ecf20Sopenharmony_ci	ubd_dev->tag_set.flags = BLK_MQ_F_SHOULD_MERGE;
9348c2ecf20Sopenharmony_ci	ubd_dev->tag_set.driver_data = ubd_dev;
9358c2ecf20Sopenharmony_ci	ubd_dev->tag_set.nr_hw_queues = 1;
9368c2ecf20Sopenharmony_ci
9378c2ecf20Sopenharmony_ci	err = blk_mq_alloc_tag_set(&ubd_dev->tag_set);
9388c2ecf20Sopenharmony_ci	if (err)
9398c2ecf20Sopenharmony_ci		goto out;
9408c2ecf20Sopenharmony_ci
9418c2ecf20Sopenharmony_ci	ubd_dev->queue = blk_mq_init_queue(&ubd_dev->tag_set);
9428c2ecf20Sopenharmony_ci	if (IS_ERR(ubd_dev->queue)) {
9438c2ecf20Sopenharmony_ci		err = PTR_ERR(ubd_dev->queue);
9448c2ecf20Sopenharmony_ci		goto out_cleanup_tags;
9458c2ecf20Sopenharmony_ci	}
9468c2ecf20Sopenharmony_ci
9478c2ecf20Sopenharmony_ci	ubd_dev->queue->queuedata = ubd_dev;
9488c2ecf20Sopenharmony_ci	blk_queue_write_cache(ubd_dev->queue, true, false);
9498c2ecf20Sopenharmony_ci
9508c2ecf20Sopenharmony_ci	blk_queue_max_segments(ubd_dev->queue, MAX_SG);
9518c2ecf20Sopenharmony_ci	blk_queue_segment_boundary(ubd_dev->queue, PAGE_SIZE - 1);
9528c2ecf20Sopenharmony_ci	err = ubd_disk_register(UBD_MAJOR, ubd_dev->size, n, &ubd_gendisk[n]);
9538c2ecf20Sopenharmony_ci	if(err){
9548c2ecf20Sopenharmony_ci		*error_out = "Failed to register device";
9558c2ecf20Sopenharmony_ci		goto out_cleanup_tags;
9568c2ecf20Sopenharmony_ci	}
9578c2ecf20Sopenharmony_ci
9588c2ecf20Sopenharmony_ci	if (fake_major != UBD_MAJOR)
9598c2ecf20Sopenharmony_ci		ubd_disk_register(fake_major, ubd_dev->size, n,
9608c2ecf20Sopenharmony_ci				  &fake_gendisk[n]);
9618c2ecf20Sopenharmony_ci
9628c2ecf20Sopenharmony_ci	/*
9638c2ecf20Sopenharmony_ci	 * Perhaps this should also be under the "if (fake_major)" above
9648c2ecf20Sopenharmony_ci	 * using the fake_disk->disk_name
9658c2ecf20Sopenharmony_ci	 */
9668c2ecf20Sopenharmony_ci	if (fake_ide)
9678c2ecf20Sopenharmony_ci		make_ide_entries(ubd_gendisk[n]->disk_name);
9688c2ecf20Sopenharmony_ci
9698c2ecf20Sopenharmony_ci	err = 0;
9708c2ecf20Sopenharmony_ciout:
9718c2ecf20Sopenharmony_ci	return err;
9728c2ecf20Sopenharmony_ci
9738c2ecf20Sopenharmony_ciout_cleanup_tags:
9748c2ecf20Sopenharmony_ci	blk_mq_free_tag_set(&ubd_dev->tag_set);
9758c2ecf20Sopenharmony_ci	if (!(IS_ERR(ubd_dev->queue)))
9768c2ecf20Sopenharmony_ci		blk_cleanup_queue(ubd_dev->queue);
9778c2ecf20Sopenharmony_ci	goto out;
9788c2ecf20Sopenharmony_ci}
9798c2ecf20Sopenharmony_ci
9808c2ecf20Sopenharmony_cistatic int ubd_config(char *str, char **error_out)
9818c2ecf20Sopenharmony_ci{
9828c2ecf20Sopenharmony_ci	int n, ret;
9838c2ecf20Sopenharmony_ci
9848c2ecf20Sopenharmony_ci	/* This string is possibly broken up and stored, so it's only
9858c2ecf20Sopenharmony_ci	 * freed if ubd_setup_common fails, or if only general options
9868c2ecf20Sopenharmony_ci	 * were set.
9878c2ecf20Sopenharmony_ci	 */
9888c2ecf20Sopenharmony_ci	str = kstrdup(str, GFP_KERNEL);
9898c2ecf20Sopenharmony_ci	if (str == NULL) {
9908c2ecf20Sopenharmony_ci		*error_out = "Failed to allocate memory";
9918c2ecf20Sopenharmony_ci		return -ENOMEM;
9928c2ecf20Sopenharmony_ci	}
9938c2ecf20Sopenharmony_ci
9948c2ecf20Sopenharmony_ci	ret = ubd_setup_common(str, &n, error_out);
9958c2ecf20Sopenharmony_ci	if (ret)
9968c2ecf20Sopenharmony_ci		goto err_free;
9978c2ecf20Sopenharmony_ci
9988c2ecf20Sopenharmony_ci	if (n == -1) {
9998c2ecf20Sopenharmony_ci		ret = 0;
10008c2ecf20Sopenharmony_ci		goto err_free;
10018c2ecf20Sopenharmony_ci	}
10028c2ecf20Sopenharmony_ci
10038c2ecf20Sopenharmony_ci	mutex_lock(&ubd_lock);
10048c2ecf20Sopenharmony_ci	ret = ubd_add(n, error_out);
10058c2ecf20Sopenharmony_ci	if (ret)
10068c2ecf20Sopenharmony_ci		ubd_devs[n].file = NULL;
10078c2ecf20Sopenharmony_ci	mutex_unlock(&ubd_lock);
10088c2ecf20Sopenharmony_ci
10098c2ecf20Sopenharmony_ciout:
10108c2ecf20Sopenharmony_ci	return ret;
10118c2ecf20Sopenharmony_ci
10128c2ecf20Sopenharmony_cierr_free:
10138c2ecf20Sopenharmony_ci	kfree(str);
10148c2ecf20Sopenharmony_ci	goto out;
10158c2ecf20Sopenharmony_ci}
10168c2ecf20Sopenharmony_ci
10178c2ecf20Sopenharmony_cistatic int ubd_get_config(char *name, char *str, int size, char **error_out)
10188c2ecf20Sopenharmony_ci{
10198c2ecf20Sopenharmony_ci	struct ubd *ubd_dev;
10208c2ecf20Sopenharmony_ci	int n, len = 0;
10218c2ecf20Sopenharmony_ci
10228c2ecf20Sopenharmony_ci	n = parse_unit(&name);
10238c2ecf20Sopenharmony_ci	if((n >= MAX_DEV) || (n < 0)){
10248c2ecf20Sopenharmony_ci		*error_out = "ubd_get_config : device number out of range";
10258c2ecf20Sopenharmony_ci		return -1;
10268c2ecf20Sopenharmony_ci	}
10278c2ecf20Sopenharmony_ci
10288c2ecf20Sopenharmony_ci	ubd_dev = &ubd_devs[n];
10298c2ecf20Sopenharmony_ci	mutex_lock(&ubd_lock);
10308c2ecf20Sopenharmony_ci
10318c2ecf20Sopenharmony_ci	if(ubd_dev->file == NULL){
10328c2ecf20Sopenharmony_ci		CONFIG_CHUNK(str, size, len, "", 1);
10338c2ecf20Sopenharmony_ci		goto out;
10348c2ecf20Sopenharmony_ci	}
10358c2ecf20Sopenharmony_ci
10368c2ecf20Sopenharmony_ci	CONFIG_CHUNK(str, size, len, ubd_dev->file, 0);
10378c2ecf20Sopenharmony_ci
10388c2ecf20Sopenharmony_ci	if(ubd_dev->cow.file != NULL){
10398c2ecf20Sopenharmony_ci		CONFIG_CHUNK(str, size, len, ",", 0);
10408c2ecf20Sopenharmony_ci		CONFIG_CHUNK(str, size, len, ubd_dev->cow.file, 1);
10418c2ecf20Sopenharmony_ci	}
10428c2ecf20Sopenharmony_ci	else CONFIG_CHUNK(str, size, len, "", 1);
10438c2ecf20Sopenharmony_ci
10448c2ecf20Sopenharmony_ci out:
10458c2ecf20Sopenharmony_ci	mutex_unlock(&ubd_lock);
10468c2ecf20Sopenharmony_ci	return len;
10478c2ecf20Sopenharmony_ci}
10488c2ecf20Sopenharmony_ci
10498c2ecf20Sopenharmony_cistatic int ubd_id(char **str, int *start_out, int *end_out)
10508c2ecf20Sopenharmony_ci{
10518c2ecf20Sopenharmony_ci	int n;
10528c2ecf20Sopenharmony_ci
10538c2ecf20Sopenharmony_ci	n = parse_unit(str);
10548c2ecf20Sopenharmony_ci	*start_out = 0;
10558c2ecf20Sopenharmony_ci	*end_out = MAX_DEV - 1;
10568c2ecf20Sopenharmony_ci	return n;
10578c2ecf20Sopenharmony_ci}
10588c2ecf20Sopenharmony_ci
10598c2ecf20Sopenharmony_cistatic int ubd_remove(int n, char **error_out)
10608c2ecf20Sopenharmony_ci{
10618c2ecf20Sopenharmony_ci	struct gendisk *disk = ubd_gendisk[n];
10628c2ecf20Sopenharmony_ci	struct ubd *ubd_dev;
10638c2ecf20Sopenharmony_ci	int err = -ENODEV;
10648c2ecf20Sopenharmony_ci
10658c2ecf20Sopenharmony_ci	mutex_lock(&ubd_lock);
10668c2ecf20Sopenharmony_ci
10678c2ecf20Sopenharmony_ci	ubd_dev = &ubd_devs[n];
10688c2ecf20Sopenharmony_ci
10698c2ecf20Sopenharmony_ci	if(ubd_dev->file == NULL)
10708c2ecf20Sopenharmony_ci		goto out;
10718c2ecf20Sopenharmony_ci
10728c2ecf20Sopenharmony_ci	/* you cannot remove a open disk */
10738c2ecf20Sopenharmony_ci	err = -EBUSY;
10748c2ecf20Sopenharmony_ci	if(ubd_dev->count > 0)
10758c2ecf20Sopenharmony_ci		goto out;
10768c2ecf20Sopenharmony_ci
10778c2ecf20Sopenharmony_ci	ubd_gendisk[n] = NULL;
10788c2ecf20Sopenharmony_ci	if(disk != NULL){
10798c2ecf20Sopenharmony_ci		del_gendisk(disk);
10808c2ecf20Sopenharmony_ci		put_disk(disk);
10818c2ecf20Sopenharmony_ci	}
10828c2ecf20Sopenharmony_ci
10838c2ecf20Sopenharmony_ci	if(fake_gendisk[n] != NULL){
10848c2ecf20Sopenharmony_ci		del_gendisk(fake_gendisk[n]);
10858c2ecf20Sopenharmony_ci		put_disk(fake_gendisk[n]);
10868c2ecf20Sopenharmony_ci		fake_gendisk[n] = NULL;
10878c2ecf20Sopenharmony_ci	}
10888c2ecf20Sopenharmony_ci
10898c2ecf20Sopenharmony_ci	err = 0;
10908c2ecf20Sopenharmony_ci	platform_device_unregister(&ubd_dev->pdev);
10918c2ecf20Sopenharmony_ciout:
10928c2ecf20Sopenharmony_ci	mutex_unlock(&ubd_lock);
10938c2ecf20Sopenharmony_ci	return err;
10948c2ecf20Sopenharmony_ci}
10958c2ecf20Sopenharmony_ci
10968c2ecf20Sopenharmony_ci/* All these are called by mconsole in process context and without
10978c2ecf20Sopenharmony_ci * ubd-specific locks.  The structure itself is const except for .list.
10988c2ecf20Sopenharmony_ci */
10998c2ecf20Sopenharmony_cistatic struct mc_device ubd_mc = {
11008c2ecf20Sopenharmony_ci	.list		= LIST_HEAD_INIT(ubd_mc.list),
11018c2ecf20Sopenharmony_ci	.name		= "ubd",
11028c2ecf20Sopenharmony_ci	.config		= ubd_config,
11038c2ecf20Sopenharmony_ci	.get_config	= ubd_get_config,
11048c2ecf20Sopenharmony_ci	.id		= ubd_id,
11058c2ecf20Sopenharmony_ci	.remove		= ubd_remove,
11068c2ecf20Sopenharmony_ci};
11078c2ecf20Sopenharmony_ci
11088c2ecf20Sopenharmony_cistatic int __init ubd_mc_init(void)
11098c2ecf20Sopenharmony_ci{
11108c2ecf20Sopenharmony_ci	mconsole_register_dev(&ubd_mc);
11118c2ecf20Sopenharmony_ci	return 0;
11128c2ecf20Sopenharmony_ci}
11138c2ecf20Sopenharmony_ci
11148c2ecf20Sopenharmony_ci__initcall(ubd_mc_init);
11158c2ecf20Sopenharmony_ci
11168c2ecf20Sopenharmony_cistatic int __init ubd0_init(void)
11178c2ecf20Sopenharmony_ci{
11188c2ecf20Sopenharmony_ci	struct ubd *ubd_dev = &ubd_devs[0];
11198c2ecf20Sopenharmony_ci
11208c2ecf20Sopenharmony_ci	mutex_lock(&ubd_lock);
11218c2ecf20Sopenharmony_ci	if(ubd_dev->file == NULL)
11228c2ecf20Sopenharmony_ci		ubd_dev->file = "root_fs";
11238c2ecf20Sopenharmony_ci	mutex_unlock(&ubd_lock);
11248c2ecf20Sopenharmony_ci
11258c2ecf20Sopenharmony_ci	return 0;
11268c2ecf20Sopenharmony_ci}
11278c2ecf20Sopenharmony_ci
11288c2ecf20Sopenharmony_ci__initcall(ubd0_init);
11298c2ecf20Sopenharmony_ci
11308c2ecf20Sopenharmony_ci/* Used in ubd_init, which is an initcall */
11318c2ecf20Sopenharmony_cistatic struct platform_driver ubd_driver = {
11328c2ecf20Sopenharmony_ci	.driver = {
11338c2ecf20Sopenharmony_ci		.name  = DRIVER_NAME,
11348c2ecf20Sopenharmony_ci	},
11358c2ecf20Sopenharmony_ci};
11368c2ecf20Sopenharmony_ci
11378c2ecf20Sopenharmony_cistatic int __init ubd_init(void)
11388c2ecf20Sopenharmony_ci{
11398c2ecf20Sopenharmony_ci	char *error;
11408c2ecf20Sopenharmony_ci	int i, err;
11418c2ecf20Sopenharmony_ci
11428c2ecf20Sopenharmony_ci	if (register_blkdev(UBD_MAJOR, "ubd"))
11438c2ecf20Sopenharmony_ci		return -1;
11448c2ecf20Sopenharmony_ci
11458c2ecf20Sopenharmony_ci	if (fake_major != UBD_MAJOR) {
11468c2ecf20Sopenharmony_ci		char name[sizeof("ubd_nnn\0")];
11478c2ecf20Sopenharmony_ci
11488c2ecf20Sopenharmony_ci		snprintf(name, sizeof(name), "ubd_%d", fake_major);
11498c2ecf20Sopenharmony_ci		if (register_blkdev(fake_major, "ubd"))
11508c2ecf20Sopenharmony_ci			return -1;
11518c2ecf20Sopenharmony_ci	}
11528c2ecf20Sopenharmony_ci
11538c2ecf20Sopenharmony_ci	irq_req_buffer = kmalloc_array(UBD_REQ_BUFFER_SIZE,
11548c2ecf20Sopenharmony_ci				       sizeof(struct io_thread_req *),
11558c2ecf20Sopenharmony_ci				       GFP_KERNEL
11568c2ecf20Sopenharmony_ci		);
11578c2ecf20Sopenharmony_ci	irq_remainder = 0;
11588c2ecf20Sopenharmony_ci
11598c2ecf20Sopenharmony_ci	if (irq_req_buffer == NULL) {
11608c2ecf20Sopenharmony_ci		printk(KERN_ERR "Failed to initialize ubd buffering\n");
11618c2ecf20Sopenharmony_ci		return -1;
11628c2ecf20Sopenharmony_ci	}
11638c2ecf20Sopenharmony_ci	io_req_buffer = kmalloc_array(UBD_REQ_BUFFER_SIZE,
11648c2ecf20Sopenharmony_ci				      sizeof(struct io_thread_req *),
11658c2ecf20Sopenharmony_ci				      GFP_KERNEL
11668c2ecf20Sopenharmony_ci		);
11678c2ecf20Sopenharmony_ci
11688c2ecf20Sopenharmony_ci	io_remainder = 0;
11698c2ecf20Sopenharmony_ci
11708c2ecf20Sopenharmony_ci	if (io_req_buffer == NULL) {
11718c2ecf20Sopenharmony_ci		printk(KERN_ERR "Failed to initialize ubd buffering\n");
11728c2ecf20Sopenharmony_ci		return -1;
11738c2ecf20Sopenharmony_ci	}
11748c2ecf20Sopenharmony_ci	platform_driver_register(&ubd_driver);
11758c2ecf20Sopenharmony_ci	mutex_lock(&ubd_lock);
11768c2ecf20Sopenharmony_ci	for (i = 0; i < MAX_DEV; i++){
11778c2ecf20Sopenharmony_ci		err = ubd_add(i, &error);
11788c2ecf20Sopenharmony_ci		if(err)
11798c2ecf20Sopenharmony_ci			printk(KERN_ERR "Failed to initialize ubd device %d :"
11808c2ecf20Sopenharmony_ci			       "%s\n", i, error);
11818c2ecf20Sopenharmony_ci	}
11828c2ecf20Sopenharmony_ci	mutex_unlock(&ubd_lock);
11838c2ecf20Sopenharmony_ci	return 0;
11848c2ecf20Sopenharmony_ci}
11858c2ecf20Sopenharmony_ci
11868c2ecf20Sopenharmony_cilate_initcall(ubd_init);
11878c2ecf20Sopenharmony_ci
11888c2ecf20Sopenharmony_cistatic int __init ubd_driver_init(void){
11898c2ecf20Sopenharmony_ci	unsigned long stack;
11908c2ecf20Sopenharmony_ci	int err;
11918c2ecf20Sopenharmony_ci
11928c2ecf20Sopenharmony_ci	/* Set by CONFIG_BLK_DEV_UBD_SYNC or ubd=sync.*/
11938c2ecf20Sopenharmony_ci	if(global_openflags.s){
11948c2ecf20Sopenharmony_ci		printk(KERN_INFO "ubd: Synchronous mode\n");
11958c2ecf20Sopenharmony_ci		/* Letting ubd=sync be like using ubd#s= instead of ubd#= is
11968c2ecf20Sopenharmony_ci		 * enough. So use anyway the io thread. */
11978c2ecf20Sopenharmony_ci	}
11988c2ecf20Sopenharmony_ci	stack = alloc_stack(0, 0);
11998c2ecf20Sopenharmony_ci	io_pid = start_io_thread(stack + PAGE_SIZE - sizeof(void *),
12008c2ecf20Sopenharmony_ci				 &thread_fd);
12018c2ecf20Sopenharmony_ci	if(io_pid < 0){
12028c2ecf20Sopenharmony_ci		printk(KERN_ERR
12038c2ecf20Sopenharmony_ci		       "ubd : Failed to start I/O thread (errno = %d) - "
12048c2ecf20Sopenharmony_ci		       "falling back to synchronous I/O\n", -io_pid);
12058c2ecf20Sopenharmony_ci		io_pid = -1;
12068c2ecf20Sopenharmony_ci		return 0;
12078c2ecf20Sopenharmony_ci	}
12088c2ecf20Sopenharmony_ci	err = um_request_irq(UBD_IRQ, thread_fd, IRQ_READ, ubd_intr,
12098c2ecf20Sopenharmony_ci			     0, "ubd", ubd_devs);
12108c2ecf20Sopenharmony_ci	if(err != 0)
12118c2ecf20Sopenharmony_ci		printk(KERN_ERR "um_request_irq failed - errno = %d\n", -err);
12128c2ecf20Sopenharmony_ci	return 0;
12138c2ecf20Sopenharmony_ci}
12148c2ecf20Sopenharmony_ci
12158c2ecf20Sopenharmony_cidevice_initcall(ubd_driver_init);
12168c2ecf20Sopenharmony_ci
12178c2ecf20Sopenharmony_cistatic int ubd_open(struct block_device *bdev, fmode_t mode)
12188c2ecf20Sopenharmony_ci{
12198c2ecf20Sopenharmony_ci	struct gendisk *disk = bdev->bd_disk;
12208c2ecf20Sopenharmony_ci	struct ubd *ubd_dev = disk->private_data;
12218c2ecf20Sopenharmony_ci	int err = 0;
12228c2ecf20Sopenharmony_ci
12238c2ecf20Sopenharmony_ci	mutex_lock(&ubd_mutex);
12248c2ecf20Sopenharmony_ci	if(ubd_dev->count == 0){
12258c2ecf20Sopenharmony_ci		err = ubd_open_dev(ubd_dev);
12268c2ecf20Sopenharmony_ci		if(err){
12278c2ecf20Sopenharmony_ci			printk(KERN_ERR "%s: Can't open \"%s\": errno = %d\n",
12288c2ecf20Sopenharmony_ci			       disk->disk_name, ubd_dev->file, -err);
12298c2ecf20Sopenharmony_ci			goto out;
12308c2ecf20Sopenharmony_ci		}
12318c2ecf20Sopenharmony_ci	}
12328c2ecf20Sopenharmony_ci	ubd_dev->count++;
12338c2ecf20Sopenharmony_ci	set_disk_ro(disk, !ubd_dev->openflags.w);
12348c2ecf20Sopenharmony_ci
12358c2ecf20Sopenharmony_ci	/* This should no more be needed. And it didn't work anyway to exclude
12368c2ecf20Sopenharmony_ci	 * read-write remounting of filesystems.*/
12378c2ecf20Sopenharmony_ci	/*if((mode & FMODE_WRITE) && !ubd_dev->openflags.w){
12388c2ecf20Sopenharmony_ci	        if(--ubd_dev->count == 0) ubd_close_dev(ubd_dev);
12398c2ecf20Sopenharmony_ci	        err = -EROFS;
12408c2ecf20Sopenharmony_ci	}*/
12418c2ecf20Sopenharmony_ciout:
12428c2ecf20Sopenharmony_ci	mutex_unlock(&ubd_mutex);
12438c2ecf20Sopenharmony_ci	return err;
12448c2ecf20Sopenharmony_ci}
12458c2ecf20Sopenharmony_ci
12468c2ecf20Sopenharmony_cistatic void ubd_release(struct gendisk *disk, fmode_t mode)
12478c2ecf20Sopenharmony_ci{
12488c2ecf20Sopenharmony_ci	struct ubd *ubd_dev = disk->private_data;
12498c2ecf20Sopenharmony_ci
12508c2ecf20Sopenharmony_ci	mutex_lock(&ubd_mutex);
12518c2ecf20Sopenharmony_ci	if(--ubd_dev->count == 0)
12528c2ecf20Sopenharmony_ci		ubd_close_dev(ubd_dev);
12538c2ecf20Sopenharmony_ci	mutex_unlock(&ubd_mutex);
12548c2ecf20Sopenharmony_ci}
12558c2ecf20Sopenharmony_ci
12568c2ecf20Sopenharmony_cistatic void cowify_bitmap(__u64 io_offset, int length, unsigned long *cow_mask,
12578c2ecf20Sopenharmony_ci			  __u64 *cow_offset, unsigned long *bitmap,
12588c2ecf20Sopenharmony_ci			  __u64 bitmap_offset, unsigned long *bitmap_words,
12598c2ecf20Sopenharmony_ci			  __u64 bitmap_len)
12608c2ecf20Sopenharmony_ci{
12618c2ecf20Sopenharmony_ci	__u64 sector = io_offset >> SECTOR_SHIFT;
12628c2ecf20Sopenharmony_ci	int i, update_bitmap = 0;
12638c2ecf20Sopenharmony_ci
12648c2ecf20Sopenharmony_ci	for (i = 0; i < length >> SECTOR_SHIFT; i++) {
12658c2ecf20Sopenharmony_ci		if(cow_mask != NULL)
12668c2ecf20Sopenharmony_ci			ubd_set_bit(i, (unsigned char *) cow_mask);
12678c2ecf20Sopenharmony_ci		if(ubd_test_bit(sector + i, (unsigned char *) bitmap))
12688c2ecf20Sopenharmony_ci			continue;
12698c2ecf20Sopenharmony_ci
12708c2ecf20Sopenharmony_ci		update_bitmap = 1;
12718c2ecf20Sopenharmony_ci		ubd_set_bit(sector + i, (unsigned char *) bitmap);
12728c2ecf20Sopenharmony_ci	}
12738c2ecf20Sopenharmony_ci
12748c2ecf20Sopenharmony_ci	if(!update_bitmap)
12758c2ecf20Sopenharmony_ci		return;
12768c2ecf20Sopenharmony_ci
12778c2ecf20Sopenharmony_ci	*cow_offset = sector / (sizeof(unsigned long) * 8);
12788c2ecf20Sopenharmony_ci
12798c2ecf20Sopenharmony_ci	/* This takes care of the case where we're exactly at the end of the
12808c2ecf20Sopenharmony_ci	 * device, and *cow_offset + 1 is off the end.  So, just back it up
12818c2ecf20Sopenharmony_ci	 * by one word.  Thanks to Lynn Kerby for the fix and James McMechan
12828c2ecf20Sopenharmony_ci	 * for the original diagnosis.
12838c2ecf20Sopenharmony_ci	 */
12848c2ecf20Sopenharmony_ci	if (*cow_offset == (DIV_ROUND_UP(bitmap_len,
12858c2ecf20Sopenharmony_ci					 sizeof(unsigned long)) - 1))
12868c2ecf20Sopenharmony_ci		(*cow_offset)--;
12878c2ecf20Sopenharmony_ci
12888c2ecf20Sopenharmony_ci	bitmap_words[0] = bitmap[*cow_offset];
12898c2ecf20Sopenharmony_ci	bitmap_words[1] = bitmap[*cow_offset + 1];
12908c2ecf20Sopenharmony_ci
12918c2ecf20Sopenharmony_ci	*cow_offset *= sizeof(unsigned long);
12928c2ecf20Sopenharmony_ci	*cow_offset += bitmap_offset;
12938c2ecf20Sopenharmony_ci}
12948c2ecf20Sopenharmony_ci
12958c2ecf20Sopenharmony_cistatic void cowify_req(struct io_thread_req *req, struct io_desc *segment,
12968c2ecf20Sopenharmony_ci		       unsigned long offset, unsigned long *bitmap,
12978c2ecf20Sopenharmony_ci		       __u64 bitmap_offset, __u64 bitmap_len)
12988c2ecf20Sopenharmony_ci{
12998c2ecf20Sopenharmony_ci	__u64 sector = offset >> SECTOR_SHIFT;
13008c2ecf20Sopenharmony_ci	int i;
13018c2ecf20Sopenharmony_ci
13028c2ecf20Sopenharmony_ci	if (segment->length > (sizeof(segment->sector_mask) * 8) << SECTOR_SHIFT)
13038c2ecf20Sopenharmony_ci		panic("Operation too long");
13048c2ecf20Sopenharmony_ci
13058c2ecf20Sopenharmony_ci	if (req_op(req->req) == REQ_OP_READ) {
13068c2ecf20Sopenharmony_ci		for (i = 0; i < segment->length >> SECTOR_SHIFT; i++) {
13078c2ecf20Sopenharmony_ci			if(ubd_test_bit(sector + i, (unsigned char *) bitmap))
13088c2ecf20Sopenharmony_ci				ubd_set_bit(i, (unsigned char *)
13098c2ecf20Sopenharmony_ci					    &segment->sector_mask);
13108c2ecf20Sopenharmony_ci		}
13118c2ecf20Sopenharmony_ci	} else {
13128c2ecf20Sopenharmony_ci		cowify_bitmap(offset, segment->length, &segment->sector_mask,
13138c2ecf20Sopenharmony_ci			      &segment->cow_offset, bitmap, bitmap_offset,
13148c2ecf20Sopenharmony_ci			      segment->bitmap_words, bitmap_len);
13158c2ecf20Sopenharmony_ci	}
13168c2ecf20Sopenharmony_ci}
13178c2ecf20Sopenharmony_ci
13188c2ecf20Sopenharmony_cistatic void ubd_map_req(struct ubd *dev, struct io_thread_req *io_req,
13198c2ecf20Sopenharmony_ci			struct request *req)
13208c2ecf20Sopenharmony_ci{
13218c2ecf20Sopenharmony_ci	struct bio_vec bvec;
13228c2ecf20Sopenharmony_ci	struct req_iterator iter;
13238c2ecf20Sopenharmony_ci	int i = 0;
13248c2ecf20Sopenharmony_ci	unsigned long byte_offset = io_req->offset;
13258c2ecf20Sopenharmony_ci	int op = req_op(req);
13268c2ecf20Sopenharmony_ci
13278c2ecf20Sopenharmony_ci	if (op == REQ_OP_WRITE_ZEROES || op == REQ_OP_DISCARD) {
13288c2ecf20Sopenharmony_ci		io_req->io_desc[0].buffer = NULL;
13298c2ecf20Sopenharmony_ci		io_req->io_desc[0].length = blk_rq_bytes(req);
13308c2ecf20Sopenharmony_ci	} else {
13318c2ecf20Sopenharmony_ci		rq_for_each_segment(bvec, req, iter) {
13328c2ecf20Sopenharmony_ci			BUG_ON(i >= io_req->desc_cnt);
13338c2ecf20Sopenharmony_ci
13348c2ecf20Sopenharmony_ci			io_req->io_desc[i].buffer =
13358c2ecf20Sopenharmony_ci				page_address(bvec.bv_page) + bvec.bv_offset;
13368c2ecf20Sopenharmony_ci			io_req->io_desc[i].length = bvec.bv_len;
13378c2ecf20Sopenharmony_ci			i++;
13388c2ecf20Sopenharmony_ci		}
13398c2ecf20Sopenharmony_ci	}
13408c2ecf20Sopenharmony_ci
13418c2ecf20Sopenharmony_ci	if (dev->cow.file) {
13428c2ecf20Sopenharmony_ci		for (i = 0; i < io_req->desc_cnt; i++) {
13438c2ecf20Sopenharmony_ci			cowify_req(io_req, &io_req->io_desc[i], byte_offset,
13448c2ecf20Sopenharmony_ci				   dev->cow.bitmap, dev->cow.bitmap_offset,
13458c2ecf20Sopenharmony_ci				   dev->cow.bitmap_len);
13468c2ecf20Sopenharmony_ci			byte_offset += io_req->io_desc[i].length;
13478c2ecf20Sopenharmony_ci		}
13488c2ecf20Sopenharmony_ci
13498c2ecf20Sopenharmony_ci	}
13508c2ecf20Sopenharmony_ci}
13518c2ecf20Sopenharmony_ci
13528c2ecf20Sopenharmony_cistatic struct io_thread_req *ubd_alloc_req(struct ubd *dev, struct request *req,
13538c2ecf20Sopenharmony_ci					   int desc_cnt)
13548c2ecf20Sopenharmony_ci{
13558c2ecf20Sopenharmony_ci	struct io_thread_req *io_req;
13568c2ecf20Sopenharmony_ci	int i;
13578c2ecf20Sopenharmony_ci
13588c2ecf20Sopenharmony_ci	io_req = kmalloc(sizeof(*io_req) +
13598c2ecf20Sopenharmony_ci			 (desc_cnt * sizeof(struct io_desc)),
13608c2ecf20Sopenharmony_ci			 GFP_ATOMIC);
13618c2ecf20Sopenharmony_ci	if (!io_req)
13628c2ecf20Sopenharmony_ci		return NULL;
13638c2ecf20Sopenharmony_ci
13648c2ecf20Sopenharmony_ci	io_req->req = req;
13658c2ecf20Sopenharmony_ci	if (dev->cow.file)
13668c2ecf20Sopenharmony_ci		io_req->fds[0] = dev->cow.fd;
13678c2ecf20Sopenharmony_ci	else
13688c2ecf20Sopenharmony_ci		io_req->fds[0] = dev->fd;
13698c2ecf20Sopenharmony_ci	io_req->error = 0;
13708c2ecf20Sopenharmony_ci	io_req->sectorsize = SECTOR_SIZE;
13718c2ecf20Sopenharmony_ci	io_req->fds[1] = dev->fd;
13728c2ecf20Sopenharmony_ci	io_req->offset = (u64) blk_rq_pos(req) << SECTOR_SHIFT;
13738c2ecf20Sopenharmony_ci	io_req->offsets[0] = 0;
13748c2ecf20Sopenharmony_ci	io_req->offsets[1] = dev->cow.data_offset;
13758c2ecf20Sopenharmony_ci
13768c2ecf20Sopenharmony_ci	for (i = 0 ; i < desc_cnt; i++) {
13778c2ecf20Sopenharmony_ci		io_req->io_desc[i].sector_mask = 0;
13788c2ecf20Sopenharmony_ci		io_req->io_desc[i].cow_offset = -1;
13798c2ecf20Sopenharmony_ci	}
13808c2ecf20Sopenharmony_ci
13818c2ecf20Sopenharmony_ci	return io_req;
13828c2ecf20Sopenharmony_ci}
13838c2ecf20Sopenharmony_ci
13848c2ecf20Sopenharmony_cistatic int ubd_submit_request(struct ubd *dev, struct request *req)
13858c2ecf20Sopenharmony_ci{
13868c2ecf20Sopenharmony_ci	int segs = 0;
13878c2ecf20Sopenharmony_ci	struct io_thread_req *io_req;
13888c2ecf20Sopenharmony_ci	int ret;
13898c2ecf20Sopenharmony_ci	int op = req_op(req);
13908c2ecf20Sopenharmony_ci
13918c2ecf20Sopenharmony_ci	if (op == REQ_OP_FLUSH)
13928c2ecf20Sopenharmony_ci		segs = 0;
13938c2ecf20Sopenharmony_ci	else if (op == REQ_OP_WRITE_ZEROES || op == REQ_OP_DISCARD)
13948c2ecf20Sopenharmony_ci		segs = 1;
13958c2ecf20Sopenharmony_ci	else
13968c2ecf20Sopenharmony_ci		segs = blk_rq_nr_phys_segments(req);
13978c2ecf20Sopenharmony_ci
13988c2ecf20Sopenharmony_ci	io_req = ubd_alloc_req(dev, req, segs);
13998c2ecf20Sopenharmony_ci	if (!io_req)
14008c2ecf20Sopenharmony_ci		return -ENOMEM;
14018c2ecf20Sopenharmony_ci
14028c2ecf20Sopenharmony_ci	io_req->desc_cnt = segs;
14038c2ecf20Sopenharmony_ci	if (segs)
14048c2ecf20Sopenharmony_ci		ubd_map_req(dev, io_req, req);
14058c2ecf20Sopenharmony_ci
14068c2ecf20Sopenharmony_ci	ret = os_write_file(thread_fd, &io_req, sizeof(io_req));
14078c2ecf20Sopenharmony_ci	if (ret != sizeof(io_req)) {
14088c2ecf20Sopenharmony_ci		if (ret != -EAGAIN)
14098c2ecf20Sopenharmony_ci			pr_err("write to io thread failed: %d\n", -ret);
14108c2ecf20Sopenharmony_ci		kfree(io_req);
14118c2ecf20Sopenharmony_ci	}
14128c2ecf20Sopenharmony_ci	return ret;
14138c2ecf20Sopenharmony_ci}
14148c2ecf20Sopenharmony_ci
14158c2ecf20Sopenharmony_cistatic blk_status_t ubd_queue_rq(struct blk_mq_hw_ctx *hctx,
14168c2ecf20Sopenharmony_ci				 const struct blk_mq_queue_data *bd)
14178c2ecf20Sopenharmony_ci{
14188c2ecf20Sopenharmony_ci	struct ubd *ubd_dev = hctx->queue->queuedata;
14198c2ecf20Sopenharmony_ci	struct request *req = bd->rq;
14208c2ecf20Sopenharmony_ci	int ret = 0, res = BLK_STS_OK;
14218c2ecf20Sopenharmony_ci
14228c2ecf20Sopenharmony_ci	blk_mq_start_request(req);
14238c2ecf20Sopenharmony_ci
14248c2ecf20Sopenharmony_ci	spin_lock_irq(&ubd_dev->lock);
14258c2ecf20Sopenharmony_ci
14268c2ecf20Sopenharmony_ci	switch (req_op(req)) {
14278c2ecf20Sopenharmony_ci	case REQ_OP_FLUSH:
14288c2ecf20Sopenharmony_ci	case REQ_OP_READ:
14298c2ecf20Sopenharmony_ci	case REQ_OP_WRITE:
14308c2ecf20Sopenharmony_ci	case REQ_OP_DISCARD:
14318c2ecf20Sopenharmony_ci	case REQ_OP_WRITE_ZEROES:
14328c2ecf20Sopenharmony_ci		ret = ubd_submit_request(ubd_dev, req);
14338c2ecf20Sopenharmony_ci		break;
14348c2ecf20Sopenharmony_ci	default:
14358c2ecf20Sopenharmony_ci		WARN_ON_ONCE(1);
14368c2ecf20Sopenharmony_ci		res = BLK_STS_NOTSUPP;
14378c2ecf20Sopenharmony_ci	}
14388c2ecf20Sopenharmony_ci
14398c2ecf20Sopenharmony_ci	spin_unlock_irq(&ubd_dev->lock);
14408c2ecf20Sopenharmony_ci
14418c2ecf20Sopenharmony_ci	if (ret < 0) {
14428c2ecf20Sopenharmony_ci		if (ret == -ENOMEM)
14438c2ecf20Sopenharmony_ci			res = BLK_STS_RESOURCE;
14448c2ecf20Sopenharmony_ci		else
14458c2ecf20Sopenharmony_ci			res = BLK_STS_DEV_RESOURCE;
14468c2ecf20Sopenharmony_ci	}
14478c2ecf20Sopenharmony_ci
14488c2ecf20Sopenharmony_ci	return res;
14498c2ecf20Sopenharmony_ci}
14508c2ecf20Sopenharmony_ci
14518c2ecf20Sopenharmony_cistatic int ubd_getgeo(struct block_device *bdev, struct hd_geometry *geo)
14528c2ecf20Sopenharmony_ci{
14538c2ecf20Sopenharmony_ci	struct ubd *ubd_dev = bdev->bd_disk->private_data;
14548c2ecf20Sopenharmony_ci
14558c2ecf20Sopenharmony_ci	geo->heads = 128;
14568c2ecf20Sopenharmony_ci	geo->sectors = 32;
14578c2ecf20Sopenharmony_ci	geo->cylinders = ubd_dev->size / (128 * 32 * 512);
14588c2ecf20Sopenharmony_ci	return 0;
14598c2ecf20Sopenharmony_ci}
14608c2ecf20Sopenharmony_ci
14618c2ecf20Sopenharmony_cistatic int ubd_ioctl(struct block_device *bdev, fmode_t mode,
14628c2ecf20Sopenharmony_ci		     unsigned int cmd, unsigned long arg)
14638c2ecf20Sopenharmony_ci{
14648c2ecf20Sopenharmony_ci	struct ubd *ubd_dev = bdev->bd_disk->private_data;
14658c2ecf20Sopenharmony_ci	u16 ubd_id[ATA_ID_WORDS];
14668c2ecf20Sopenharmony_ci
14678c2ecf20Sopenharmony_ci	switch (cmd) {
14688c2ecf20Sopenharmony_ci		struct cdrom_volctrl volume;
14698c2ecf20Sopenharmony_ci	case HDIO_GET_IDENTITY:
14708c2ecf20Sopenharmony_ci		memset(&ubd_id, 0, ATA_ID_WORDS * 2);
14718c2ecf20Sopenharmony_ci		ubd_id[ATA_ID_CYLS]	= ubd_dev->size / (128 * 32 * 512);
14728c2ecf20Sopenharmony_ci		ubd_id[ATA_ID_HEADS]	= 128;
14738c2ecf20Sopenharmony_ci		ubd_id[ATA_ID_SECTORS]	= 32;
14748c2ecf20Sopenharmony_ci		if(copy_to_user((char __user *) arg, (char *) &ubd_id,
14758c2ecf20Sopenharmony_ci				 sizeof(ubd_id)))
14768c2ecf20Sopenharmony_ci			return -EFAULT;
14778c2ecf20Sopenharmony_ci		return 0;
14788c2ecf20Sopenharmony_ci
14798c2ecf20Sopenharmony_ci	case CDROMVOLREAD:
14808c2ecf20Sopenharmony_ci		if(copy_from_user(&volume, (char __user *) arg, sizeof(volume)))
14818c2ecf20Sopenharmony_ci			return -EFAULT;
14828c2ecf20Sopenharmony_ci		volume.channel0 = 255;
14838c2ecf20Sopenharmony_ci		volume.channel1 = 255;
14848c2ecf20Sopenharmony_ci		volume.channel2 = 255;
14858c2ecf20Sopenharmony_ci		volume.channel3 = 255;
14868c2ecf20Sopenharmony_ci		if(copy_to_user((char __user *) arg, &volume, sizeof(volume)))
14878c2ecf20Sopenharmony_ci			return -EFAULT;
14888c2ecf20Sopenharmony_ci		return 0;
14898c2ecf20Sopenharmony_ci	}
14908c2ecf20Sopenharmony_ci	return -EINVAL;
14918c2ecf20Sopenharmony_ci}
14928c2ecf20Sopenharmony_ci
14938c2ecf20Sopenharmony_cistatic int map_error(int error_code)
14948c2ecf20Sopenharmony_ci{
14958c2ecf20Sopenharmony_ci	switch (error_code) {
14968c2ecf20Sopenharmony_ci	case 0:
14978c2ecf20Sopenharmony_ci		return BLK_STS_OK;
14988c2ecf20Sopenharmony_ci	case ENOSYS:
14998c2ecf20Sopenharmony_ci	case EOPNOTSUPP:
15008c2ecf20Sopenharmony_ci		return BLK_STS_NOTSUPP;
15018c2ecf20Sopenharmony_ci	case ENOSPC:
15028c2ecf20Sopenharmony_ci		return BLK_STS_NOSPC;
15038c2ecf20Sopenharmony_ci	}
15048c2ecf20Sopenharmony_ci	return BLK_STS_IOERR;
15058c2ecf20Sopenharmony_ci}
15068c2ecf20Sopenharmony_ci
15078c2ecf20Sopenharmony_ci/*
15088c2ecf20Sopenharmony_ci * Everything from here onwards *IS NOT PART OF THE KERNEL*
15098c2ecf20Sopenharmony_ci *
15108c2ecf20Sopenharmony_ci * The following functions are part of UML hypervisor code.
15118c2ecf20Sopenharmony_ci * All functions from here onwards are executed as a helper
15128c2ecf20Sopenharmony_ci * thread and are not allowed to execute any kernel functions.
15138c2ecf20Sopenharmony_ci *
15148c2ecf20Sopenharmony_ci * Any communication must occur strictly via shared memory and IPC.
15158c2ecf20Sopenharmony_ci *
15168c2ecf20Sopenharmony_ci * Do not add printks, locks, kernel memory operations, etc - it
15178c2ecf20Sopenharmony_ci * will result in unpredictable behaviour and/or crashes.
15188c2ecf20Sopenharmony_ci */
15198c2ecf20Sopenharmony_ci
15208c2ecf20Sopenharmony_cistatic int update_bitmap(struct io_thread_req *req, struct io_desc *segment)
15218c2ecf20Sopenharmony_ci{
15228c2ecf20Sopenharmony_ci	int n;
15238c2ecf20Sopenharmony_ci
15248c2ecf20Sopenharmony_ci	if (segment->cow_offset == -1)
15258c2ecf20Sopenharmony_ci		return map_error(0);
15268c2ecf20Sopenharmony_ci
15278c2ecf20Sopenharmony_ci	n = os_pwrite_file(req->fds[1], &segment->bitmap_words,
15288c2ecf20Sopenharmony_ci			  sizeof(segment->bitmap_words), segment->cow_offset);
15298c2ecf20Sopenharmony_ci	if (n != sizeof(segment->bitmap_words))
15308c2ecf20Sopenharmony_ci		return map_error(-n);
15318c2ecf20Sopenharmony_ci
15328c2ecf20Sopenharmony_ci	return map_error(0);
15338c2ecf20Sopenharmony_ci}
15348c2ecf20Sopenharmony_ci
15358c2ecf20Sopenharmony_cistatic void do_io(struct io_thread_req *req, struct io_desc *desc)
15368c2ecf20Sopenharmony_ci{
15378c2ecf20Sopenharmony_ci	char *buf = NULL;
15388c2ecf20Sopenharmony_ci	unsigned long len;
15398c2ecf20Sopenharmony_ci	int n, nsectors, start, end, bit;
15408c2ecf20Sopenharmony_ci	__u64 off;
15418c2ecf20Sopenharmony_ci
15428c2ecf20Sopenharmony_ci	/* FLUSH is really a special case, we cannot "case" it with others */
15438c2ecf20Sopenharmony_ci
15448c2ecf20Sopenharmony_ci	if (req_op(req->req) == REQ_OP_FLUSH) {
15458c2ecf20Sopenharmony_ci		/* fds[0] is always either the rw image or our cow file */
15468c2ecf20Sopenharmony_ci		req->error = map_error(-os_sync_file(req->fds[0]));
15478c2ecf20Sopenharmony_ci		return;
15488c2ecf20Sopenharmony_ci	}
15498c2ecf20Sopenharmony_ci
15508c2ecf20Sopenharmony_ci	nsectors = desc->length / req->sectorsize;
15518c2ecf20Sopenharmony_ci	start = 0;
15528c2ecf20Sopenharmony_ci	do {
15538c2ecf20Sopenharmony_ci		bit = ubd_test_bit(start, (unsigned char *) &desc->sector_mask);
15548c2ecf20Sopenharmony_ci		end = start;
15558c2ecf20Sopenharmony_ci		while((end < nsectors) &&
15568c2ecf20Sopenharmony_ci		      (ubd_test_bit(end, (unsigned char *) &desc->sector_mask) == bit))
15578c2ecf20Sopenharmony_ci			end++;
15588c2ecf20Sopenharmony_ci
15598c2ecf20Sopenharmony_ci		off = req->offset + req->offsets[bit] +
15608c2ecf20Sopenharmony_ci			start * req->sectorsize;
15618c2ecf20Sopenharmony_ci		len = (end - start) * req->sectorsize;
15628c2ecf20Sopenharmony_ci		if (desc->buffer != NULL)
15638c2ecf20Sopenharmony_ci			buf = &desc->buffer[start * req->sectorsize];
15648c2ecf20Sopenharmony_ci
15658c2ecf20Sopenharmony_ci		switch (req_op(req->req)) {
15668c2ecf20Sopenharmony_ci		case REQ_OP_READ:
15678c2ecf20Sopenharmony_ci			n = 0;
15688c2ecf20Sopenharmony_ci			do {
15698c2ecf20Sopenharmony_ci				buf = &buf[n];
15708c2ecf20Sopenharmony_ci				len -= n;
15718c2ecf20Sopenharmony_ci				n = os_pread_file(req->fds[bit], buf, len, off);
15728c2ecf20Sopenharmony_ci				if (n < 0) {
15738c2ecf20Sopenharmony_ci					req->error = map_error(-n);
15748c2ecf20Sopenharmony_ci					return;
15758c2ecf20Sopenharmony_ci				}
15768c2ecf20Sopenharmony_ci			} while((n < len) && (n != 0));
15778c2ecf20Sopenharmony_ci			if (n < len) memset(&buf[n], 0, len - n);
15788c2ecf20Sopenharmony_ci			break;
15798c2ecf20Sopenharmony_ci		case REQ_OP_WRITE:
15808c2ecf20Sopenharmony_ci			n = os_pwrite_file(req->fds[bit], buf, len, off);
15818c2ecf20Sopenharmony_ci			if(n != len){
15828c2ecf20Sopenharmony_ci				req->error = map_error(-n);
15838c2ecf20Sopenharmony_ci				return;
15848c2ecf20Sopenharmony_ci			}
15858c2ecf20Sopenharmony_ci			break;
15868c2ecf20Sopenharmony_ci		case REQ_OP_DISCARD:
15878c2ecf20Sopenharmony_ci		case REQ_OP_WRITE_ZEROES:
15888c2ecf20Sopenharmony_ci			n = os_falloc_punch(req->fds[bit], off, len);
15898c2ecf20Sopenharmony_ci			if (n) {
15908c2ecf20Sopenharmony_ci				req->error = map_error(-n);
15918c2ecf20Sopenharmony_ci				return;
15928c2ecf20Sopenharmony_ci			}
15938c2ecf20Sopenharmony_ci			break;
15948c2ecf20Sopenharmony_ci		default:
15958c2ecf20Sopenharmony_ci			WARN_ON_ONCE(1);
15968c2ecf20Sopenharmony_ci			req->error = BLK_STS_NOTSUPP;
15978c2ecf20Sopenharmony_ci			return;
15988c2ecf20Sopenharmony_ci		}
15998c2ecf20Sopenharmony_ci
16008c2ecf20Sopenharmony_ci		start = end;
16018c2ecf20Sopenharmony_ci	} while(start < nsectors);
16028c2ecf20Sopenharmony_ci
16038c2ecf20Sopenharmony_ci	req->offset += len;
16048c2ecf20Sopenharmony_ci	req->error = update_bitmap(req, desc);
16058c2ecf20Sopenharmony_ci}
16068c2ecf20Sopenharmony_ci
/* File descriptor the io thread reads requests from and writes completed
 * requests back to.  Changed in start_io_thread, which is serialized by
 * being called only from ubd_init, which is an initcall.
 */
int kernel_fd = -1;

/* Incremented by the io thread for every request it picks up; only the io
 * thread changes it.  XXX: currently unused.
 */
static int io_count;
16148c2ecf20Sopenharmony_ci
16158c2ecf20Sopenharmony_ciint io_thread(void *arg)
16168c2ecf20Sopenharmony_ci{
16178c2ecf20Sopenharmony_ci	int n, count, written, res;
16188c2ecf20Sopenharmony_ci
16198c2ecf20Sopenharmony_ci	os_fix_helper_signals();
16208c2ecf20Sopenharmony_ci
16218c2ecf20Sopenharmony_ci	while(1){
16228c2ecf20Sopenharmony_ci		n = bulk_req_safe_read(
16238c2ecf20Sopenharmony_ci			kernel_fd,
16248c2ecf20Sopenharmony_ci			io_req_buffer,
16258c2ecf20Sopenharmony_ci			&io_remainder,
16268c2ecf20Sopenharmony_ci			&io_remainder_size,
16278c2ecf20Sopenharmony_ci			UBD_REQ_BUFFER_SIZE
16288c2ecf20Sopenharmony_ci		);
16298c2ecf20Sopenharmony_ci		if (n <= 0) {
16308c2ecf20Sopenharmony_ci			if (n == -EAGAIN)
16318c2ecf20Sopenharmony_ci				ubd_read_poll(-1);
16328c2ecf20Sopenharmony_ci
16338c2ecf20Sopenharmony_ci			continue;
16348c2ecf20Sopenharmony_ci		}
16358c2ecf20Sopenharmony_ci
16368c2ecf20Sopenharmony_ci		for (count = 0; count < n/sizeof(struct io_thread_req *); count++) {
16378c2ecf20Sopenharmony_ci			struct io_thread_req *req = (*io_req_buffer)[count];
16388c2ecf20Sopenharmony_ci			int i;
16398c2ecf20Sopenharmony_ci
16408c2ecf20Sopenharmony_ci			io_count++;
16418c2ecf20Sopenharmony_ci			for (i = 0; !req->error && i < req->desc_cnt; i++)
16428c2ecf20Sopenharmony_ci				do_io(req, &(req->io_desc[i]));
16438c2ecf20Sopenharmony_ci
16448c2ecf20Sopenharmony_ci		}
16458c2ecf20Sopenharmony_ci
16468c2ecf20Sopenharmony_ci		written = 0;
16478c2ecf20Sopenharmony_ci
16488c2ecf20Sopenharmony_ci		do {
16498c2ecf20Sopenharmony_ci			res = os_write_file(kernel_fd,
16508c2ecf20Sopenharmony_ci					    ((char *) io_req_buffer) + written,
16518c2ecf20Sopenharmony_ci					    n - written);
16528c2ecf20Sopenharmony_ci			if (res >= 0) {
16538c2ecf20Sopenharmony_ci				written += res;
16548c2ecf20Sopenharmony_ci			}
16558c2ecf20Sopenharmony_ci			if (written < n) {
16568c2ecf20Sopenharmony_ci				ubd_write_poll(-1);
16578c2ecf20Sopenharmony_ci			}
16588c2ecf20Sopenharmony_ci		} while (written < n);
16598c2ecf20Sopenharmony_ci	}
16608c2ecf20Sopenharmony_ci
16618c2ecf20Sopenharmony_ci	return 0;
16628c2ecf20Sopenharmony_ci}
1663