162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0
262306a36Sopenharmony_ci/*
362306a36Sopenharmony_ci * Copyright (C) 2018 Cambridge Greys Ltd
462306a36Sopenharmony_ci * Copyright (C) 2015-2016 Anton Ivanov (aivanov@brocade.com)
562306a36Sopenharmony_ci * Copyright (C) 2000 Jeff Dike (jdike@karaya.com)
662306a36Sopenharmony_ci */
762306a36Sopenharmony_ci
862306a36Sopenharmony_ci/* 2001-09-28...2002-04-17
962306a36Sopenharmony_ci * Partition stuff by James_McMechan@hotmail.com
1062306a36Sopenharmony_ci * old style ubd by setting UBD_SHIFT to 0
1162306a36Sopenharmony_ci * 2002-09-27...2002-10-18 massive tinkering for 2.5
1262306a36Sopenharmony_ci * partitions have changed in 2.5
1362306a36Sopenharmony_ci * 2003-01-29 more tinkering for 2.5.59-1
1462306a36Sopenharmony_ci * This should now address the sysfs problems and has
1562306a36Sopenharmony_ci * the symlink for devfs to allow for booting with
1662306a36Sopenharmony_ci * the common /dev/ubd/discX/... names rather than
1762306a36Sopenharmony_ci * only /dev/ubdN/discN this version also has lots of
1862306a36Sopenharmony_ci * clean ups preparing for ubd-many.
1962306a36Sopenharmony_ci * James McMechan
2062306a36Sopenharmony_ci */
2162306a36Sopenharmony_ci
2262306a36Sopenharmony_ci#define UBD_SHIFT 4
2362306a36Sopenharmony_ci
2462306a36Sopenharmony_ci#include <linux/module.h>
2562306a36Sopenharmony_ci#include <linux/init.h>
2662306a36Sopenharmony_ci#include <linux/blkdev.h>
2762306a36Sopenharmony_ci#include <linux/blk-mq.h>
2862306a36Sopenharmony_ci#include <linux/ata.h>
2962306a36Sopenharmony_ci#include <linux/hdreg.h>
3062306a36Sopenharmony_ci#include <linux/major.h>
3162306a36Sopenharmony_ci#include <linux/cdrom.h>
3262306a36Sopenharmony_ci#include <linux/proc_fs.h>
3362306a36Sopenharmony_ci#include <linux/seq_file.h>
3462306a36Sopenharmony_ci#include <linux/ctype.h>
3562306a36Sopenharmony_ci#include <linux/slab.h>
3662306a36Sopenharmony_ci#include <linux/vmalloc.h>
3762306a36Sopenharmony_ci#include <linux/platform_device.h>
3862306a36Sopenharmony_ci#include <linux/scatterlist.h>
3962306a36Sopenharmony_ci#include <asm/tlbflush.h>
4062306a36Sopenharmony_ci#include <kern_util.h>
4162306a36Sopenharmony_ci#include "mconsole_kern.h"
4262306a36Sopenharmony_ci#include <init.h>
4362306a36Sopenharmony_ci#include <irq_kern.h>
4462306a36Sopenharmony_ci#include "ubd.h"
4562306a36Sopenharmony_ci#include <os.h>
4662306a36Sopenharmony_ci#include "cow.h"
4762306a36Sopenharmony_ci
/*
 * Max request size is determined by the sector mask - 32K.
 * The value is the number of bits in a long, which is the type of
 * io_desc.sector_mask (presumably one mask bit per sector - confirm).
 */
#define UBD_MAX_REQUEST (8 * sizeof(long))
5062306a36Sopenharmony_ci
/*
 * Descriptor for one chunk of an I/O request.
 *
 * NOTE(review): the field meanings below are inferred from the names only;
 * the code that fills them in is outside this part of the file.
 */
struct io_desc {
	/* data buffer for this chunk */
	char *buffer;
	/* presumably the length of buffer in bytes - confirm */
	unsigned long length;
	/* bit mask with one long's worth of bits, see UBD_MAX_REQUEST */
	unsigned long sector_mask;
	/* presumably the offset of bitmap_words within the COW file */
	unsigned long long cow_offset;
	unsigned long bitmap_words[2];
};
5862306a36Sopenharmony_ci
5962306a36Sopenharmony_cistruct io_thread_req {
6062306a36Sopenharmony_ci	struct request *req;
6162306a36Sopenharmony_ci	int fds[2];
6262306a36Sopenharmony_ci	unsigned long offsets[2];
6362306a36Sopenharmony_ci	unsigned long long offset;
6462306a36Sopenharmony_ci	int sectorsize;
6562306a36Sopenharmony_ci	int error;
6662306a36Sopenharmony_ci
6762306a36Sopenharmony_ci	int desc_cnt;
6862306a36Sopenharmony_ci	/* io_desc has to be the last element of the struct */
6962306a36Sopenharmony_ci	struct io_desc io_desc[];
7062306a36Sopenharmony_ci};
7162306a36Sopenharmony_ci
7262306a36Sopenharmony_ci
/*
 * State used by ubd_handler() with bulk_req_safe_read(): the array of
 * request pointers read in one go, plus storage and byte count for a
 * trailing, incomplete pointer left over from a short read.
 */
static struct io_thread_req * (*irq_req_buffer)[];
static struct io_thread_req *irq_remainder;
static int irq_remainder_size;

/*
 * Same three items with an io_ prefix; presumably the counterpart used on
 * the I/O thread side (that code is not in this part of the file).
 */
static struct io_thread_req * (*io_req_buffer)[];
static struct io_thread_req *io_remainder;
static int io_remainder_size;
8062306a36Sopenharmony_ci
8162306a36Sopenharmony_ci
8262306a36Sopenharmony_ci
/*
 * Test bit number @bit in the byte array @data.
 *
 * Bits are numbered from the least significant bit of data[0] upwards.
 * Returns 1 if the bit is set and 0 if it is clear.
 */
static inline int ubd_test_bit(__u64 bit, unsigned char *data)
{
	int width = sizeof(data[0]) * 8;
	__u64 index = bit / width;
	int shift = bit % width;

	if (data[index] & (1 << shift))
		return 1;
	return 0;
}
9362306a36Sopenharmony_ci
/*
 * Set bit number @bit in the byte array @data.
 *
 * Uses the same numbering as ubd_test_bit(): bit 0 is the least
 * significant bit of data[0].  All other bits are left untouched.
 */
static inline void ubd_set_bit(__u64 bit, unsigned char *data)
{
	int width = sizeof(data[0]) * 8;
	__u64 index = bit / width;
	int shift = bit % width;

	data[index] = data[index] | (1 << shift);
}
10462306a36Sopenharmony_ci/*End stuff from ubd_user.h*/
10562306a36Sopenharmony_ci
10662306a36Sopenharmony_ci#define DRIVER_NAME "uml-blkdev"
10762306a36Sopenharmony_ci
10862306a36Sopenharmony_cistatic DEFINE_MUTEX(ubd_lock);
10962306a36Sopenharmony_cistatic DEFINE_MUTEX(ubd_mutex); /* replaces BKL, might not be needed */
11062306a36Sopenharmony_ci
11162306a36Sopenharmony_cistatic int ubd_open(struct gendisk *disk, blk_mode_t mode);
11262306a36Sopenharmony_cistatic void ubd_release(struct gendisk *disk);
11362306a36Sopenharmony_cistatic int ubd_ioctl(struct block_device *bdev, blk_mode_t mode,
11462306a36Sopenharmony_ci		     unsigned int cmd, unsigned long arg);
11562306a36Sopenharmony_cistatic int ubd_getgeo(struct block_device *bdev, struct hd_geometry *geo);
11662306a36Sopenharmony_ci
11762306a36Sopenharmony_ci#define MAX_DEV (16)
11862306a36Sopenharmony_ci
11962306a36Sopenharmony_cistatic const struct block_device_operations ubd_blops = {
12062306a36Sopenharmony_ci        .owner		= THIS_MODULE,
12162306a36Sopenharmony_ci        .open		= ubd_open,
12262306a36Sopenharmony_ci        .release	= ubd_release,
12362306a36Sopenharmony_ci        .ioctl		= ubd_ioctl,
12462306a36Sopenharmony_ci        .compat_ioctl	= blkdev_compat_ptr_ioctl,
12562306a36Sopenharmony_ci	.getgeo		= ubd_getgeo,
12662306a36Sopenharmony_ci};
12762306a36Sopenharmony_ci
12862306a36Sopenharmony_ci/* Protected by ubd_lock */
12962306a36Sopenharmony_cistatic struct gendisk *ubd_gendisk[MAX_DEV];
13062306a36Sopenharmony_ci
13162306a36Sopenharmony_ci#ifdef CONFIG_BLK_DEV_UBD_SYNC
13262306a36Sopenharmony_ci#define OPEN_FLAGS ((struct openflags) { .r = 1, .w = 1, .s = 1, .c = 0, \
13362306a36Sopenharmony_ci					 .cl = 1 })
13462306a36Sopenharmony_ci#else
13562306a36Sopenharmony_ci#define OPEN_FLAGS ((struct openflags) { .r = 1, .w = 1, .s = 0, .c = 0, \
13662306a36Sopenharmony_ci					 .cl = 1 })
13762306a36Sopenharmony_ci#endif
13862306a36Sopenharmony_cistatic struct openflags global_openflags = OPEN_FLAGS;
13962306a36Sopenharmony_ci
/* Per-device copy-on-write state: the backing file and the COW bitmap. */
struct cow {
	char *file;			/* backing file name */
	int fd;				/* backing file fd */
	unsigned long *bitmap;
	unsigned long bitmap_len;
	int bitmap_offset;
	int data_offset;
};
15062306a36Sopenharmony_ci
15162306a36Sopenharmony_ci#define MAX_SG 64
15262306a36Sopenharmony_ci
15362306a36Sopenharmony_cistruct ubd {
15462306a36Sopenharmony_ci	/* name (and fd, below) of the file opened for writing, either the
15562306a36Sopenharmony_ci	 * backing or the cow file. */
15662306a36Sopenharmony_ci	char *file;
15762306a36Sopenharmony_ci	char *serial;
15862306a36Sopenharmony_ci	int count;
15962306a36Sopenharmony_ci	int fd;
16062306a36Sopenharmony_ci	__u64 size;
16162306a36Sopenharmony_ci	struct openflags boot_openflags;
16262306a36Sopenharmony_ci	struct openflags openflags;
16362306a36Sopenharmony_ci	unsigned shared:1;
16462306a36Sopenharmony_ci	unsigned no_cow:1;
16562306a36Sopenharmony_ci	unsigned no_trim:1;
16662306a36Sopenharmony_ci	struct cow cow;
16762306a36Sopenharmony_ci	struct platform_device pdev;
16862306a36Sopenharmony_ci	struct request_queue *queue;
16962306a36Sopenharmony_ci	struct blk_mq_tag_set tag_set;
17062306a36Sopenharmony_ci	spinlock_t lock;
17162306a36Sopenharmony_ci};
17262306a36Sopenharmony_ci
/*
 * Initialiser for an unused struct cow: no file, no fd, no bitmap.
 * Members not named here (bitmap_len) are zero-initialised by the compiler.
 */
#define DEFAULT_COW {				\
	.file		= NULL,			\
	.fd		= -1,			\
	.bitmap		= NULL,			\
	.bitmap_offset	= 0,			\
	.data_offset	= 0,			\
}
18062306a36Sopenharmony_ci
/*
 * Initialiser for an unconfigured device slot: no file, no serial, fd of -1,
 * size of -1 (all bits set in the __u64), default open flags and all
 * single-bit flags cleared.  Entries are listed in struct ubd member order.
 */
#define DEFAULT_UBD {							\
	.file		= NULL,						\
	.serial		= NULL,						\
	.count		= 0,						\
	.fd		= -1,						\
	.size		= -1,						\
	.boot_openflags	= OPEN_FLAGS,					\
	.openflags	= OPEN_FLAGS,					\
	.shared		= 0,						\
	.no_cow		= 0,						\
	.no_trim	= 0,						\
	.cow		= DEFAULT_COW,					\
	.lock		= __SPIN_LOCK_UNLOCKED(ubd_devs.lock),		\
}
19562306a36Sopenharmony_ci
19662306a36Sopenharmony_ci/* Protected by ubd_lock */
19762306a36Sopenharmony_cistatic struct ubd ubd_devs[MAX_DEV] = { [0 ... MAX_DEV - 1] = DEFAULT_UBD };
19862306a36Sopenharmony_ci
19962306a36Sopenharmony_cistatic blk_status_t ubd_queue_rq(struct blk_mq_hw_ctx *hctx,
20062306a36Sopenharmony_ci				 const struct blk_mq_queue_data *bd);
20162306a36Sopenharmony_ci
20262306a36Sopenharmony_cistatic int fake_ide_setup(char *str)
20362306a36Sopenharmony_ci{
20462306a36Sopenharmony_ci	pr_warn("The fake_ide option has been removed\n");
20562306a36Sopenharmony_ci	return 1;
20662306a36Sopenharmony_ci}
20762306a36Sopenharmony_ci__setup("fake_ide", fake_ide_setup);
20862306a36Sopenharmony_ci
20962306a36Sopenharmony_ci__uml_help(fake_ide_setup,
21062306a36Sopenharmony_ci"fake_ide\n"
21162306a36Sopenharmony_ci"    Obsolete stub.\n\n"
21262306a36Sopenharmony_ci);
21362306a36Sopenharmony_ci
/*
 * Parse a device unit from the start of the string at *ptr.
 *
 * Two spellings are accepted: a number (handed to simple_strtoul() with
 * base 0) or a single lower-case letter, where 'a' is unit 0, 'b' is unit 1
 * and so on.  On success *ptr is advanced past the consumed characters.
 *
 * Returns the unit number, or -1 (leaving *ptr alone) if the string starts
 * with neither a digit nor a lower-case letter.
 */
static int parse_unit(char **ptr)
{
	char *cur = *ptr;
	char *after;
	int unit;

	if (isdigit(*cur)) {
		unit = simple_strtoul(cur, &after, 0);
		if (after == cur)
			return -1;
		*ptr = after;
		return unit;
	}

	if (*cur >= 'a' && *cur <= 'z') {
		unit = *cur - 'a';
		*ptr = cur + 1;
		return unit;
	}

	return -1;
}
23262306a36Sopenharmony_ci
23362306a36Sopenharmony_ci/* If *index_out == -1 at exit, the passed option was a general one;
23462306a36Sopenharmony_ci * otherwise, the str pointer is used (and owned) inside ubd_devs array, so it
23562306a36Sopenharmony_ci * should not be freed on exit.
23662306a36Sopenharmony_ci */
23762306a36Sopenharmony_cistatic int ubd_setup_common(char *str, int *index_out, char **error_out)
23862306a36Sopenharmony_ci{
23962306a36Sopenharmony_ci	struct ubd *ubd_dev;
24062306a36Sopenharmony_ci	struct openflags flags = global_openflags;
24162306a36Sopenharmony_ci	char *file, *backing_file, *serial;
24262306a36Sopenharmony_ci	int n, err = 0, i;
24362306a36Sopenharmony_ci
24462306a36Sopenharmony_ci	if(index_out) *index_out = -1;
24562306a36Sopenharmony_ci	n = *str;
24662306a36Sopenharmony_ci	if(n == '='){
24762306a36Sopenharmony_ci		str++;
24862306a36Sopenharmony_ci		if(!strcmp(str, "sync")){
24962306a36Sopenharmony_ci			global_openflags = of_sync(global_openflags);
25062306a36Sopenharmony_ci			return err;
25162306a36Sopenharmony_ci		}
25262306a36Sopenharmony_ci
25362306a36Sopenharmony_ci		pr_warn("fake major not supported any more\n");
25462306a36Sopenharmony_ci		return 0;
25562306a36Sopenharmony_ci	}
25662306a36Sopenharmony_ci
25762306a36Sopenharmony_ci	n = parse_unit(&str);
25862306a36Sopenharmony_ci	if(n < 0){
25962306a36Sopenharmony_ci		*error_out = "Couldn't parse device number";
26062306a36Sopenharmony_ci		return -EINVAL;
26162306a36Sopenharmony_ci	}
26262306a36Sopenharmony_ci	if(n >= MAX_DEV){
26362306a36Sopenharmony_ci		*error_out = "Device number out of range";
26462306a36Sopenharmony_ci		return 1;
26562306a36Sopenharmony_ci	}
26662306a36Sopenharmony_ci
26762306a36Sopenharmony_ci	err = -EBUSY;
26862306a36Sopenharmony_ci	mutex_lock(&ubd_lock);
26962306a36Sopenharmony_ci
27062306a36Sopenharmony_ci	ubd_dev = &ubd_devs[n];
27162306a36Sopenharmony_ci	if(ubd_dev->file != NULL){
27262306a36Sopenharmony_ci		*error_out = "Device is already configured";
27362306a36Sopenharmony_ci		goto out;
27462306a36Sopenharmony_ci	}
27562306a36Sopenharmony_ci
27662306a36Sopenharmony_ci	if (index_out)
27762306a36Sopenharmony_ci		*index_out = n;
27862306a36Sopenharmony_ci
27962306a36Sopenharmony_ci	err = -EINVAL;
28062306a36Sopenharmony_ci	for (i = 0; i < sizeof("rscdt="); i++) {
28162306a36Sopenharmony_ci		switch (*str) {
28262306a36Sopenharmony_ci		case 'r':
28362306a36Sopenharmony_ci			flags.w = 0;
28462306a36Sopenharmony_ci			break;
28562306a36Sopenharmony_ci		case 's':
28662306a36Sopenharmony_ci			flags.s = 1;
28762306a36Sopenharmony_ci			break;
28862306a36Sopenharmony_ci		case 'd':
28962306a36Sopenharmony_ci			ubd_dev->no_cow = 1;
29062306a36Sopenharmony_ci			break;
29162306a36Sopenharmony_ci		case 'c':
29262306a36Sopenharmony_ci			ubd_dev->shared = 1;
29362306a36Sopenharmony_ci			break;
29462306a36Sopenharmony_ci		case 't':
29562306a36Sopenharmony_ci			ubd_dev->no_trim = 1;
29662306a36Sopenharmony_ci			break;
29762306a36Sopenharmony_ci		case '=':
29862306a36Sopenharmony_ci			str++;
29962306a36Sopenharmony_ci			goto break_loop;
30062306a36Sopenharmony_ci		default:
30162306a36Sopenharmony_ci			*error_out = "Expected '=' or flag letter "
30262306a36Sopenharmony_ci				"(r, s, c, t or d)";
30362306a36Sopenharmony_ci			goto out;
30462306a36Sopenharmony_ci		}
30562306a36Sopenharmony_ci		str++;
30662306a36Sopenharmony_ci	}
30762306a36Sopenharmony_ci
30862306a36Sopenharmony_ci	if (*str == '=')
30962306a36Sopenharmony_ci		*error_out = "Too many flags specified";
31062306a36Sopenharmony_ci	else
31162306a36Sopenharmony_ci		*error_out = "Missing '='";
31262306a36Sopenharmony_ci	goto out;
31362306a36Sopenharmony_ci
31462306a36Sopenharmony_cibreak_loop:
31562306a36Sopenharmony_ci	file = strsep(&str, ",:");
31662306a36Sopenharmony_ci	if (*file == '\0')
31762306a36Sopenharmony_ci		file = NULL;
31862306a36Sopenharmony_ci
31962306a36Sopenharmony_ci	backing_file = strsep(&str, ",:");
32062306a36Sopenharmony_ci	if (backing_file && *backing_file == '\0')
32162306a36Sopenharmony_ci		backing_file = NULL;
32262306a36Sopenharmony_ci
32362306a36Sopenharmony_ci	serial = strsep(&str, ",:");
32462306a36Sopenharmony_ci	if (serial && *serial == '\0')
32562306a36Sopenharmony_ci		serial = NULL;
32662306a36Sopenharmony_ci
32762306a36Sopenharmony_ci	if (backing_file && ubd_dev->no_cow) {
32862306a36Sopenharmony_ci		*error_out = "Can't specify both 'd' and a cow file";
32962306a36Sopenharmony_ci		goto out;
33062306a36Sopenharmony_ci	}
33162306a36Sopenharmony_ci
33262306a36Sopenharmony_ci	err = 0;
33362306a36Sopenharmony_ci	ubd_dev->file = file;
33462306a36Sopenharmony_ci	ubd_dev->cow.file = backing_file;
33562306a36Sopenharmony_ci	ubd_dev->serial = serial;
33662306a36Sopenharmony_ci	ubd_dev->boot_openflags = flags;
33762306a36Sopenharmony_ciout:
33862306a36Sopenharmony_ci	mutex_unlock(&ubd_lock);
33962306a36Sopenharmony_ci	return err;
34062306a36Sopenharmony_ci}
34162306a36Sopenharmony_ci
34262306a36Sopenharmony_cistatic int ubd_setup(char *str)
34362306a36Sopenharmony_ci{
34462306a36Sopenharmony_ci	char *error;
34562306a36Sopenharmony_ci	int err;
34662306a36Sopenharmony_ci
34762306a36Sopenharmony_ci	err = ubd_setup_common(str, NULL, &error);
34862306a36Sopenharmony_ci	if(err)
34962306a36Sopenharmony_ci		printk(KERN_ERR "Failed to initialize device with \"%s\" : "
35062306a36Sopenharmony_ci		       "%s\n", str, error);
35162306a36Sopenharmony_ci	return 1;
35262306a36Sopenharmony_ci}
35362306a36Sopenharmony_ci
35462306a36Sopenharmony_ci__setup("ubd", ubd_setup);
35562306a36Sopenharmony_ci__uml_help(ubd_setup,
35662306a36Sopenharmony_ci"ubd<n><flags>=<filename>[(:|,)<filename2>][(:|,)<serial>]\n"
35762306a36Sopenharmony_ci"    This is used to associate a device with a file in the underlying\n"
35862306a36Sopenharmony_ci"    filesystem. When specifying two filenames, the first one is the\n"
35962306a36Sopenharmony_ci"    COW name and the second is the backing file name. As separator you can\n"
36062306a36Sopenharmony_ci"    use either a ':' or a ',': the first one allows writing things like;\n"
36162306a36Sopenharmony_ci"	ubd0=~/Uml/root_cow:~/Uml/root_backing_file\n"
36262306a36Sopenharmony_ci"    while with a ',' the shell would not expand the 2nd '~'.\n"
36362306a36Sopenharmony_ci"    When using only one filename, UML will detect whether to treat it like\n"
36462306a36Sopenharmony_ci"    a COW file or a backing file. To override this detection, add the 'd'\n"
36562306a36Sopenharmony_ci"    flag:\n"
36662306a36Sopenharmony_ci"	ubd0d=BackingFile\n"
36762306a36Sopenharmony_ci"    Usually, there is a filesystem in the file, but \n"
36862306a36Sopenharmony_ci"    that's not required. Swap devices containing swap files can be\n"
36962306a36Sopenharmony_ci"    specified like this. Also, a file which doesn't contain a\n"
37062306a36Sopenharmony_ci"    filesystem can have its contents read in the virtual \n"
37162306a36Sopenharmony_ci"    machine by running 'dd' on the device. <n> must be in the range\n"
37262306a36Sopenharmony_ci"    0 to 7. Appending an 'r' to the number will cause that device\n"
37362306a36Sopenharmony_ci"    to be mounted read-only. For example ubd1r=./ext_fs. Appending\n"
37462306a36Sopenharmony_ci"    an 's' will cause data to be written to disk on the host immediately.\n"
37562306a36Sopenharmony_ci"    'c' will cause the device to be treated as being shared between multiple\n"
37662306a36Sopenharmony_ci"    UMLs and file locking will be turned off - this is appropriate for a\n"
37762306a36Sopenharmony_ci"    cluster filesystem and inappropriate at almost all other times.\n\n"
37862306a36Sopenharmony_ci"    't' will disable trim/discard support on the device (enabled by default).\n\n"
37962306a36Sopenharmony_ci"    An optional device serial number can be exposed using the serial parameter\n"
38062306a36Sopenharmony_ci"    on the cmdline which is exposed as a sysfs entry. This is particularly\n"
38162306a36Sopenharmony_ci"    useful when a unique number should be given to the device. Note when\n"
38262306a36Sopenharmony_ci"    specifying a label, the filename2 must be also presented. It can be\n"
38362306a36Sopenharmony_ci"    an empty string, in which case the backing file is not used:\n"
38462306a36Sopenharmony_ci"       ubd0=File,,Serial\n"
38562306a36Sopenharmony_ci);
38662306a36Sopenharmony_ci
38762306a36Sopenharmony_cistatic int udb_setup(char *str)
38862306a36Sopenharmony_ci{
38962306a36Sopenharmony_ci	printk("udb%s specified on command line is almost certainly a ubd -> "
39062306a36Sopenharmony_ci	       "udb TYPO\n", str);
39162306a36Sopenharmony_ci	return 1;
39262306a36Sopenharmony_ci}
39362306a36Sopenharmony_ci
39462306a36Sopenharmony_ci__setup("udb", udb_setup);
39562306a36Sopenharmony_ci__uml_help(udb_setup,
39662306a36Sopenharmony_ci"udb\n"
39762306a36Sopenharmony_ci"    This option is here solely to catch ubd -> udb typos, which can be\n"
39862306a36Sopenharmony_ci"    to impossible to catch visually unless you specifically look for\n"
39962306a36Sopenharmony_ci"    them.  The only result of any option starting with 'udb' is an error\n"
40062306a36Sopenharmony_ci"    in the boot output.\n\n"
40162306a36Sopenharmony_ci);
40262306a36Sopenharmony_ci
/*
 * Descriptor that ubd_handler() reads completed request pointers from.
 * Only changed by ubd_init, which is an initcall.
 */
static int thread_fd = -1;
40562306a36Sopenharmony_ci
/*
 * Read several request pointers at a time from @fd, handling fractional
 * reads if (and as) needed.
 *
 * @request_buffer: destination array with room for @max_recs pointers.
 * @remainder:      storage, one pointer in size, for the bytes of a pointer
 *                  that was only partially received.
 * @remainder_size: number of valid bytes at @remainder; updated on every
 *                  successful read.
 * @max_recs:       capacity of @request_buffer in pointers.
 *
 * Bytes saved by a previous call are placed at the start of the buffer
 * before the new data.  After a successful read *remainder_size is always
 * brought up to date - in particular it goes back to 0 once the saved bytes
 * have been completed, so that they are not prepended a second time.
 *
 * Returns the number of bytes in @request_buffer that form complete
 * pointers, or the result of os_read_file() unchanged if that was <= 0 (in
 * which case the saved remainder is left as it was).
 */
static int bulk_req_safe_read(
	int fd,
	struct io_thread_req * (*request_buffer)[],
	struct io_thread_req **remainder,
	int *remainder_size,
	int max_recs
	)
{
	char *buf = (char *) request_buffer;
	int n = 0;
	int res;

	if (*remainder_size > 0) {
		memmove(buf, (char *) remainder, *remainder_size);
		n = *remainder_size;
	}

	res = os_read_file(
			fd,
			buf + *remainder_size,
			sizeof(struct io_thread_req *)*max_recs
				- *remainder_size
		);
	if (res <= 0)
		return res;

	n += res;
	*remainder_size = n % sizeof(struct io_thread_req *);
	if (*remainder_size > 0) {
		/*
		 * Read somehow returned not a multiple of the pointer size;
		 * theoretically possible, but never observed in the wild,
		 * so the read routine must be able to handle it.
		 */
		WARN(1, "UBD IPC read returned a partial result");
		n -= *remainder_size;
		/* Stash the incomplete tail for the next call. */
		memmove(remainder, buf + n, *remainder_size);
	}
	return n;
}
45862306a36Sopenharmony_ci
45962306a36Sopenharmony_ci/* Called without dev->lock held, and only in interrupt context. */
46062306a36Sopenharmony_cistatic void ubd_handler(void)
46162306a36Sopenharmony_ci{
46262306a36Sopenharmony_ci	int n;
46362306a36Sopenharmony_ci	int count;
46462306a36Sopenharmony_ci
46562306a36Sopenharmony_ci	while(1){
46662306a36Sopenharmony_ci		n = bulk_req_safe_read(
46762306a36Sopenharmony_ci			thread_fd,
46862306a36Sopenharmony_ci			irq_req_buffer,
46962306a36Sopenharmony_ci			&irq_remainder,
47062306a36Sopenharmony_ci			&irq_remainder_size,
47162306a36Sopenharmony_ci			UBD_REQ_BUFFER_SIZE
47262306a36Sopenharmony_ci		);
47362306a36Sopenharmony_ci		if (n < 0) {
47462306a36Sopenharmony_ci			if(n == -EAGAIN)
47562306a36Sopenharmony_ci				break;
47662306a36Sopenharmony_ci			printk(KERN_ERR "spurious interrupt in ubd_handler, "
47762306a36Sopenharmony_ci			       "err = %d\n", -n);
47862306a36Sopenharmony_ci			return;
47962306a36Sopenharmony_ci		}
48062306a36Sopenharmony_ci		for (count = 0; count < n/sizeof(struct io_thread_req *); count++) {
48162306a36Sopenharmony_ci			struct io_thread_req *io_req = (*irq_req_buffer)[count];
48262306a36Sopenharmony_ci
48362306a36Sopenharmony_ci			if ((io_req->error == BLK_STS_NOTSUPP) && (req_op(io_req->req) == REQ_OP_DISCARD)) {
48462306a36Sopenharmony_ci				blk_queue_max_discard_sectors(io_req->req->q, 0);
48562306a36Sopenharmony_ci				blk_queue_max_write_zeroes_sectors(io_req->req->q, 0);
48662306a36Sopenharmony_ci			}
48762306a36Sopenharmony_ci			blk_mq_end_request(io_req->req, io_req->error);
48862306a36Sopenharmony_ci			kfree(io_req);
48962306a36Sopenharmony_ci		}
49062306a36Sopenharmony_ci	}
49162306a36Sopenharmony_ci}
49262306a36Sopenharmony_ci
49362306a36Sopenharmony_cistatic irqreturn_t ubd_intr(int irq, void *dev)
49462306a36Sopenharmony_ci{
49562306a36Sopenharmony_ci	ubd_handler();
49662306a36Sopenharmony_ci	return IRQ_HANDLED;
49762306a36Sopenharmony_ci}
49862306a36Sopenharmony_ci
/*
 * Pid passed to os_kill_process() at exit; -1 means there is nothing to
 * kill.  Only changed by ubd_init, which is an initcall.
 */
static int io_pid = -1;

/* Exit hook: kill the process recorded in io_pid, if there is one. */
static void kill_io_thread(void)
{
	if (io_pid == -1)
		return;

	os_kill_process(io_pid, 1);
}

__uml_exitcall(kill_io_thread);
50962306a36Sopenharmony_ci
51062306a36Sopenharmony_cistatic inline int ubd_file_size(struct ubd *ubd_dev, __u64 *size_out)
51162306a36Sopenharmony_ci{
51262306a36Sopenharmony_ci	char *file;
51362306a36Sopenharmony_ci	int fd;
51462306a36Sopenharmony_ci	int err;
51562306a36Sopenharmony_ci
51662306a36Sopenharmony_ci	__u32 version;
51762306a36Sopenharmony_ci	__u32 align;
51862306a36Sopenharmony_ci	char *backing_file;
51962306a36Sopenharmony_ci	time64_t mtime;
52062306a36Sopenharmony_ci	unsigned long long size;
52162306a36Sopenharmony_ci	int sector_size;
52262306a36Sopenharmony_ci	int bitmap_offset;
52362306a36Sopenharmony_ci
52462306a36Sopenharmony_ci	if (ubd_dev->file && ubd_dev->cow.file) {
52562306a36Sopenharmony_ci		file = ubd_dev->cow.file;
52662306a36Sopenharmony_ci
52762306a36Sopenharmony_ci		goto out;
52862306a36Sopenharmony_ci	}
52962306a36Sopenharmony_ci
53062306a36Sopenharmony_ci	fd = os_open_file(ubd_dev->file, of_read(OPENFLAGS()), 0);
53162306a36Sopenharmony_ci	if (fd < 0)
53262306a36Sopenharmony_ci		return fd;
53362306a36Sopenharmony_ci
53462306a36Sopenharmony_ci	err = read_cow_header(file_reader, &fd, &version, &backing_file, \
53562306a36Sopenharmony_ci		&mtime, &size, &sector_size, &align, &bitmap_offset);
53662306a36Sopenharmony_ci	os_close_file(fd);
53762306a36Sopenharmony_ci
53862306a36Sopenharmony_ci	if(err == -EINVAL)
53962306a36Sopenharmony_ci		file = ubd_dev->file;
54062306a36Sopenharmony_ci	else
54162306a36Sopenharmony_ci		file = backing_file;
54262306a36Sopenharmony_ci
54362306a36Sopenharmony_ciout:
54462306a36Sopenharmony_ci	return os_file_size(file, size_out);
54562306a36Sopenharmony_ci}
54662306a36Sopenharmony_ci
/*
 * Read @len bytes at @offset of @fd into @buf with os_pread_file().
 *
 * Returns 0 unless os_pread_file() returns a negative value, which is then
 * passed back unchanged.
 */
static int read_cow_bitmap(int fd, void *buf, int offset, int len)
{
	int ret = os_pread_file(fd, buf, len, offset);

	return ret < 0 ? ret : 0;
}
55762306a36Sopenharmony_ci
55862306a36Sopenharmony_cistatic int backing_file_mismatch(char *file, __u64 size, time64_t mtime)
55962306a36Sopenharmony_ci{
56062306a36Sopenharmony_ci	time64_t modtime;
56162306a36Sopenharmony_ci	unsigned long long actual;
56262306a36Sopenharmony_ci	int err;
56362306a36Sopenharmony_ci
56462306a36Sopenharmony_ci	err = os_file_modtime(file, &modtime);
56562306a36Sopenharmony_ci	if (err < 0) {
56662306a36Sopenharmony_ci		printk(KERN_ERR "Failed to get modification time of backing "
56762306a36Sopenharmony_ci		       "file \"%s\", err = %d\n", file, -err);
56862306a36Sopenharmony_ci		return err;
56962306a36Sopenharmony_ci	}
57062306a36Sopenharmony_ci
57162306a36Sopenharmony_ci	err = os_file_size(file, &actual);
57262306a36Sopenharmony_ci	if (err < 0) {
57362306a36Sopenharmony_ci		printk(KERN_ERR "Failed to get size of backing file \"%s\", "
57462306a36Sopenharmony_ci		       "err = %d\n", file, -err);
57562306a36Sopenharmony_ci		return err;
57662306a36Sopenharmony_ci	}
57762306a36Sopenharmony_ci
57862306a36Sopenharmony_ci	if (actual != size) {
57962306a36Sopenharmony_ci		/*__u64 can be a long on AMD64 and with %lu GCC complains; so
58062306a36Sopenharmony_ci		 * the typecast.*/
58162306a36Sopenharmony_ci		printk(KERN_ERR "Size mismatch (%llu vs %llu) of COW header "
58262306a36Sopenharmony_ci		       "vs backing file\n", (unsigned long long) size, actual);
58362306a36Sopenharmony_ci		return -EINVAL;
58462306a36Sopenharmony_ci	}
58562306a36Sopenharmony_ci	if (modtime != mtime) {
58662306a36Sopenharmony_ci		printk(KERN_ERR "mtime mismatch (%lld vs %lld) of COW header vs "
58762306a36Sopenharmony_ci		       "backing file\n", mtime, modtime);
58862306a36Sopenharmony_ci		return -EINVAL;
58962306a36Sopenharmony_ci	}
59062306a36Sopenharmony_ci	return 0;
59162306a36Sopenharmony_ci}
59262306a36Sopenharmony_ci
59362306a36Sopenharmony_cistatic int path_requires_switch(char *from_cmdline, char *from_cow, char *cow)
59462306a36Sopenharmony_ci{
59562306a36Sopenharmony_ci	struct uml_stat buf1, buf2;
59662306a36Sopenharmony_ci	int err;
59762306a36Sopenharmony_ci
59862306a36Sopenharmony_ci	if (from_cmdline == NULL)
59962306a36Sopenharmony_ci		return 0;
60062306a36Sopenharmony_ci	if (!strcmp(from_cmdline, from_cow))
60162306a36Sopenharmony_ci		return 0;
60262306a36Sopenharmony_ci
60362306a36Sopenharmony_ci	err = os_stat_file(from_cmdline, &buf1);
60462306a36Sopenharmony_ci	if (err < 0) {
60562306a36Sopenharmony_ci		printk(KERN_ERR "Couldn't stat '%s', err = %d\n", from_cmdline,
60662306a36Sopenharmony_ci		       -err);
60762306a36Sopenharmony_ci		return 0;
60862306a36Sopenharmony_ci	}
60962306a36Sopenharmony_ci	err = os_stat_file(from_cow, &buf2);
61062306a36Sopenharmony_ci	if (err < 0) {
61162306a36Sopenharmony_ci		printk(KERN_ERR "Couldn't stat '%s', err = %d\n", from_cow,
61262306a36Sopenharmony_ci		       -err);
61362306a36Sopenharmony_ci		return 1;
61462306a36Sopenharmony_ci	}
61562306a36Sopenharmony_ci	if ((buf1.ust_dev == buf2.ust_dev) && (buf1.ust_ino == buf2.ust_ino))
61662306a36Sopenharmony_ci		return 0;
61762306a36Sopenharmony_ci
61862306a36Sopenharmony_ci	printk(KERN_ERR "Backing file mismatch - \"%s\" requested, "
61962306a36Sopenharmony_ci	       "\"%s\" specified in COW header of \"%s\"\n",
62062306a36Sopenharmony_ci	       from_cmdline, from_cow, cow);
62162306a36Sopenharmony_ci	return 1;
62262306a36Sopenharmony_ci}
62362306a36Sopenharmony_ci
62462306a36Sopenharmony_cistatic int open_ubd_file(char *file, struct openflags *openflags, int shared,
62562306a36Sopenharmony_ci		  char **backing_file_out, int *bitmap_offset_out,
62662306a36Sopenharmony_ci		  unsigned long *bitmap_len_out, int *data_offset_out,
62762306a36Sopenharmony_ci		  int *create_cow_out)
62862306a36Sopenharmony_ci{
62962306a36Sopenharmony_ci	time64_t mtime;
63062306a36Sopenharmony_ci	unsigned long long size;
63162306a36Sopenharmony_ci	__u32 version, align;
63262306a36Sopenharmony_ci	char *backing_file;
63362306a36Sopenharmony_ci	int fd, err, sectorsize, asked_switch, mode = 0644;
63462306a36Sopenharmony_ci
63562306a36Sopenharmony_ci	fd = os_open_file(file, *openflags, mode);
63662306a36Sopenharmony_ci	if (fd < 0) {
63762306a36Sopenharmony_ci		if ((fd == -ENOENT) && (create_cow_out != NULL))
63862306a36Sopenharmony_ci			*create_cow_out = 1;
63962306a36Sopenharmony_ci		if (!openflags->w ||
64062306a36Sopenharmony_ci		    ((fd != -EROFS) && (fd != -EACCES)))
64162306a36Sopenharmony_ci			return fd;
64262306a36Sopenharmony_ci		openflags->w = 0;
64362306a36Sopenharmony_ci		fd = os_open_file(file, *openflags, mode);
64462306a36Sopenharmony_ci		if (fd < 0)
64562306a36Sopenharmony_ci			return fd;
64662306a36Sopenharmony_ci	}
64762306a36Sopenharmony_ci
64862306a36Sopenharmony_ci	if (shared)
64962306a36Sopenharmony_ci		printk(KERN_INFO "Not locking \"%s\" on the host\n", file);
65062306a36Sopenharmony_ci	else {
65162306a36Sopenharmony_ci		err = os_lock_file(fd, openflags->w);
65262306a36Sopenharmony_ci		if (err < 0) {
65362306a36Sopenharmony_ci			printk(KERN_ERR "Failed to lock '%s', err = %d\n",
65462306a36Sopenharmony_ci			       file, -err);
65562306a36Sopenharmony_ci			goto out_close;
65662306a36Sopenharmony_ci		}
65762306a36Sopenharmony_ci	}
65862306a36Sopenharmony_ci
65962306a36Sopenharmony_ci	/* Successful return case! */
66062306a36Sopenharmony_ci	if (backing_file_out == NULL)
66162306a36Sopenharmony_ci		return fd;
66262306a36Sopenharmony_ci
66362306a36Sopenharmony_ci	err = read_cow_header(file_reader, &fd, &version, &backing_file, &mtime,
66462306a36Sopenharmony_ci			      &size, &sectorsize, &align, bitmap_offset_out);
66562306a36Sopenharmony_ci	if (err && (*backing_file_out != NULL)) {
66662306a36Sopenharmony_ci		printk(KERN_ERR "Failed to read COW header from COW file "
66762306a36Sopenharmony_ci		       "\"%s\", errno = %d\n", file, -err);
66862306a36Sopenharmony_ci		goto out_close;
66962306a36Sopenharmony_ci	}
67062306a36Sopenharmony_ci	if (err)
67162306a36Sopenharmony_ci		return fd;
67262306a36Sopenharmony_ci
67362306a36Sopenharmony_ci	asked_switch = path_requires_switch(*backing_file_out, backing_file,
67462306a36Sopenharmony_ci					    file);
67562306a36Sopenharmony_ci
67662306a36Sopenharmony_ci	/* Allow switching only if no mismatch. */
67762306a36Sopenharmony_ci	if (asked_switch && !backing_file_mismatch(*backing_file_out, size,
67862306a36Sopenharmony_ci						   mtime)) {
67962306a36Sopenharmony_ci		printk(KERN_ERR "Switching backing file to '%s'\n",
68062306a36Sopenharmony_ci		       *backing_file_out);
68162306a36Sopenharmony_ci		err = write_cow_header(file, fd, *backing_file_out,
68262306a36Sopenharmony_ci				       sectorsize, align, &size);
68362306a36Sopenharmony_ci		if (err) {
68462306a36Sopenharmony_ci			printk(KERN_ERR "Switch failed, errno = %d\n", -err);
68562306a36Sopenharmony_ci			goto out_close;
68662306a36Sopenharmony_ci		}
68762306a36Sopenharmony_ci	} else {
68862306a36Sopenharmony_ci		*backing_file_out = backing_file;
68962306a36Sopenharmony_ci		err = backing_file_mismatch(*backing_file_out, size, mtime);
69062306a36Sopenharmony_ci		if (err)
69162306a36Sopenharmony_ci			goto out_close;
69262306a36Sopenharmony_ci	}
69362306a36Sopenharmony_ci
69462306a36Sopenharmony_ci	cow_sizes(version, size, sectorsize, align, *bitmap_offset_out,
69562306a36Sopenharmony_ci		  bitmap_len_out, data_offset_out);
69662306a36Sopenharmony_ci
69762306a36Sopenharmony_ci	return fd;
69862306a36Sopenharmony_ci out_close:
69962306a36Sopenharmony_ci	os_close_file(fd);
70062306a36Sopenharmony_ci	return err;
70162306a36Sopenharmony_ci}
70262306a36Sopenharmony_ci
70362306a36Sopenharmony_cistatic int create_cow_file(char *cow_file, char *backing_file,
70462306a36Sopenharmony_ci		    struct openflags flags,
70562306a36Sopenharmony_ci		    int sectorsize, int alignment, int *bitmap_offset_out,
70662306a36Sopenharmony_ci		    unsigned long *bitmap_len_out, int *data_offset_out)
70762306a36Sopenharmony_ci{
70862306a36Sopenharmony_ci	int err, fd;
70962306a36Sopenharmony_ci
71062306a36Sopenharmony_ci	flags.c = 1;
71162306a36Sopenharmony_ci	fd = open_ubd_file(cow_file, &flags, 0, NULL, NULL, NULL, NULL, NULL);
71262306a36Sopenharmony_ci	if (fd < 0) {
71362306a36Sopenharmony_ci		err = fd;
71462306a36Sopenharmony_ci		printk(KERN_ERR "Open of COW file '%s' failed, errno = %d\n",
71562306a36Sopenharmony_ci		       cow_file, -err);
71662306a36Sopenharmony_ci		goto out;
71762306a36Sopenharmony_ci	}
71862306a36Sopenharmony_ci
71962306a36Sopenharmony_ci	err = init_cow_file(fd, cow_file, backing_file, sectorsize, alignment,
72062306a36Sopenharmony_ci			    bitmap_offset_out, bitmap_len_out,
72162306a36Sopenharmony_ci			    data_offset_out);
72262306a36Sopenharmony_ci	if (!err)
72362306a36Sopenharmony_ci		return fd;
72462306a36Sopenharmony_ci	os_close_file(fd);
72562306a36Sopenharmony_ci out:
72662306a36Sopenharmony_ci	return err;
72762306a36Sopenharmony_ci}
72862306a36Sopenharmony_ci
72962306a36Sopenharmony_cistatic void ubd_close_dev(struct ubd *ubd_dev)
73062306a36Sopenharmony_ci{
73162306a36Sopenharmony_ci	os_close_file(ubd_dev->fd);
73262306a36Sopenharmony_ci	if(ubd_dev->cow.file == NULL)
73362306a36Sopenharmony_ci		return;
73462306a36Sopenharmony_ci
73562306a36Sopenharmony_ci	os_close_file(ubd_dev->cow.fd);
73662306a36Sopenharmony_ci	vfree(ubd_dev->cow.bitmap);
73762306a36Sopenharmony_ci	ubd_dev->cow.bitmap = NULL;
73862306a36Sopenharmony_ci}
73962306a36Sopenharmony_ci
74062306a36Sopenharmony_cistatic int ubd_open_dev(struct ubd *ubd_dev)
74162306a36Sopenharmony_ci{
74262306a36Sopenharmony_ci	struct openflags flags;
74362306a36Sopenharmony_ci	char **back_ptr;
74462306a36Sopenharmony_ci	int err, create_cow, *create_ptr;
74562306a36Sopenharmony_ci	int fd;
74662306a36Sopenharmony_ci
74762306a36Sopenharmony_ci	ubd_dev->openflags = ubd_dev->boot_openflags;
74862306a36Sopenharmony_ci	create_cow = 0;
74962306a36Sopenharmony_ci	create_ptr = (ubd_dev->cow.file != NULL) ? &create_cow : NULL;
75062306a36Sopenharmony_ci	back_ptr = ubd_dev->no_cow ? NULL : &ubd_dev->cow.file;
75162306a36Sopenharmony_ci
75262306a36Sopenharmony_ci	fd = open_ubd_file(ubd_dev->file, &ubd_dev->openflags, ubd_dev->shared,
75362306a36Sopenharmony_ci				back_ptr, &ubd_dev->cow.bitmap_offset,
75462306a36Sopenharmony_ci				&ubd_dev->cow.bitmap_len, &ubd_dev->cow.data_offset,
75562306a36Sopenharmony_ci				create_ptr);
75662306a36Sopenharmony_ci
75762306a36Sopenharmony_ci	if((fd == -ENOENT) && create_cow){
75862306a36Sopenharmony_ci		fd = create_cow_file(ubd_dev->file, ubd_dev->cow.file,
75962306a36Sopenharmony_ci					  ubd_dev->openflags, SECTOR_SIZE, PAGE_SIZE,
76062306a36Sopenharmony_ci					  &ubd_dev->cow.bitmap_offset,
76162306a36Sopenharmony_ci					  &ubd_dev->cow.bitmap_len,
76262306a36Sopenharmony_ci					  &ubd_dev->cow.data_offset);
76362306a36Sopenharmony_ci		if(fd >= 0){
76462306a36Sopenharmony_ci			printk(KERN_INFO "Creating \"%s\" as COW file for "
76562306a36Sopenharmony_ci			       "\"%s\"\n", ubd_dev->file, ubd_dev->cow.file);
76662306a36Sopenharmony_ci		}
76762306a36Sopenharmony_ci	}
76862306a36Sopenharmony_ci
76962306a36Sopenharmony_ci	if(fd < 0){
77062306a36Sopenharmony_ci		printk("Failed to open '%s', errno = %d\n", ubd_dev->file,
77162306a36Sopenharmony_ci		       -fd);
77262306a36Sopenharmony_ci		return fd;
77362306a36Sopenharmony_ci	}
77462306a36Sopenharmony_ci	ubd_dev->fd = fd;
77562306a36Sopenharmony_ci
77662306a36Sopenharmony_ci	if(ubd_dev->cow.file != NULL){
77762306a36Sopenharmony_ci		blk_queue_max_hw_sectors(ubd_dev->queue, 8 * sizeof(long));
77862306a36Sopenharmony_ci
77962306a36Sopenharmony_ci		err = -ENOMEM;
78062306a36Sopenharmony_ci		ubd_dev->cow.bitmap = vmalloc(ubd_dev->cow.bitmap_len);
78162306a36Sopenharmony_ci		if(ubd_dev->cow.bitmap == NULL){
78262306a36Sopenharmony_ci			printk(KERN_ERR "Failed to vmalloc COW bitmap\n");
78362306a36Sopenharmony_ci			goto error;
78462306a36Sopenharmony_ci		}
78562306a36Sopenharmony_ci		flush_tlb_kernel_vm();
78662306a36Sopenharmony_ci
78762306a36Sopenharmony_ci		err = read_cow_bitmap(ubd_dev->fd, ubd_dev->cow.bitmap,
78862306a36Sopenharmony_ci				      ubd_dev->cow.bitmap_offset,
78962306a36Sopenharmony_ci				      ubd_dev->cow.bitmap_len);
79062306a36Sopenharmony_ci		if(err < 0)
79162306a36Sopenharmony_ci			goto error;
79262306a36Sopenharmony_ci
79362306a36Sopenharmony_ci		flags = ubd_dev->openflags;
79462306a36Sopenharmony_ci		flags.w = 0;
79562306a36Sopenharmony_ci		err = open_ubd_file(ubd_dev->cow.file, &flags, ubd_dev->shared, NULL,
79662306a36Sopenharmony_ci				    NULL, NULL, NULL, NULL);
79762306a36Sopenharmony_ci		if(err < 0) goto error;
79862306a36Sopenharmony_ci		ubd_dev->cow.fd = err;
79962306a36Sopenharmony_ci	}
80062306a36Sopenharmony_ci	if (ubd_dev->no_trim == 0) {
80162306a36Sopenharmony_ci		ubd_dev->queue->limits.discard_granularity = SECTOR_SIZE;
80262306a36Sopenharmony_ci		blk_queue_max_discard_sectors(ubd_dev->queue, UBD_MAX_REQUEST);
80362306a36Sopenharmony_ci		blk_queue_max_write_zeroes_sectors(ubd_dev->queue, UBD_MAX_REQUEST);
80462306a36Sopenharmony_ci	}
80562306a36Sopenharmony_ci	blk_queue_flag_set(QUEUE_FLAG_NONROT, ubd_dev->queue);
80662306a36Sopenharmony_ci	return 0;
80762306a36Sopenharmony_ci error:
80862306a36Sopenharmony_ci	os_close_file(ubd_dev->fd);
80962306a36Sopenharmony_ci	return err;
81062306a36Sopenharmony_ci}
81162306a36Sopenharmony_ci
81262306a36Sopenharmony_cistatic void ubd_device_release(struct device *dev)
81362306a36Sopenharmony_ci{
81462306a36Sopenharmony_ci	struct ubd *ubd_dev = dev_get_drvdata(dev);
81562306a36Sopenharmony_ci
81662306a36Sopenharmony_ci	blk_mq_free_tag_set(&ubd_dev->tag_set);
81762306a36Sopenharmony_ci	*ubd_dev = ((struct ubd) DEFAULT_UBD);
81862306a36Sopenharmony_ci}
81962306a36Sopenharmony_ci
82062306a36Sopenharmony_cistatic ssize_t serial_show(struct device *dev,
82162306a36Sopenharmony_ci			   struct device_attribute *attr, char *buf)
82262306a36Sopenharmony_ci{
82362306a36Sopenharmony_ci	struct gendisk *disk = dev_to_disk(dev);
82462306a36Sopenharmony_ci	struct ubd *ubd_dev = disk->private_data;
82562306a36Sopenharmony_ci
82662306a36Sopenharmony_ci	if (!ubd_dev)
82762306a36Sopenharmony_ci		return 0;
82862306a36Sopenharmony_ci
82962306a36Sopenharmony_ci	return sprintf(buf, "%s", ubd_dev->serial);
83062306a36Sopenharmony_ci}
83162306a36Sopenharmony_ci
83262306a36Sopenharmony_cistatic DEVICE_ATTR_RO(serial);
83362306a36Sopenharmony_ci
83462306a36Sopenharmony_cistatic struct attribute *ubd_attrs[] = {
83562306a36Sopenharmony_ci	&dev_attr_serial.attr,
83662306a36Sopenharmony_ci	NULL,
83762306a36Sopenharmony_ci};
83862306a36Sopenharmony_ci
83962306a36Sopenharmony_cistatic umode_t ubd_attrs_are_visible(struct kobject *kobj,
84062306a36Sopenharmony_ci				     struct attribute *a, int n)
84162306a36Sopenharmony_ci{
84262306a36Sopenharmony_ci	return a->mode;
84362306a36Sopenharmony_ci}
84462306a36Sopenharmony_ci
84562306a36Sopenharmony_cistatic const struct attribute_group ubd_attr_group = {
84662306a36Sopenharmony_ci	.attrs = ubd_attrs,
84762306a36Sopenharmony_ci	.is_visible = ubd_attrs_are_visible,
84862306a36Sopenharmony_ci};
84962306a36Sopenharmony_ci
85062306a36Sopenharmony_cistatic const struct attribute_group *ubd_attr_groups[] = {
85162306a36Sopenharmony_ci	&ubd_attr_group,
85262306a36Sopenharmony_ci	NULL,
85362306a36Sopenharmony_ci};
85462306a36Sopenharmony_ci
85562306a36Sopenharmony_cistatic int ubd_disk_register(int major, u64 size, int unit,
85662306a36Sopenharmony_ci			     struct gendisk *disk)
85762306a36Sopenharmony_ci{
85862306a36Sopenharmony_ci	disk->major = major;
85962306a36Sopenharmony_ci	disk->first_minor = unit << UBD_SHIFT;
86062306a36Sopenharmony_ci	disk->minors = 1 << UBD_SHIFT;
86162306a36Sopenharmony_ci	disk->fops = &ubd_blops;
86262306a36Sopenharmony_ci	set_capacity(disk, size / 512);
86362306a36Sopenharmony_ci	sprintf(disk->disk_name, "ubd%c", 'a' + unit);
86462306a36Sopenharmony_ci
86562306a36Sopenharmony_ci	ubd_devs[unit].pdev.id   = unit;
86662306a36Sopenharmony_ci	ubd_devs[unit].pdev.name = DRIVER_NAME;
86762306a36Sopenharmony_ci	ubd_devs[unit].pdev.dev.release = ubd_device_release;
86862306a36Sopenharmony_ci	dev_set_drvdata(&ubd_devs[unit].pdev.dev, &ubd_devs[unit]);
86962306a36Sopenharmony_ci	platform_device_register(&ubd_devs[unit].pdev);
87062306a36Sopenharmony_ci
87162306a36Sopenharmony_ci	disk->private_data = &ubd_devs[unit];
87262306a36Sopenharmony_ci	disk->queue = ubd_devs[unit].queue;
87362306a36Sopenharmony_ci	return device_add_disk(&ubd_devs[unit].pdev.dev, disk, ubd_attr_groups);
87462306a36Sopenharmony_ci}
87562306a36Sopenharmony_ci
/*
 * Round n up to the next multiple of SECTOR_SIZE.  The argument is
 * parenthesized so that expressions with low-precedence operators
 * (e.g. ROUND_BLOCK(a | b)) are evaluated as a whole.
 */
#define ROUND_BLOCK(n) (((n) + (SECTOR_SIZE - 1)) & (-SECTOR_SIZE))
87762306a36Sopenharmony_ci
87862306a36Sopenharmony_cistatic const struct blk_mq_ops ubd_mq_ops = {
87962306a36Sopenharmony_ci	.queue_rq = ubd_queue_rq,
88062306a36Sopenharmony_ci};
88162306a36Sopenharmony_ci
88262306a36Sopenharmony_cistatic int ubd_add(int n, char **error_out)
88362306a36Sopenharmony_ci{
88462306a36Sopenharmony_ci	struct ubd *ubd_dev = &ubd_devs[n];
88562306a36Sopenharmony_ci	struct gendisk *disk;
88662306a36Sopenharmony_ci	int err = 0;
88762306a36Sopenharmony_ci
88862306a36Sopenharmony_ci	if(ubd_dev->file == NULL)
88962306a36Sopenharmony_ci		goto out;
89062306a36Sopenharmony_ci
89162306a36Sopenharmony_ci	err = ubd_file_size(ubd_dev, &ubd_dev->size);
89262306a36Sopenharmony_ci	if(err < 0){
89362306a36Sopenharmony_ci		*error_out = "Couldn't determine size of device's file";
89462306a36Sopenharmony_ci		goto out;
89562306a36Sopenharmony_ci	}
89662306a36Sopenharmony_ci
89762306a36Sopenharmony_ci	ubd_dev->size = ROUND_BLOCK(ubd_dev->size);
89862306a36Sopenharmony_ci
89962306a36Sopenharmony_ci	ubd_dev->tag_set.ops = &ubd_mq_ops;
90062306a36Sopenharmony_ci	ubd_dev->tag_set.queue_depth = 64;
90162306a36Sopenharmony_ci	ubd_dev->tag_set.numa_node = NUMA_NO_NODE;
90262306a36Sopenharmony_ci	ubd_dev->tag_set.flags = BLK_MQ_F_SHOULD_MERGE;
90362306a36Sopenharmony_ci	ubd_dev->tag_set.driver_data = ubd_dev;
90462306a36Sopenharmony_ci	ubd_dev->tag_set.nr_hw_queues = 1;
90562306a36Sopenharmony_ci
90662306a36Sopenharmony_ci	err = blk_mq_alloc_tag_set(&ubd_dev->tag_set);
90762306a36Sopenharmony_ci	if (err)
90862306a36Sopenharmony_ci		goto out;
90962306a36Sopenharmony_ci
91062306a36Sopenharmony_ci	disk = blk_mq_alloc_disk(&ubd_dev->tag_set, ubd_dev);
91162306a36Sopenharmony_ci	if (IS_ERR(disk)) {
91262306a36Sopenharmony_ci		err = PTR_ERR(disk);
91362306a36Sopenharmony_ci		goto out_cleanup_tags;
91462306a36Sopenharmony_ci	}
91562306a36Sopenharmony_ci	ubd_dev->queue = disk->queue;
91662306a36Sopenharmony_ci
91762306a36Sopenharmony_ci	blk_queue_write_cache(ubd_dev->queue, true, false);
91862306a36Sopenharmony_ci	blk_queue_max_segments(ubd_dev->queue, MAX_SG);
91962306a36Sopenharmony_ci	blk_queue_segment_boundary(ubd_dev->queue, PAGE_SIZE - 1);
92062306a36Sopenharmony_ci	err = ubd_disk_register(UBD_MAJOR, ubd_dev->size, n, disk);
92162306a36Sopenharmony_ci	if (err)
92262306a36Sopenharmony_ci		goto out_cleanup_disk;
92362306a36Sopenharmony_ci
92462306a36Sopenharmony_ci	ubd_gendisk[n] = disk;
92562306a36Sopenharmony_ci	return 0;
92662306a36Sopenharmony_ci
92762306a36Sopenharmony_ciout_cleanup_disk:
92862306a36Sopenharmony_ci	put_disk(disk);
92962306a36Sopenharmony_ciout_cleanup_tags:
93062306a36Sopenharmony_ci	blk_mq_free_tag_set(&ubd_dev->tag_set);
93162306a36Sopenharmony_ciout:
93262306a36Sopenharmony_ci	return err;
93362306a36Sopenharmony_ci}
93462306a36Sopenharmony_ci
93562306a36Sopenharmony_cistatic int ubd_config(char *str, char **error_out)
93662306a36Sopenharmony_ci{
93762306a36Sopenharmony_ci	int n, ret;
93862306a36Sopenharmony_ci
93962306a36Sopenharmony_ci	/* This string is possibly broken up and stored, so it's only
94062306a36Sopenharmony_ci	 * freed if ubd_setup_common fails, or if only general options
94162306a36Sopenharmony_ci	 * were set.
94262306a36Sopenharmony_ci	 */
94362306a36Sopenharmony_ci	str = kstrdup(str, GFP_KERNEL);
94462306a36Sopenharmony_ci	if (str == NULL) {
94562306a36Sopenharmony_ci		*error_out = "Failed to allocate memory";
94662306a36Sopenharmony_ci		return -ENOMEM;
94762306a36Sopenharmony_ci	}
94862306a36Sopenharmony_ci
94962306a36Sopenharmony_ci	ret = ubd_setup_common(str, &n, error_out);
95062306a36Sopenharmony_ci	if (ret)
95162306a36Sopenharmony_ci		goto err_free;
95262306a36Sopenharmony_ci
95362306a36Sopenharmony_ci	if (n == -1) {
95462306a36Sopenharmony_ci		ret = 0;
95562306a36Sopenharmony_ci		goto err_free;
95662306a36Sopenharmony_ci	}
95762306a36Sopenharmony_ci
95862306a36Sopenharmony_ci	mutex_lock(&ubd_lock);
95962306a36Sopenharmony_ci	ret = ubd_add(n, error_out);
96062306a36Sopenharmony_ci	if (ret)
96162306a36Sopenharmony_ci		ubd_devs[n].file = NULL;
96262306a36Sopenharmony_ci	mutex_unlock(&ubd_lock);
96362306a36Sopenharmony_ci
96462306a36Sopenharmony_ciout:
96562306a36Sopenharmony_ci	return ret;
96662306a36Sopenharmony_ci
96762306a36Sopenharmony_cierr_free:
96862306a36Sopenharmony_ci	kfree(str);
96962306a36Sopenharmony_ci	goto out;
97062306a36Sopenharmony_ci}
97162306a36Sopenharmony_ci
97262306a36Sopenharmony_cistatic int ubd_get_config(char *name, char *str, int size, char **error_out)
97362306a36Sopenharmony_ci{
97462306a36Sopenharmony_ci	struct ubd *ubd_dev;
97562306a36Sopenharmony_ci	int n, len = 0;
97662306a36Sopenharmony_ci
97762306a36Sopenharmony_ci	n = parse_unit(&name);
97862306a36Sopenharmony_ci	if((n >= MAX_DEV) || (n < 0)){
97962306a36Sopenharmony_ci		*error_out = "ubd_get_config : device number out of range";
98062306a36Sopenharmony_ci		return -1;
98162306a36Sopenharmony_ci	}
98262306a36Sopenharmony_ci
98362306a36Sopenharmony_ci	ubd_dev = &ubd_devs[n];
98462306a36Sopenharmony_ci	mutex_lock(&ubd_lock);
98562306a36Sopenharmony_ci
98662306a36Sopenharmony_ci	if(ubd_dev->file == NULL){
98762306a36Sopenharmony_ci		CONFIG_CHUNK(str, size, len, "", 1);
98862306a36Sopenharmony_ci		goto out;
98962306a36Sopenharmony_ci	}
99062306a36Sopenharmony_ci
99162306a36Sopenharmony_ci	CONFIG_CHUNK(str, size, len, ubd_dev->file, 0);
99262306a36Sopenharmony_ci
99362306a36Sopenharmony_ci	if(ubd_dev->cow.file != NULL){
99462306a36Sopenharmony_ci		CONFIG_CHUNK(str, size, len, ",", 0);
99562306a36Sopenharmony_ci		CONFIG_CHUNK(str, size, len, ubd_dev->cow.file, 1);
99662306a36Sopenharmony_ci	}
99762306a36Sopenharmony_ci	else CONFIG_CHUNK(str, size, len, "", 1);
99862306a36Sopenharmony_ci
99962306a36Sopenharmony_ci out:
100062306a36Sopenharmony_ci	mutex_unlock(&ubd_lock);
100162306a36Sopenharmony_ci	return len;
100262306a36Sopenharmony_ci}
100362306a36Sopenharmony_ci
100462306a36Sopenharmony_cistatic int ubd_id(char **str, int *start_out, int *end_out)
100562306a36Sopenharmony_ci{
100662306a36Sopenharmony_ci	int n;
100762306a36Sopenharmony_ci
100862306a36Sopenharmony_ci	n = parse_unit(str);
100962306a36Sopenharmony_ci	*start_out = 0;
101062306a36Sopenharmony_ci	*end_out = MAX_DEV - 1;
101162306a36Sopenharmony_ci	return n;
101262306a36Sopenharmony_ci}
101362306a36Sopenharmony_ci
101462306a36Sopenharmony_cistatic int ubd_remove(int n, char **error_out)
101562306a36Sopenharmony_ci{
101662306a36Sopenharmony_ci	struct gendisk *disk = ubd_gendisk[n];
101762306a36Sopenharmony_ci	struct ubd *ubd_dev;
101862306a36Sopenharmony_ci	int err = -ENODEV;
101962306a36Sopenharmony_ci
102062306a36Sopenharmony_ci	mutex_lock(&ubd_lock);
102162306a36Sopenharmony_ci
102262306a36Sopenharmony_ci	ubd_dev = &ubd_devs[n];
102362306a36Sopenharmony_ci
102462306a36Sopenharmony_ci	if(ubd_dev->file == NULL)
102562306a36Sopenharmony_ci		goto out;
102662306a36Sopenharmony_ci
102762306a36Sopenharmony_ci	/* you cannot remove a open disk */
102862306a36Sopenharmony_ci	err = -EBUSY;
102962306a36Sopenharmony_ci	if(ubd_dev->count > 0)
103062306a36Sopenharmony_ci		goto out;
103162306a36Sopenharmony_ci
103262306a36Sopenharmony_ci	ubd_gendisk[n] = NULL;
103362306a36Sopenharmony_ci	if(disk != NULL){
103462306a36Sopenharmony_ci		del_gendisk(disk);
103562306a36Sopenharmony_ci		put_disk(disk);
103662306a36Sopenharmony_ci	}
103762306a36Sopenharmony_ci
103862306a36Sopenharmony_ci	err = 0;
103962306a36Sopenharmony_ci	platform_device_unregister(&ubd_dev->pdev);
104062306a36Sopenharmony_ciout:
104162306a36Sopenharmony_ci	mutex_unlock(&ubd_lock);
104262306a36Sopenharmony_ci	return err;
104362306a36Sopenharmony_ci}
104462306a36Sopenharmony_ci
104562306a36Sopenharmony_ci/* All these are called by mconsole in process context and without
104662306a36Sopenharmony_ci * ubd-specific locks.  The structure itself is const except for .list.
104762306a36Sopenharmony_ci */
104862306a36Sopenharmony_cistatic struct mc_device ubd_mc = {
104962306a36Sopenharmony_ci	.list		= LIST_HEAD_INIT(ubd_mc.list),
105062306a36Sopenharmony_ci	.name		= "ubd",
105162306a36Sopenharmony_ci	.config		= ubd_config,
105262306a36Sopenharmony_ci	.get_config	= ubd_get_config,
105362306a36Sopenharmony_ci	.id		= ubd_id,
105462306a36Sopenharmony_ci	.remove		= ubd_remove,
105562306a36Sopenharmony_ci};
105662306a36Sopenharmony_ci
105762306a36Sopenharmony_cistatic int __init ubd_mc_init(void)
105862306a36Sopenharmony_ci{
105962306a36Sopenharmony_ci	mconsole_register_dev(&ubd_mc);
106062306a36Sopenharmony_ci	return 0;
106162306a36Sopenharmony_ci}
106262306a36Sopenharmony_ci
106362306a36Sopenharmony_ci__initcall(ubd_mc_init);
106462306a36Sopenharmony_ci
106562306a36Sopenharmony_cistatic int __init ubd0_init(void)
106662306a36Sopenharmony_ci{
106762306a36Sopenharmony_ci	struct ubd *ubd_dev = &ubd_devs[0];
106862306a36Sopenharmony_ci
106962306a36Sopenharmony_ci	mutex_lock(&ubd_lock);
107062306a36Sopenharmony_ci	if(ubd_dev->file == NULL)
107162306a36Sopenharmony_ci		ubd_dev->file = "root_fs";
107262306a36Sopenharmony_ci	mutex_unlock(&ubd_lock);
107362306a36Sopenharmony_ci
107462306a36Sopenharmony_ci	return 0;
107562306a36Sopenharmony_ci}
107662306a36Sopenharmony_ci
107762306a36Sopenharmony_ci__initcall(ubd0_init);
107862306a36Sopenharmony_ci
107962306a36Sopenharmony_ci/* Used in ubd_init, which is an initcall */
108062306a36Sopenharmony_cistatic struct platform_driver ubd_driver = {
108162306a36Sopenharmony_ci	.driver = {
108262306a36Sopenharmony_ci		.name  = DRIVER_NAME,
108362306a36Sopenharmony_ci	},
108462306a36Sopenharmony_ci};
108562306a36Sopenharmony_ci
108662306a36Sopenharmony_cistatic int __init ubd_init(void)
108762306a36Sopenharmony_ci{
108862306a36Sopenharmony_ci	char *error;
108962306a36Sopenharmony_ci	int i, err;
109062306a36Sopenharmony_ci
109162306a36Sopenharmony_ci	if (register_blkdev(UBD_MAJOR, "ubd"))
109262306a36Sopenharmony_ci		return -1;
109362306a36Sopenharmony_ci
109462306a36Sopenharmony_ci	irq_req_buffer = kmalloc_array(UBD_REQ_BUFFER_SIZE,
109562306a36Sopenharmony_ci				       sizeof(struct io_thread_req *),
109662306a36Sopenharmony_ci				       GFP_KERNEL
109762306a36Sopenharmony_ci		);
109862306a36Sopenharmony_ci	irq_remainder = 0;
109962306a36Sopenharmony_ci
110062306a36Sopenharmony_ci	if (irq_req_buffer == NULL) {
110162306a36Sopenharmony_ci		printk(KERN_ERR "Failed to initialize ubd buffering\n");
110262306a36Sopenharmony_ci		return -1;
110362306a36Sopenharmony_ci	}
110462306a36Sopenharmony_ci	io_req_buffer = kmalloc_array(UBD_REQ_BUFFER_SIZE,
110562306a36Sopenharmony_ci				      sizeof(struct io_thread_req *),
110662306a36Sopenharmony_ci				      GFP_KERNEL
110762306a36Sopenharmony_ci		);
110862306a36Sopenharmony_ci
110962306a36Sopenharmony_ci	io_remainder = 0;
111062306a36Sopenharmony_ci
111162306a36Sopenharmony_ci	if (io_req_buffer == NULL) {
111262306a36Sopenharmony_ci		printk(KERN_ERR "Failed to initialize ubd buffering\n");
111362306a36Sopenharmony_ci		return -1;
111462306a36Sopenharmony_ci	}
111562306a36Sopenharmony_ci	platform_driver_register(&ubd_driver);
111662306a36Sopenharmony_ci	mutex_lock(&ubd_lock);
111762306a36Sopenharmony_ci	for (i = 0; i < MAX_DEV; i++){
111862306a36Sopenharmony_ci		err = ubd_add(i, &error);
111962306a36Sopenharmony_ci		if(err)
112062306a36Sopenharmony_ci			printk(KERN_ERR "Failed to initialize ubd device %d :"
112162306a36Sopenharmony_ci			       "%s\n", i, error);
112262306a36Sopenharmony_ci	}
112362306a36Sopenharmony_ci	mutex_unlock(&ubd_lock);
112462306a36Sopenharmony_ci	return 0;
112562306a36Sopenharmony_ci}
112662306a36Sopenharmony_ci
112762306a36Sopenharmony_cilate_initcall(ubd_init);
112862306a36Sopenharmony_ci
112962306a36Sopenharmony_cistatic int __init ubd_driver_init(void){
113062306a36Sopenharmony_ci	unsigned long stack;
113162306a36Sopenharmony_ci	int err;
113262306a36Sopenharmony_ci
113362306a36Sopenharmony_ci	/* Set by CONFIG_BLK_DEV_UBD_SYNC or ubd=sync.*/
113462306a36Sopenharmony_ci	if(global_openflags.s){
113562306a36Sopenharmony_ci		printk(KERN_INFO "ubd: Synchronous mode\n");
113662306a36Sopenharmony_ci		/* Letting ubd=sync be like using ubd#s= instead of ubd#= is
113762306a36Sopenharmony_ci		 * enough. So use anyway the io thread. */
113862306a36Sopenharmony_ci	}
113962306a36Sopenharmony_ci	stack = alloc_stack(0, 0);
114062306a36Sopenharmony_ci	io_pid = start_io_thread(stack + PAGE_SIZE, &thread_fd);
114162306a36Sopenharmony_ci	if(io_pid < 0){
114262306a36Sopenharmony_ci		printk(KERN_ERR
114362306a36Sopenharmony_ci		       "ubd : Failed to start I/O thread (errno = %d) - "
114462306a36Sopenharmony_ci		       "falling back to synchronous I/O\n", -io_pid);
114562306a36Sopenharmony_ci		io_pid = -1;
114662306a36Sopenharmony_ci		return 0;
114762306a36Sopenharmony_ci	}
114862306a36Sopenharmony_ci	err = um_request_irq(UBD_IRQ, thread_fd, IRQ_READ, ubd_intr,
114962306a36Sopenharmony_ci			     0, "ubd", ubd_devs);
115062306a36Sopenharmony_ci	if(err < 0)
115162306a36Sopenharmony_ci		printk(KERN_ERR "um_request_irq failed - errno = %d\n", -err);
115262306a36Sopenharmony_ci	return 0;
115362306a36Sopenharmony_ci}
115462306a36Sopenharmony_ci
115562306a36Sopenharmony_cidevice_initcall(ubd_driver_init);
115662306a36Sopenharmony_ci
115762306a36Sopenharmony_cistatic int ubd_open(struct gendisk *disk, blk_mode_t mode)
115862306a36Sopenharmony_ci{
115962306a36Sopenharmony_ci	struct ubd *ubd_dev = disk->private_data;
116062306a36Sopenharmony_ci	int err = 0;
116162306a36Sopenharmony_ci
116262306a36Sopenharmony_ci	mutex_lock(&ubd_mutex);
116362306a36Sopenharmony_ci	if(ubd_dev->count == 0){
116462306a36Sopenharmony_ci		err = ubd_open_dev(ubd_dev);
116562306a36Sopenharmony_ci		if(err){
116662306a36Sopenharmony_ci			printk(KERN_ERR "%s: Can't open \"%s\": errno = %d\n",
116762306a36Sopenharmony_ci			       disk->disk_name, ubd_dev->file, -err);
116862306a36Sopenharmony_ci			goto out;
116962306a36Sopenharmony_ci		}
117062306a36Sopenharmony_ci	}
117162306a36Sopenharmony_ci	ubd_dev->count++;
117262306a36Sopenharmony_ci	set_disk_ro(disk, !ubd_dev->openflags.w);
117362306a36Sopenharmony_ciout:
117462306a36Sopenharmony_ci	mutex_unlock(&ubd_mutex);
117562306a36Sopenharmony_ci	return err;
117662306a36Sopenharmony_ci}
117762306a36Sopenharmony_ci
117862306a36Sopenharmony_cistatic void ubd_release(struct gendisk *disk)
117962306a36Sopenharmony_ci{
118062306a36Sopenharmony_ci	struct ubd *ubd_dev = disk->private_data;
118162306a36Sopenharmony_ci
118262306a36Sopenharmony_ci	mutex_lock(&ubd_mutex);
118362306a36Sopenharmony_ci	if(--ubd_dev->count == 0)
118462306a36Sopenharmony_ci		ubd_close_dev(ubd_dev);
118562306a36Sopenharmony_ci	mutex_unlock(&ubd_mutex);
118662306a36Sopenharmony_ci}
118762306a36Sopenharmony_ci
118862306a36Sopenharmony_cistatic void cowify_bitmap(__u64 io_offset, int length, unsigned long *cow_mask,
118962306a36Sopenharmony_ci			  __u64 *cow_offset, unsigned long *bitmap,
119062306a36Sopenharmony_ci			  __u64 bitmap_offset, unsigned long *bitmap_words,
119162306a36Sopenharmony_ci			  __u64 bitmap_len)
119262306a36Sopenharmony_ci{
119362306a36Sopenharmony_ci	__u64 sector = io_offset >> SECTOR_SHIFT;
119462306a36Sopenharmony_ci	int i, update_bitmap = 0;
119562306a36Sopenharmony_ci
119662306a36Sopenharmony_ci	for (i = 0; i < length >> SECTOR_SHIFT; i++) {
119762306a36Sopenharmony_ci		if(cow_mask != NULL)
119862306a36Sopenharmony_ci			ubd_set_bit(i, (unsigned char *) cow_mask);
119962306a36Sopenharmony_ci		if(ubd_test_bit(sector + i, (unsigned char *) bitmap))
120062306a36Sopenharmony_ci			continue;
120162306a36Sopenharmony_ci
120262306a36Sopenharmony_ci		update_bitmap = 1;
120362306a36Sopenharmony_ci		ubd_set_bit(sector + i, (unsigned char *) bitmap);
120462306a36Sopenharmony_ci	}
120562306a36Sopenharmony_ci
120662306a36Sopenharmony_ci	if(!update_bitmap)
120762306a36Sopenharmony_ci		return;
120862306a36Sopenharmony_ci
120962306a36Sopenharmony_ci	*cow_offset = sector / (sizeof(unsigned long) * 8);
121062306a36Sopenharmony_ci
121162306a36Sopenharmony_ci	/* This takes care of the case where we're exactly at the end of the
121262306a36Sopenharmony_ci	 * device, and *cow_offset + 1 is off the end.  So, just back it up
121362306a36Sopenharmony_ci	 * by one word.  Thanks to Lynn Kerby for the fix and James McMechan
121462306a36Sopenharmony_ci	 * for the original diagnosis.
121562306a36Sopenharmony_ci	 */
121662306a36Sopenharmony_ci	if (*cow_offset == (DIV_ROUND_UP(bitmap_len,
121762306a36Sopenharmony_ci					 sizeof(unsigned long)) - 1))
121862306a36Sopenharmony_ci		(*cow_offset)--;
121962306a36Sopenharmony_ci
122062306a36Sopenharmony_ci	bitmap_words[0] = bitmap[*cow_offset];
122162306a36Sopenharmony_ci	bitmap_words[1] = bitmap[*cow_offset + 1];
122262306a36Sopenharmony_ci
122362306a36Sopenharmony_ci	*cow_offset *= sizeof(unsigned long);
122462306a36Sopenharmony_ci	*cow_offset += bitmap_offset;
122562306a36Sopenharmony_ci}
122662306a36Sopenharmony_ci
122762306a36Sopenharmony_cistatic void cowify_req(struct io_thread_req *req, struct io_desc *segment,
122862306a36Sopenharmony_ci		       unsigned long offset, unsigned long *bitmap,
122962306a36Sopenharmony_ci		       __u64 bitmap_offset, __u64 bitmap_len)
123062306a36Sopenharmony_ci{
123162306a36Sopenharmony_ci	__u64 sector = offset >> SECTOR_SHIFT;
123262306a36Sopenharmony_ci	int i;
123362306a36Sopenharmony_ci
123462306a36Sopenharmony_ci	if (segment->length > (sizeof(segment->sector_mask) * 8) << SECTOR_SHIFT)
123562306a36Sopenharmony_ci		panic("Operation too long");
123662306a36Sopenharmony_ci
123762306a36Sopenharmony_ci	if (req_op(req->req) == REQ_OP_READ) {
123862306a36Sopenharmony_ci		for (i = 0; i < segment->length >> SECTOR_SHIFT; i++) {
123962306a36Sopenharmony_ci			if(ubd_test_bit(sector + i, (unsigned char *) bitmap))
124062306a36Sopenharmony_ci				ubd_set_bit(i, (unsigned char *)
124162306a36Sopenharmony_ci					    &segment->sector_mask);
124262306a36Sopenharmony_ci		}
124362306a36Sopenharmony_ci	} else {
124462306a36Sopenharmony_ci		cowify_bitmap(offset, segment->length, &segment->sector_mask,
124562306a36Sopenharmony_ci			      &segment->cow_offset, bitmap, bitmap_offset,
124662306a36Sopenharmony_ci			      segment->bitmap_words, bitmap_len);
124762306a36Sopenharmony_ci	}
124862306a36Sopenharmony_ci}
124962306a36Sopenharmony_ci
125062306a36Sopenharmony_cistatic void ubd_map_req(struct ubd *dev, struct io_thread_req *io_req,
125162306a36Sopenharmony_ci			struct request *req)
125262306a36Sopenharmony_ci{
125362306a36Sopenharmony_ci	struct bio_vec bvec;
125462306a36Sopenharmony_ci	struct req_iterator iter;
125562306a36Sopenharmony_ci	int i = 0;
125662306a36Sopenharmony_ci	unsigned long byte_offset = io_req->offset;
125762306a36Sopenharmony_ci	enum req_op op = req_op(req);
125862306a36Sopenharmony_ci
125962306a36Sopenharmony_ci	if (op == REQ_OP_WRITE_ZEROES || op == REQ_OP_DISCARD) {
126062306a36Sopenharmony_ci		io_req->io_desc[0].buffer = NULL;
126162306a36Sopenharmony_ci		io_req->io_desc[0].length = blk_rq_bytes(req);
126262306a36Sopenharmony_ci	} else {
126362306a36Sopenharmony_ci		rq_for_each_segment(bvec, req, iter) {
126462306a36Sopenharmony_ci			BUG_ON(i >= io_req->desc_cnt);
126562306a36Sopenharmony_ci
126662306a36Sopenharmony_ci			io_req->io_desc[i].buffer = bvec_virt(&bvec);
126762306a36Sopenharmony_ci			io_req->io_desc[i].length = bvec.bv_len;
126862306a36Sopenharmony_ci			i++;
126962306a36Sopenharmony_ci		}
127062306a36Sopenharmony_ci	}
127162306a36Sopenharmony_ci
127262306a36Sopenharmony_ci	if (dev->cow.file) {
127362306a36Sopenharmony_ci		for (i = 0; i < io_req->desc_cnt; i++) {
127462306a36Sopenharmony_ci			cowify_req(io_req, &io_req->io_desc[i], byte_offset,
127562306a36Sopenharmony_ci				   dev->cow.bitmap, dev->cow.bitmap_offset,
127662306a36Sopenharmony_ci				   dev->cow.bitmap_len);
127762306a36Sopenharmony_ci			byte_offset += io_req->io_desc[i].length;
127862306a36Sopenharmony_ci		}
127962306a36Sopenharmony_ci
128062306a36Sopenharmony_ci	}
128162306a36Sopenharmony_ci}
128262306a36Sopenharmony_ci
128362306a36Sopenharmony_cistatic struct io_thread_req *ubd_alloc_req(struct ubd *dev, struct request *req,
128462306a36Sopenharmony_ci					   int desc_cnt)
128562306a36Sopenharmony_ci{
128662306a36Sopenharmony_ci	struct io_thread_req *io_req;
128762306a36Sopenharmony_ci	int i;
128862306a36Sopenharmony_ci
128962306a36Sopenharmony_ci	io_req = kmalloc(sizeof(*io_req) +
129062306a36Sopenharmony_ci			 (desc_cnt * sizeof(struct io_desc)),
129162306a36Sopenharmony_ci			 GFP_ATOMIC);
129262306a36Sopenharmony_ci	if (!io_req)
129362306a36Sopenharmony_ci		return NULL;
129462306a36Sopenharmony_ci
129562306a36Sopenharmony_ci	io_req->req = req;
129662306a36Sopenharmony_ci	if (dev->cow.file)
129762306a36Sopenharmony_ci		io_req->fds[0] = dev->cow.fd;
129862306a36Sopenharmony_ci	else
129962306a36Sopenharmony_ci		io_req->fds[0] = dev->fd;
130062306a36Sopenharmony_ci	io_req->error = 0;
130162306a36Sopenharmony_ci	io_req->sectorsize = SECTOR_SIZE;
130262306a36Sopenharmony_ci	io_req->fds[1] = dev->fd;
130362306a36Sopenharmony_ci	io_req->offset = (u64) blk_rq_pos(req) << SECTOR_SHIFT;
130462306a36Sopenharmony_ci	io_req->offsets[0] = 0;
130562306a36Sopenharmony_ci	io_req->offsets[1] = dev->cow.data_offset;
130662306a36Sopenharmony_ci
130762306a36Sopenharmony_ci	for (i = 0 ; i < desc_cnt; i++) {
130862306a36Sopenharmony_ci		io_req->io_desc[i].sector_mask = 0;
130962306a36Sopenharmony_ci		io_req->io_desc[i].cow_offset = -1;
131062306a36Sopenharmony_ci	}
131162306a36Sopenharmony_ci
131262306a36Sopenharmony_ci	return io_req;
131362306a36Sopenharmony_ci}
131462306a36Sopenharmony_ci
131562306a36Sopenharmony_cistatic int ubd_submit_request(struct ubd *dev, struct request *req)
131662306a36Sopenharmony_ci{
131762306a36Sopenharmony_ci	int segs = 0;
131862306a36Sopenharmony_ci	struct io_thread_req *io_req;
131962306a36Sopenharmony_ci	int ret;
132062306a36Sopenharmony_ci	enum req_op op = req_op(req);
132162306a36Sopenharmony_ci
132262306a36Sopenharmony_ci	if (op == REQ_OP_FLUSH)
132362306a36Sopenharmony_ci		segs = 0;
132462306a36Sopenharmony_ci	else if (op == REQ_OP_WRITE_ZEROES || op == REQ_OP_DISCARD)
132562306a36Sopenharmony_ci		segs = 1;
132662306a36Sopenharmony_ci	else
132762306a36Sopenharmony_ci		segs = blk_rq_nr_phys_segments(req);
132862306a36Sopenharmony_ci
132962306a36Sopenharmony_ci	io_req = ubd_alloc_req(dev, req, segs);
133062306a36Sopenharmony_ci	if (!io_req)
133162306a36Sopenharmony_ci		return -ENOMEM;
133262306a36Sopenharmony_ci
133362306a36Sopenharmony_ci	io_req->desc_cnt = segs;
133462306a36Sopenharmony_ci	if (segs)
133562306a36Sopenharmony_ci		ubd_map_req(dev, io_req, req);
133662306a36Sopenharmony_ci
133762306a36Sopenharmony_ci	ret = os_write_file(thread_fd, &io_req, sizeof(io_req));
133862306a36Sopenharmony_ci	if (ret != sizeof(io_req)) {
133962306a36Sopenharmony_ci		if (ret != -EAGAIN)
134062306a36Sopenharmony_ci			pr_err("write to io thread failed: %d\n", -ret);
134162306a36Sopenharmony_ci		kfree(io_req);
134262306a36Sopenharmony_ci	}
134362306a36Sopenharmony_ci	return ret;
134462306a36Sopenharmony_ci}
134562306a36Sopenharmony_ci
134662306a36Sopenharmony_cistatic blk_status_t ubd_queue_rq(struct blk_mq_hw_ctx *hctx,
134762306a36Sopenharmony_ci				 const struct blk_mq_queue_data *bd)
134862306a36Sopenharmony_ci{
134962306a36Sopenharmony_ci	struct ubd *ubd_dev = hctx->queue->queuedata;
135062306a36Sopenharmony_ci	struct request *req = bd->rq;
135162306a36Sopenharmony_ci	int ret = 0, res = BLK_STS_OK;
135262306a36Sopenharmony_ci
135362306a36Sopenharmony_ci	blk_mq_start_request(req);
135462306a36Sopenharmony_ci
135562306a36Sopenharmony_ci	spin_lock_irq(&ubd_dev->lock);
135662306a36Sopenharmony_ci
135762306a36Sopenharmony_ci	switch (req_op(req)) {
135862306a36Sopenharmony_ci	case REQ_OP_FLUSH:
135962306a36Sopenharmony_ci	case REQ_OP_READ:
136062306a36Sopenharmony_ci	case REQ_OP_WRITE:
136162306a36Sopenharmony_ci	case REQ_OP_DISCARD:
136262306a36Sopenharmony_ci	case REQ_OP_WRITE_ZEROES:
136362306a36Sopenharmony_ci		ret = ubd_submit_request(ubd_dev, req);
136462306a36Sopenharmony_ci		break;
136562306a36Sopenharmony_ci	default:
136662306a36Sopenharmony_ci		WARN_ON_ONCE(1);
136762306a36Sopenharmony_ci		res = BLK_STS_NOTSUPP;
136862306a36Sopenharmony_ci	}
136962306a36Sopenharmony_ci
137062306a36Sopenharmony_ci	spin_unlock_irq(&ubd_dev->lock);
137162306a36Sopenharmony_ci
137262306a36Sopenharmony_ci	if (ret < 0) {
137362306a36Sopenharmony_ci		if (ret == -ENOMEM)
137462306a36Sopenharmony_ci			res = BLK_STS_RESOURCE;
137562306a36Sopenharmony_ci		else
137662306a36Sopenharmony_ci			res = BLK_STS_DEV_RESOURCE;
137762306a36Sopenharmony_ci	}
137862306a36Sopenharmony_ci
137962306a36Sopenharmony_ci	return res;
138062306a36Sopenharmony_ci}
138162306a36Sopenharmony_ci
138262306a36Sopenharmony_cistatic int ubd_getgeo(struct block_device *bdev, struct hd_geometry *geo)
138362306a36Sopenharmony_ci{
138462306a36Sopenharmony_ci	struct ubd *ubd_dev = bdev->bd_disk->private_data;
138562306a36Sopenharmony_ci
138662306a36Sopenharmony_ci	geo->heads = 128;
138762306a36Sopenharmony_ci	geo->sectors = 32;
138862306a36Sopenharmony_ci	geo->cylinders = ubd_dev->size / (128 * 32 * 512);
138962306a36Sopenharmony_ci	return 0;
139062306a36Sopenharmony_ci}
139162306a36Sopenharmony_ci
139262306a36Sopenharmony_cistatic int ubd_ioctl(struct block_device *bdev, blk_mode_t mode,
139362306a36Sopenharmony_ci		     unsigned int cmd, unsigned long arg)
139462306a36Sopenharmony_ci{
139562306a36Sopenharmony_ci	struct ubd *ubd_dev = bdev->bd_disk->private_data;
139662306a36Sopenharmony_ci	u16 ubd_id[ATA_ID_WORDS];
139762306a36Sopenharmony_ci
139862306a36Sopenharmony_ci	switch (cmd) {
139962306a36Sopenharmony_ci		struct cdrom_volctrl volume;
140062306a36Sopenharmony_ci	case HDIO_GET_IDENTITY:
140162306a36Sopenharmony_ci		memset(&ubd_id, 0, ATA_ID_WORDS * 2);
140262306a36Sopenharmony_ci		ubd_id[ATA_ID_CYLS]	= ubd_dev->size / (128 * 32 * 512);
140362306a36Sopenharmony_ci		ubd_id[ATA_ID_HEADS]	= 128;
140462306a36Sopenharmony_ci		ubd_id[ATA_ID_SECTORS]	= 32;
140562306a36Sopenharmony_ci		if(copy_to_user((char __user *) arg, (char *) &ubd_id,
140662306a36Sopenharmony_ci				 sizeof(ubd_id)))
140762306a36Sopenharmony_ci			return -EFAULT;
140862306a36Sopenharmony_ci		return 0;
140962306a36Sopenharmony_ci
141062306a36Sopenharmony_ci	case CDROMVOLREAD:
141162306a36Sopenharmony_ci		if(copy_from_user(&volume, (char __user *) arg, sizeof(volume)))
141262306a36Sopenharmony_ci			return -EFAULT;
141362306a36Sopenharmony_ci		volume.channel0 = 255;
141462306a36Sopenharmony_ci		volume.channel1 = 255;
141562306a36Sopenharmony_ci		volume.channel2 = 255;
141662306a36Sopenharmony_ci		volume.channel3 = 255;
141762306a36Sopenharmony_ci		if(copy_to_user((char __user *) arg, &volume, sizeof(volume)))
141862306a36Sopenharmony_ci			return -EFAULT;
141962306a36Sopenharmony_ci		return 0;
142062306a36Sopenharmony_ci	}
142162306a36Sopenharmony_ci	return -EINVAL;
142262306a36Sopenharmony_ci}
142362306a36Sopenharmony_ci
142462306a36Sopenharmony_cistatic int map_error(int error_code)
142562306a36Sopenharmony_ci{
142662306a36Sopenharmony_ci	switch (error_code) {
142762306a36Sopenharmony_ci	case 0:
142862306a36Sopenharmony_ci		return BLK_STS_OK;
142962306a36Sopenharmony_ci	case ENOSYS:
143062306a36Sopenharmony_ci	case EOPNOTSUPP:
143162306a36Sopenharmony_ci		return BLK_STS_NOTSUPP;
143262306a36Sopenharmony_ci	case ENOSPC:
143362306a36Sopenharmony_ci		return BLK_STS_NOSPC;
143462306a36Sopenharmony_ci	}
143562306a36Sopenharmony_ci	return BLK_STS_IOERR;
143662306a36Sopenharmony_ci}
143762306a36Sopenharmony_ci
143862306a36Sopenharmony_ci/*
143962306a36Sopenharmony_ci * Everything from here onwards *IS NOT PART OF THE KERNEL*
144062306a36Sopenharmony_ci *
144162306a36Sopenharmony_ci * The following functions are part of UML hypervisor code.
144262306a36Sopenharmony_ci * All functions from here onwards are executed as a helper
144362306a36Sopenharmony_ci * thread and are not allowed to execute any kernel functions.
144462306a36Sopenharmony_ci *
144562306a36Sopenharmony_ci * Any communication must occur strictly via shared memory and IPC.
144662306a36Sopenharmony_ci *
144762306a36Sopenharmony_ci * Do not add printks, locks, kernel memory operations, etc - it
144862306a36Sopenharmony_ci * will result in unpredictable behaviour and/or crashes.
144962306a36Sopenharmony_ci */
145062306a36Sopenharmony_ci
145162306a36Sopenharmony_cistatic int update_bitmap(struct io_thread_req *req, struct io_desc *segment)
145262306a36Sopenharmony_ci{
145362306a36Sopenharmony_ci	int n;
145462306a36Sopenharmony_ci
145562306a36Sopenharmony_ci	if (segment->cow_offset == -1)
145662306a36Sopenharmony_ci		return map_error(0);
145762306a36Sopenharmony_ci
145862306a36Sopenharmony_ci	n = os_pwrite_file(req->fds[1], &segment->bitmap_words,
145962306a36Sopenharmony_ci			  sizeof(segment->bitmap_words), segment->cow_offset);
146062306a36Sopenharmony_ci	if (n != sizeof(segment->bitmap_words))
146162306a36Sopenharmony_ci		return map_error(-n);
146262306a36Sopenharmony_ci
146362306a36Sopenharmony_ci	return map_error(0);
146462306a36Sopenharmony_ci}
146562306a36Sopenharmony_ci
146662306a36Sopenharmony_cistatic void do_io(struct io_thread_req *req, struct io_desc *desc)
146762306a36Sopenharmony_ci{
146862306a36Sopenharmony_ci	char *buf = NULL;
146962306a36Sopenharmony_ci	unsigned long len;
147062306a36Sopenharmony_ci	int n, nsectors, start, end, bit;
147162306a36Sopenharmony_ci	__u64 off;
147262306a36Sopenharmony_ci
147362306a36Sopenharmony_ci	/* FLUSH is really a special case, we cannot "case" it with others */
147462306a36Sopenharmony_ci
147562306a36Sopenharmony_ci	if (req_op(req->req) == REQ_OP_FLUSH) {
147662306a36Sopenharmony_ci		/* fds[0] is always either the rw image or our cow file */
147762306a36Sopenharmony_ci		req->error = map_error(-os_sync_file(req->fds[0]));
147862306a36Sopenharmony_ci		return;
147962306a36Sopenharmony_ci	}
148062306a36Sopenharmony_ci
148162306a36Sopenharmony_ci	nsectors = desc->length / req->sectorsize;
148262306a36Sopenharmony_ci	start = 0;
148362306a36Sopenharmony_ci	do {
148462306a36Sopenharmony_ci		bit = ubd_test_bit(start, (unsigned char *) &desc->sector_mask);
148562306a36Sopenharmony_ci		end = start;
148662306a36Sopenharmony_ci		while((end < nsectors) &&
148762306a36Sopenharmony_ci		      (ubd_test_bit(end, (unsigned char *) &desc->sector_mask) == bit))
148862306a36Sopenharmony_ci			end++;
148962306a36Sopenharmony_ci
149062306a36Sopenharmony_ci		off = req->offset + req->offsets[bit] +
149162306a36Sopenharmony_ci			start * req->sectorsize;
149262306a36Sopenharmony_ci		len = (end - start) * req->sectorsize;
149362306a36Sopenharmony_ci		if (desc->buffer != NULL)
149462306a36Sopenharmony_ci			buf = &desc->buffer[start * req->sectorsize];
149562306a36Sopenharmony_ci
149662306a36Sopenharmony_ci		switch (req_op(req->req)) {
149762306a36Sopenharmony_ci		case REQ_OP_READ:
149862306a36Sopenharmony_ci			n = 0;
149962306a36Sopenharmony_ci			do {
150062306a36Sopenharmony_ci				buf = &buf[n];
150162306a36Sopenharmony_ci				len -= n;
150262306a36Sopenharmony_ci				n = os_pread_file(req->fds[bit], buf, len, off);
150362306a36Sopenharmony_ci				if (n < 0) {
150462306a36Sopenharmony_ci					req->error = map_error(-n);
150562306a36Sopenharmony_ci					return;
150662306a36Sopenharmony_ci				}
150762306a36Sopenharmony_ci			} while((n < len) && (n != 0));
150862306a36Sopenharmony_ci			if (n < len) memset(&buf[n], 0, len - n);
150962306a36Sopenharmony_ci			break;
151062306a36Sopenharmony_ci		case REQ_OP_WRITE:
151162306a36Sopenharmony_ci			n = os_pwrite_file(req->fds[bit], buf, len, off);
151262306a36Sopenharmony_ci			if(n != len){
151362306a36Sopenharmony_ci				req->error = map_error(-n);
151462306a36Sopenharmony_ci				return;
151562306a36Sopenharmony_ci			}
151662306a36Sopenharmony_ci			break;
151762306a36Sopenharmony_ci		case REQ_OP_DISCARD:
151862306a36Sopenharmony_ci			n = os_falloc_punch(req->fds[bit], off, len);
151962306a36Sopenharmony_ci			if (n) {
152062306a36Sopenharmony_ci				req->error = map_error(-n);
152162306a36Sopenharmony_ci				return;
152262306a36Sopenharmony_ci			}
152362306a36Sopenharmony_ci			break;
152462306a36Sopenharmony_ci		case REQ_OP_WRITE_ZEROES:
152562306a36Sopenharmony_ci			n = os_falloc_zeroes(req->fds[bit], off, len);
152662306a36Sopenharmony_ci			if (n) {
152762306a36Sopenharmony_ci				req->error = map_error(-n);
152862306a36Sopenharmony_ci				return;
152962306a36Sopenharmony_ci			}
153062306a36Sopenharmony_ci			break;
153162306a36Sopenharmony_ci		default:
153262306a36Sopenharmony_ci			WARN_ON_ONCE(1);
153362306a36Sopenharmony_ci			req->error = BLK_STS_NOTSUPP;
153462306a36Sopenharmony_ci			return;
153562306a36Sopenharmony_ci		}
153662306a36Sopenharmony_ci
153762306a36Sopenharmony_ci		start = end;
153862306a36Sopenharmony_ci	} while(start < nsectors);
153962306a36Sopenharmony_ci
154062306a36Sopenharmony_ci	req->offset += len;
154162306a36Sopenharmony_ci	req->error = update_bitmap(req, desc);
154262306a36Sopenharmony_ci}
154362306a36Sopenharmony_ci
/*
 * File descriptor io_thread() reads request pointers from and writes them
 * back to once they have been processed.
 *
 * Changed in start_io_thread, which is serialized by being called only
 * from ubd_init, which is an initcall.
 */
int kernel_fd = -1;

/*
 * Incremented by io_thread() once per request it processes.
 * Only changed by the io thread. XXX: currently unused.
 */
static int io_count;
155162306a36Sopenharmony_ci
155262306a36Sopenharmony_ciint io_thread(void *arg)
155362306a36Sopenharmony_ci{
155462306a36Sopenharmony_ci	int n, count, written, res;
155562306a36Sopenharmony_ci
155662306a36Sopenharmony_ci	os_fix_helper_signals();
155762306a36Sopenharmony_ci
155862306a36Sopenharmony_ci	while(1){
155962306a36Sopenharmony_ci		n = bulk_req_safe_read(
156062306a36Sopenharmony_ci			kernel_fd,
156162306a36Sopenharmony_ci			io_req_buffer,
156262306a36Sopenharmony_ci			&io_remainder,
156362306a36Sopenharmony_ci			&io_remainder_size,
156462306a36Sopenharmony_ci			UBD_REQ_BUFFER_SIZE
156562306a36Sopenharmony_ci		);
156662306a36Sopenharmony_ci		if (n <= 0) {
156762306a36Sopenharmony_ci			if (n == -EAGAIN)
156862306a36Sopenharmony_ci				ubd_read_poll(-1);
156962306a36Sopenharmony_ci
157062306a36Sopenharmony_ci			continue;
157162306a36Sopenharmony_ci		}
157262306a36Sopenharmony_ci
157362306a36Sopenharmony_ci		for (count = 0; count < n/sizeof(struct io_thread_req *); count++) {
157462306a36Sopenharmony_ci			struct io_thread_req *req = (*io_req_buffer)[count];
157562306a36Sopenharmony_ci			int i;
157662306a36Sopenharmony_ci
157762306a36Sopenharmony_ci			io_count++;
157862306a36Sopenharmony_ci			for (i = 0; !req->error && i < req->desc_cnt; i++)
157962306a36Sopenharmony_ci				do_io(req, &(req->io_desc[i]));
158062306a36Sopenharmony_ci
158162306a36Sopenharmony_ci		}
158262306a36Sopenharmony_ci
158362306a36Sopenharmony_ci		written = 0;
158462306a36Sopenharmony_ci
158562306a36Sopenharmony_ci		do {
158662306a36Sopenharmony_ci			res = os_write_file(kernel_fd,
158762306a36Sopenharmony_ci					    ((char *) io_req_buffer) + written,
158862306a36Sopenharmony_ci					    n - written);
158962306a36Sopenharmony_ci			if (res >= 0) {
159062306a36Sopenharmony_ci				written += res;
159162306a36Sopenharmony_ci			}
159262306a36Sopenharmony_ci			if (written < n) {
159362306a36Sopenharmony_ci				ubd_write_poll(-1);
159462306a36Sopenharmony_ci			}
159562306a36Sopenharmony_ci		} while (written < n);
159662306a36Sopenharmony_ci	}
159762306a36Sopenharmony_ci
159862306a36Sopenharmony_ci	return 0;
159962306a36Sopenharmony_ci}
1600