18c2ecf20Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-or-later
28c2ecf20Sopenharmony_ci/*
38c2ecf20Sopenharmony_ci   raid0.c : Multiple Devices driver for Linux
48c2ecf20Sopenharmony_ci	     Copyright (C) 1994-96 Marc ZYNGIER
58c2ecf20Sopenharmony_ci	     <zyngier@ufr-info-p7.ibp.fr> or
68c2ecf20Sopenharmony_ci	     <maz@gloups.fdn.fr>
78c2ecf20Sopenharmony_ci	     Copyright (C) 1999, 2000 Ingo Molnar, Red Hat
88c2ecf20Sopenharmony_ci
98c2ecf20Sopenharmony_ci   RAID-0 management functions.
108c2ecf20Sopenharmony_ci
118c2ecf20Sopenharmony_ci*/
128c2ecf20Sopenharmony_ci
138c2ecf20Sopenharmony_ci#include <linux/blkdev.h>
148c2ecf20Sopenharmony_ci#include <linux/seq_file.h>
158c2ecf20Sopenharmony_ci#include <linux/module.h>
168c2ecf20Sopenharmony_ci#include <linux/slab.h>
178c2ecf20Sopenharmony_ci#include <trace/events/block.h>
188c2ecf20Sopenharmony_ci#include "md.h"
198c2ecf20Sopenharmony_ci#include "raid0.h"
208c2ecf20Sopenharmony_ci#include "raid5.h"
218c2ecf20Sopenharmony_ci
/*
 * Fallback layout selector, exposed as a module parameter (mode 0644).
 * create_strip_zones() only looks at it for arrays with more than one zone
 * whose second zone has more than one device, and only when mddev->layout
 * is neither RAID0_ORIG_LAYOUT nor RAID0_ALT_MULTIZONE_LAYOUT.  If this
 * value is not one of those two either, assembling the array is refused.
 */
static int default_layout = 0;
module_param(default_layout, int, 0644);

/*
 * Bitmask built from mddev flag bit numbers.
 * NOTE(review): presumably the set of mddev flags a RAID0 array cannot
 * carry; the code consuming this mask is not in this part of the file -
 * confirm against its user.
 */
#define UNSUPPORTED_MDDEV_FLAGS		\
	((1L << MD_HAS_JOURNAL) |	\
	 (1L << MD_JOURNAL_CLEAN) |	\
	 (1L << MD_FAILFAST_SUPPORTED) |\
	 (1L << MD_HAS_PPL) |		\
	 (1L << MD_HAS_MULTIPLE_PPLS))
318c2ecf20Sopenharmony_ci
328c2ecf20Sopenharmony_ci/*
338c2ecf20Sopenharmony_ci * inform the user of the raid configuration
348c2ecf20Sopenharmony_ci*/
358c2ecf20Sopenharmony_cistatic void dump_zones(struct mddev *mddev)
368c2ecf20Sopenharmony_ci{
378c2ecf20Sopenharmony_ci	int j, k;
388c2ecf20Sopenharmony_ci	sector_t zone_size = 0;
398c2ecf20Sopenharmony_ci	sector_t zone_start = 0;
408c2ecf20Sopenharmony_ci	char b[BDEVNAME_SIZE];
418c2ecf20Sopenharmony_ci	struct r0conf *conf = mddev->private;
428c2ecf20Sopenharmony_ci	int raid_disks = conf->strip_zone[0].nb_dev;
438c2ecf20Sopenharmony_ci	pr_debug("md: RAID0 configuration for %s - %d zone%s\n",
448c2ecf20Sopenharmony_ci		 mdname(mddev),
458c2ecf20Sopenharmony_ci		 conf->nr_strip_zones, conf->nr_strip_zones==1?"":"s");
468c2ecf20Sopenharmony_ci	for (j = 0; j < conf->nr_strip_zones; j++) {
478c2ecf20Sopenharmony_ci		char line[200];
488c2ecf20Sopenharmony_ci		int len = 0;
498c2ecf20Sopenharmony_ci
508c2ecf20Sopenharmony_ci		for (k = 0; k < conf->strip_zone[j].nb_dev; k++)
518c2ecf20Sopenharmony_ci			len += scnprintf(line+len, 200-len, "%s%s", k?"/":"",
528c2ecf20Sopenharmony_ci					bdevname(conf->devlist[j*raid_disks
538c2ecf20Sopenharmony_ci							       + k]->bdev, b));
548c2ecf20Sopenharmony_ci		pr_debug("md: zone%d=[%s]\n", j, line);
558c2ecf20Sopenharmony_ci
568c2ecf20Sopenharmony_ci		zone_size  = conf->strip_zone[j].zone_end - zone_start;
578c2ecf20Sopenharmony_ci		pr_debug("      zone-offset=%10lluKB, device-offset=%10lluKB, size=%10lluKB\n",
588c2ecf20Sopenharmony_ci			(unsigned long long)zone_start>>1,
598c2ecf20Sopenharmony_ci			(unsigned long long)conf->strip_zone[j].dev_start>>1,
608c2ecf20Sopenharmony_ci			(unsigned long long)zone_size>>1);
618c2ecf20Sopenharmony_ci		zone_start = conf->strip_zone[j].zone_end;
628c2ecf20Sopenharmony_ci	}
638c2ecf20Sopenharmony_ci}
648c2ecf20Sopenharmony_ci
/*
 * Build the RAID0 zone description for @mddev.
 *
 * Steps, in order:
 *  1. round every member's ->sectors down to a multiple of the chunk size
 *     (this modifies the rdev) and count the distinct rounded sizes; that
 *     count becomes the number of strip zones;
 *  2. check that the chunk size in bytes is a multiple of the largest
 *     logical block size among the members;
 *  3. allocate the zone array and the device table (one row of
 *     mddev->raid_disks pointers per zone);
 *  4. fill zone 0 with every member, indexed by its raid_disk slot;
 *  5. fill each further zone with the members that extend beyond the
 *     previous zone's smallest member;
 *  6. choose the layout and, for RAID0_ORIG_LAYOUT, compute disk_shift
 *     for every zone after the first.
 *
 * On success returns 0 and stores the new conf in *@private_conf.
 * On failure everything allocated here is freed, *@private_conf is set to
 * ERR_PTR(err) and the negative errno (-ENOMEM, -EINVAL or -EOPNOTSUPP)
 * is returned.
 */
static int create_strip_zones(struct mddev *mddev, struct r0conf **private_conf)
{
	int i, c, err;
	sector_t curr_zone_end, sectors;
	struct md_rdev *smallest, *rdev1, *rdev2, *rdev, **dev;
	struct strip_zone *zone;
	int cnt;
	char b[BDEVNAME_SIZE];
	char b2[BDEVNAME_SIZE];
	struct r0conf *conf = kzalloc(sizeof(*conf), GFP_KERNEL);
	unsigned blksize = 512;

	*private_conf = ERR_PTR(-ENOMEM);
	if (!conf)
		return -ENOMEM;
	rdev_for_each(rdev1, mddev) {
		pr_debug("md/raid0:%s: looking at %s\n",
			 mdname(mddev),
			 bdevname(rdev1->bdev, b));
		/* c becomes 1 if an earlier member has the same rounded size */
		c = 0;

		/* round size to chunk_size */
		sectors = rdev1->sectors;
		sector_div(sectors, mddev->chunk_sectors);
		rdev1->sectors = sectors * mddev->chunk_sectors;

		/* track the largest logical block size of all members */
		blksize = max(blksize, queue_logical_block_size(
				      rdev1->bdev->bd_disk->queue));

		/*
		 * Compare only against members that precede rdev1 in the
		 * list; those have already been rounded above.
		 */
		rdev_for_each(rdev2, mddev) {
			pr_debug("md/raid0:%s:   comparing %s(%llu)"
				 " with %s(%llu)\n",
				 mdname(mddev),
				 bdevname(rdev1->bdev,b),
				 (unsigned long long)rdev1->sectors,
				 bdevname(rdev2->bdev,b2),
				 (unsigned long long)rdev2->sectors);
			if (rdev2 == rdev1) {
				pr_debug("md/raid0:%s:   END\n",
					 mdname(mddev));
				break;
			}
			if (rdev2->sectors == rdev1->sectors) {
				/*
				 * Not unique, don't count it as a new
				 * group
				 */
				pr_debug("md/raid0:%s:   EQUAL\n",
					 mdname(mddev));
				c = 1;
				break;
			}
			pr_debug("md/raid0:%s:   NOT EQUAL\n",
				 mdname(mddev));
		}
		if (!c) {
			/* first member seen with this size: one more zone */
			pr_debug("md/raid0:%s:   ==> UNIQUE\n",
				 mdname(mddev));
			conf->nr_strip_zones++;
			pr_debug("md/raid0:%s: %d zones\n",
				 mdname(mddev), conf->nr_strip_zones);
		}
	}
	pr_debug("md/raid0:%s: FINAL %d zones\n",
		 mdname(mddev), conf->nr_strip_zones);

	/*
	 * now since we have the hard sector sizes, we can make sure
	 * chunk size is a multiple of that sector size
	 */
	if ((mddev->chunk_sectors << 9) % blksize) {
		pr_warn("md/raid0:%s: chunk_size of %d not multiple of block size %d\n",
			mdname(mddev),
			mddev->chunk_sectors << 9, blksize);
		err = -EINVAL;
		goto abort;
	}

	err = -ENOMEM;
	conf->strip_zone = kcalloc(conf->nr_strip_zones,
				   sizeof(struct strip_zone),
				   GFP_KERNEL);
	if (!conf->strip_zone)
		goto abort;
	/* zero-filled table: nr_strip_zones rows of raid_disks pointers */
	conf->devlist = kzalloc(array3_size(sizeof(struct md_rdev *),
					    conf->nr_strip_zones,
					    mddev->raid_disks),
				GFP_KERNEL);
	if (!conf->devlist)
		goto abort;

	/* The first zone must contain all devices, so here we check that
	 * there is a proper alignment of slots to devices and find them all
	 */
	zone = &conf->strip_zone[0];
	cnt = 0;
	smallest = NULL;
	dev = conf->devlist;
	/* every failure from here until the layout check is -EINVAL */
	err = -EINVAL;
	rdev_for_each(rdev1, mddev) {
		int j = rdev1->raid_disk;

		if (mddev->level == 10) {
			/* taking over a raid10-n2 array */
			j /= 2;
			rdev1->new_raid_disk = j;
		}

		if (mddev->level == 1) {
			/* taking over a raid1 array-
			 * we have only one active disk
			 */
			j = 0;
			rdev1->new_raid_disk = j;
		}

		if (j < 0) {
			pr_warn("md/raid0:%s: remove inactive devices before converting to RAID0\n",
				mdname(mddev));
			goto abort;
		}
		if (j >= mddev->raid_disks) {
			pr_warn("md/raid0:%s: bad disk number %d - aborting!\n",
				mdname(mddev), j);
			goto abort;
		}
		/* the table starts zeroed, so non-NULL means the slot is taken */
		if (dev[j]) {
			pr_warn("md/raid0:%s: multiple devices for %d - aborting!\n",
				mdname(mddev), j);
			goto abort;
		}
		dev[j] = rdev1;

		if (!smallest || (rdev1->sectors < smallest->sectors))
			smallest = rdev1;
		cnt++;
	}
	if (cnt != mddev->raid_disks) {
		pr_warn("md/raid0:%s: too few disks (%d of %d) - aborting!\n",
			mdname(mddev), cnt, mddev->raid_disks);
		goto abort;
	}
	/* zone 0 spans all members up to the size of the smallest one */
	zone->nb_dev = cnt;
	zone->zone_end = smallest->sectors * cnt;

	curr_zone_end = zone->zone_end;

	/* now do the other zones */
	for (i = 1; i < conf->nr_strip_zones; i++)
	{
		int j;

		zone = conf->strip_zone + i;
		dev = conf->devlist + i * mddev->raid_disks;

		pr_debug("md/raid0:%s: zone %d\n", mdname(mddev), i);
		/* this zone starts where the previous zone's smallest member ends */
		zone->dev_start = smallest->sectors;
		smallest = NULL;
		c = 0;

		/* walk zone 0's row, i.e. all members in slot order */
		for (j=0; j<cnt; j++) {
			rdev = conf->devlist[j];
			if (rdev->sectors <= zone->dev_start) {
				pr_debug("md/raid0:%s: checking %s ... nope\n",
					 mdname(mddev),
					 bdevname(rdev->bdev, b));
				continue;
			}
			pr_debug("md/raid0:%s: checking %s ..."
				 " contained as device %d\n",
				 mdname(mddev),
				 bdevname(rdev->bdev, b), c);
			/* members of this zone are packed at the front of its row */
			dev[c] = rdev;
			c++;
			if (!smallest || rdev->sectors < smallest->sectors) {
				smallest = rdev;
				pr_debug("md/raid0:%s:  (%llu) is smallest!.\n",
					 mdname(mddev),
					 (unsigned long long)rdev->sectors);
			}
		}

		zone->nb_dev = c;
		/* zone capacity: per-member extent times the member count */
		sectors = (smallest->sectors - zone->dev_start) * c;
		pr_debug("md/raid0:%s: zone->nb_dev: %d, sectors: %llu\n",
			 mdname(mddev),
			 zone->nb_dev, (unsigned long long)sectors);

		curr_zone_end += sectors;
		zone->zone_end = curr_zone_end;

		pr_debug("md/raid0:%s: current zone start: %llu\n",
			 mdname(mddev),
			 (unsigned long long)smallest->sectors);
	}

	/*
	 * Layout selection: a single zone, or a second zone with only one
	 * device, always uses RAID0_ORIG_LAYOUT; otherwise a valid
	 * mddev->layout wins, then a valid default_layout module parameter,
	 * and failing both the array is refused.
	 */
	if (conf->nr_strip_zones == 1 || conf->strip_zone[1].nb_dev == 1) {
		conf->layout = RAID0_ORIG_LAYOUT;
	} else if (mddev->layout == RAID0_ORIG_LAYOUT ||
		   mddev->layout == RAID0_ALT_MULTIZONE_LAYOUT) {
		conf->layout = mddev->layout;
	} else if (default_layout == RAID0_ORIG_LAYOUT ||
		   default_layout == RAID0_ALT_MULTIZONE_LAYOUT) {
		conf->layout = default_layout;
	} else {
		pr_err("md/raid0:%s: cannot assemble multi-zone RAID0 with default_layout setting\n",
		       mdname(mddev));
		pr_err("md/raid0: please set raid0.default_layout to 1 or 2\n");
		err = -EOPNOTSUPP;
		goto abort;
	}

	if (conf->layout == RAID0_ORIG_LAYOUT) {
		for (i = 1; i < conf->nr_strip_zones; i++) {
			sector_t first_sector = conf->strip_zone[i-1].zone_end;

			/* turn the zone's first array sector into a chunk number */
			sector_div(first_sector, mddev->chunk_sectors);
			zone = conf->strip_zone + i;
			/* disk_shift is first disk index used in the zone */
			zone->disk_shift = sector_div(first_sector,
						      zone->nb_dev);
		}
	}

	pr_debug("md/raid0:%s: done.\n", mdname(mddev));
	*private_conf = conf;

	return 0;
abort:
	/* kfree(NULL) is a no-op, so partially built confs are fine here */
	kfree(conf->strip_zone);
	kfree(conf->devlist);
	kfree(conf);
	*private_conf = ERR_PTR(err);
	return err;
}
3008c2ecf20Sopenharmony_ci
3018c2ecf20Sopenharmony_ci/* Find the zone which holds a particular offset
3028c2ecf20Sopenharmony_ci * Update *sectorp to be an offset in that zone
3038c2ecf20Sopenharmony_ci */
3048c2ecf20Sopenharmony_cistatic struct strip_zone *find_zone(struct r0conf *conf,
3058c2ecf20Sopenharmony_ci				    sector_t *sectorp)
3068c2ecf20Sopenharmony_ci{
3078c2ecf20Sopenharmony_ci	int i;
3088c2ecf20Sopenharmony_ci	struct strip_zone *z = conf->strip_zone;
3098c2ecf20Sopenharmony_ci	sector_t sector = *sectorp;
3108c2ecf20Sopenharmony_ci
3118c2ecf20Sopenharmony_ci	for (i = 0; i < conf->nr_strip_zones; i++)
3128c2ecf20Sopenharmony_ci		if (sector < z[i].zone_end) {
3138c2ecf20Sopenharmony_ci			if (i)
3148c2ecf20Sopenharmony_ci				*sectorp = sector - z[i-1].zone_end;
3158c2ecf20Sopenharmony_ci			return z + i;
3168c2ecf20Sopenharmony_ci		}
3178c2ecf20Sopenharmony_ci	BUG();
3188c2ecf20Sopenharmony_ci}
3198c2ecf20Sopenharmony_ci
3208c2ecf20Sopenharmony_ci/*
3218c2ecf20Sopenharmony_ci * remaps the bio to the target device. we separate two flows.
3228c2ecf20Sopenharmony_ci * power 2 flow and a general flow for the sake of performance
3238c2ecf20Sopenharmony_ci*/
3248c2ecf20Sopenharmony_cistatic struct md_rdev *map_sector(struct mddev *mddev, struct strip_zone *zone,
3258c2ecf20Sopenharmony_ci				sector_t sector, sector_t *sector_offset)
3268c2ecf20Sopenharmony_ci{
3278c2ecf20Sopenharmony_ci	unsigned int sect_in_chunk;
3288c2ecf20Sopenharmony_ci	sector_t chunk;
3298c2ecf20Sopenharmony_ci	struct r0conf *conf = mddev->private;
3308c2ecf20Sopenharmony_ci	int raid_disks = conf->strip_zone[0].nb_dev;
3318c2ecf20Sopenharmony_ci	unsigned int chunk_sects = mddev->chunk_sectors;
3328c2ecf20Sopenharmony_ci
3338c2ecf20Sopenharmony_ci	if (is_power_of_2(chunk_sects)) {
3348c2ecf20Sopenharmony_ci		int chunksect_bits = ffz(~chunk_sects);
3358c2ecf20Sopenharmony_ci		/* find the sector offset inside the chunk */
3368c2ecf20Sopenharmony_ci		sect_in_chunk  = sector & (chunk_sects - 1);
3378c2ecf20Sopenharmony_ci		sector >>= chunksect_bits;
3388c2ecf20Sopenharmony_ci		/* chunk in zone */
3398c2ecf20Sopenharmony_ci		chunk = *sector_offset;
3408c2ecf20Sopenharmony_ci		/* quotient is the chunk in real device*/
3418c2ecf20Sopenharmony_ci		sector_div(chunk, zone->nb_dev << chunksect_bits);
3428c2ecf20Sopenharmony_ci	} else{
3438c2ecf20Sopenharmony_ci		sect_in_chunk = sector_div(sector, chunk_sects);
3448c2ecf20Sopenharmony_ci		chunk = *sector_offset;
3458c2ecf20Sopenharmony_ci		sector_div(chunk, chunk_sects * zone->nb_dev);
3468c2ecf20Sopenharmony_ci	}
3478c2ecf20Sopenharmony_ci	/*
3488c2ecf20Sopenharmony_ci	*  position the bio over the real device
3498c2ecf20Sopenharmony_ci	*  real sector = chunk in device + starting of zone
3508c2ecf20Sopenharmony_ci	*	+ the position in the chunk
3518c2ecf20Sopenharmony_ci	*/
3528c2ecf20Sopenharmony_ci	*sector_offset = (chunk * chunk_sects) + sect_in_chunk;
3538c2ecf20Sopenharmony_ci	return conf->devlist[(zone - conf->strip_zone)*raid_disks
3548c2ecf20Sopenharmony_ci			     + sector_div(sector, zone->nb_dev)];
3558c2ecf20Sopenharmony_ci}
3568c2ecf20Sopenharmony_ci
3578c2ecf20Sopenharmony_cistatic sector_t raid0_size(struct mddev *mddev, sector_t sectors, int raid_disks)
3588c2ecf20Sopenharmony_ci{
3598c2ecf20Sopenharmony_ci	sector_t array_sectors = 0;
3608c2ecf20Sopenharmony_ci	struct md_rdev *rdev;
3618c2ecf20Sopenharmony_ci
3628c2ecf20Sopenharmony_ci	WARN_ONCE(sectors || raid_disks,
3638c2ecf20Sopenharmony_ci		  "%s does not support generic reshape\n", __func__);
3648c2ecf20Sopenharmony_ci
3658c2ecf20Sopenharmony_ci	rdev_for_each(rdev, mddev)
3668c2ecf20Sopenharmony_ci		array_sectors += (rdev->sectors &
3678c2ecf20Sopenharmony_ci				  ~(sector_t)(mddev->chunk_sectors-1));
3688c2ecf20Sopenharmony_ci
3698c2ecf20Sopenharmony_ci	return array_sectors;
3708c2ecf20Sopenharmony_ci}
3718c2ecf20Sopenharmony_ci
3728c2ecf20Sopenharmony_cistatic void raid0_free(struct mddev *mddev, void *priv);
3738c2ecf20Sopenharmony_ci
3748c2ecf20Sopenharmony_cistatic int raid0_run(struct mddev *mddev)
3758c2ecf20Sopenharmony_ci{
3768c2ecf20Sopenharmony_ci	struct r0conf *conf;
3778c2ecf20Sopenharmony_ci	int ret;
3788c2ecf20Sopenharmony_ci
3798c2ecf20Sopenharmony_ci	if (mddev->chunk_sectors == 0) {
3808c2ecf20Sopenharmony_ci		pr_warn("md/raid0:%s: chunk size must be set.\n", mdname(mddev));
3818c2ecf20Sopenharmony_ci		return -EINVAL;
3828c2ecf20Sopenharmony_ci	}
3838c2ecf20Sopenharmony_ci	if (md_check_no_bitmap(mddev))
3848c2ecf20Sopenharmony_ci		return -EINVAL;
3858c2ecf20Sopenharmony_ci
3868c2ecf20Sopenharmony_ci	/* if private is not null, we are here after takeover */
3878c2ecf20Sopenharmony_ci	if (mddev->private == NULL) {
3888c2ecf20Sopenharmony_ci		ret = create_strip_zones(mddev, &conf);
3898c2ecf20Sopenharmony_ci		if (ret < 0)
3908c2ecf20Sopenharmony_ci			return ret;
3918c2ecf20Sopenharmony_ci		mddev->private = conf;
3928c2ecf20Sopenharmony_ci	}
3938c2ecf20Sopenharmony_ci	conf = mddev->private;
3948c2ecf20Sopenharmony_ci	if (mddev->queue) {
3958c2ecf20Sopenharmony_ci		struct md_rdev *rdev;
3968c2ecf20Sopenharmony_ci		bool discard_supported = false;
3978c2ecf20Sopenharmony_ci
3988c2ecf20Sopenharmony_ci		blk_queue_max_hw_sectors(mddev->queue, mddev->chunk_sectors);
3998c2ecf20Sopenharmony_ci		blk_queue_max_write_same_sectors(mddev->queue, mddev->chunk_sectors);
4008c2ecf20Sopenharmony_ci		blk_queue_max_write_zeroes_sectors(mddev->queue, mddev->chunk_sectors);
4018c2ecf20Sopenharmony_ci		blk_queue_max_discard_sectors(mddev->queue, UINT_MAX);
4028c2ecf20Sopenharmony_ci
4038c2ecf20Sopenharmony_ci		blk_queue_io_min(mddev->queue, mddev->chunk_sectors << 9);
4048c2ecf20Sopenharmony_ci		blk_queue_io_opt(mddev->queue,
4058c2ecf20Sopenharmony_ci				 (mddev->chunk_sectors << 9) * mddev->raid_disks);
4068c2ecf20Sopenharmony_ci
4078c2ecf20Sopenharmony_ci		rdev_for_each(rdev, mddev) {
4088c2ecf20Sopenharmony_ci			disk_stack_limits(mddev->gendisk, rdev->bdev,
4098c2ecf20Sopenharmony_ci					  rdev->data_offset << 9);
4108c2ecf20Sopenharmony_ci			if (blk_queue_discard(bdev_get_queue(rdev->bdev)))
4118c2ecf20Sopenharmony_ci				discard_supported = true;
4128c2ecf20Sopenharmony_ci		}
4138c2ecf20Sopenharmony_ci		if (!discard_supported)
4148c2ecf20Sopenharmony_ci			blk_queue_flag_clear(QUEUE_FLAG_DISCARD, mddev->queue);
4158c2ecf20Sopenharmony_ci		else
4168c2ecf20Sopenharmony_ci			blk_queue_flag_set(QUEUE_FLAG_DISCARD, mddev->queue);
4178c2ecf20Sopenharmony_ci	}
4188c2ecf20Sopenharmony_ci
4198c2ecf20Sopenharmony_ci	/* calculate array device size */
4208c2ecf20Sopenharmony_ci	md_set_array_sectors(mddev, raid0_size(mddev, 0, 0));
4218c2ecf20Sopenharmony_ci
4228c2ecf20Sopenharmony_ci	pr_debug("md/raid0:%s: md_size is %llu sectors.\n",
4238c2ecf20Sopenharmony_ci		 mdname(mddev),
4248c2ecf20Sopenharmony_ci		 (unsigned long long)mddev->array_sectors);
4258c2ecf20Sopenharmony_ci
4268c2ecf20Sopenharmony_ci	dump_zones(mddev);
4278c2ecf20Sopenharmony_ci
4288c2ecf20Sopenharmony_ci	ret = md_integrity_register(mddev);
4298c2ecf20Sopenharmony_ci
4308c2ecf20Sopenharmony_ci	return ret;
4318c2ecf20Sopenharmony_ci}
4328c2ecf20Sopenharmony_ci
4338c2ecf20Sopenharmony_cistatic void raid0_free(struct mddev *mddev, void *priv)
4348c2ecf20Sopenharmony_ci{
4358c2ecf20Sopenharmony_ci	struct r0conf *conf = priv;
4368c2ecf20Sopenharmony_ci
4378c2ecf20Sopenharmony_ci	kfree(conf->strip_zone);
4388c2ecf20Sopenharmony_ci	kfree(conf->devlist);
4398c2ecf20Sopenharmony_ci	kfree(conf);
4408c2ecf20Sopenharmony_ci}
4418c2ecf20Sopenharmony_ci
/*
 * Translate a disk index into its position in the read/write order of a
 * zone whose first chunk lands on disk @disk_shift.
 *
 * Example with 4 disks and disk_shift 3: the disks are accessed in the
 * order 3, 0, 1, 2, so indices 0,1,2,3 map to positions 1,2,3,0.
 * Comparing positions instead of raw indices tells which disk comes
 * earlier in that access order.
 */
static int map_disk_shift(int disk_index, int num_disks, int disk_shift)
{
	/* adding num_disks first keeps the value non-negative before the modulo */
	int rotated = disk_index + num_disks - disk_shift;

	return rotated % num_disks;
}
4558c2ecf20Sopenharmony_ci
/*
 * Handle a discard request by turning it into one discard per member
 * device of the zone it starts in.
 *
 * A bio that extends past the end of its zone is split at the zone
 * boundary; the tail is resubmitted and only the front part is handled
 * here.  For every member the range [dev_start, dev_end) of sectors
 * (relative to the zone's start on the device) covered by the request is
 * computed, and a discard for that range is issued and chained to @bio.
 */
static void raid0_handle_discard(struct mddev *mddev, struct bio *bio)
{
	struct r0conf *conf = mddev->private;
	struct strip_zone *zone;
	sector_t start = bio->bi_iter.bi_sector;
	sector_t end;
	unsigned int stripe_size;
	sector_t first_stripe_index, last_stripe_index;
	sector_t start_disk_offset;
	unsigned int start_disk_index;
	sector_t end_disk_offset;
	unsigned int end_disk_index;
	unsigned int disk;
	sector_t orig_start, orig_end;

	/* keep the array-relative start; find_zone() may rewrite 'start' */
	orig_start = start;
	zone = find_zone(conf, &start);

	if (bio_end_sector(bio) > zone->zone_end) {
		/* split at the zone end; the remainder goes back to the queue */
		struct bio *split = bio_split(bio,
			zone->zone_end - bio->bi_iter.bi_sector, GFP_NOIO,
			&mddev->bio_set);
		bio_chain(split, bio);
		submit_bio_noacct(bio);
		bio = split;
		end = zone->zone_end;
	} else
		end = bio_end_sector(bio);

	/* keep the array-relative end, then make 'end' zone-relative */
	orig_end = end;
	if (zone != conf->strip_zone)
		end = end - zone[-1].zone_end;

	/* Now start and end is the offset in zone */
	stripe_size = zone->nb_dev * mddev->chunk_sectors;

	/* sector_div() divides in place: these become stripe numbers */
	first_stripe_index = start;
	sector_div(first_stripe_index, stripe_size);
	last_stripe_index = end;
	sector_div(last_stripe_index, stripe_size);

	/* In the first zone the original and alternate layouts are the same */
	if ((conf->layout == RAID0_ORIG_LAYOUT) && (zone != conf->strip_zone)) {
		/*
		 * Disk index comes from the array-relative chunk number
		 * modulo the zone width, then is converted to its position
		 * in the zone's access order.
		 */
		sector_div(orig_start, mddev->chunk_sectors);
		start_disk_index = sector_div(orig_start, zone->nb_dev);
		start_disk_index = map_disk_shift(start_disk_index,
						  zone->nb_dev,
						  zone->disk_shift);
		sector_div(orig_end, mddev->chunk_sectors);
		end_disk_index = sector_div(orig_end, zone->nb_dev);
		end_disk_index = map_disk_shift(end_disk_index,
						zone->nb_dev, zone->disk_shift);
	} else {
		/* disk index is the chunk position inside the stripe */
		start_disk_index = (int)(start - first_stripe_index * stripe_size) /
			mddev->chunk_sectors;
		end_disk_index = (int)(end - last_stripe_index * stripe_size) /
			mddev->chunk_sectors;
	}
	/* offset inside the chunk plus the whole stripes before it */
	start_disk_offset = ((int)(start - first_stripe_index * stripe_size) %
		mddev->chunk_sectors) +
		first_stripe_index * mddev->chunk_sectors;
	end_disk_offset = ((int)(end - last_stripe_index * stripe_size) %
		mddev->chunk_sectors) +
		last_stripe_index * mddev->chunk_sectors;

	for (disk = 0; disk < zone->nb_dev; disk++) {
		sector_t dev_start, dev_end;
		struct bio *discard_bio = NULL;
		struct md_rdev *rdev;
		int compare_disk;

		/* compare in access-order space, matching the indexes above */
		compare_disk = map_disk_shift(disk, zone->nb_dev,
					      zone->disk_shift);

		/*
		 * A disk before the start disk begins at the next stripe,
		 * one after it begins at the first stripe, and the start
		 * disk itself begins at the exact offset.
		 */
		if (compare_disk < start_disk_index)
			dev_start = (first_stripe_index + 1) *
				mddev->chunk_sectors;
		else if (compare_disk > start_disk_index)
			dev_start = first_stripe_index * mddev->chunk_sectors;
		else
			dev_start = start_disk_offset;

		/* same reasoning for where the range ends on this disk */
		if (compare_disk < end_disk_index)
			dev_end = (last_stripe_index + 1) * mddev->chunk_sectors;
		else if (compare_disk > end_disk_index)
			dev_end = last_stripe_index * mddev->chunk_sectors;
		else
			dev_end = end_disk_offset;

		/* nothing to discard on this disk */
		if (dev_end <= dev_start)
			continue;

		/* devlist rows are as wide as the first zone */
		rdev = conf->devlist[(zone - conf->strip_zone) *
			conf->strip_zone[0].nb_dev + disk];
		/* skip this disk if no discard bio could be built */
		if (__blkdev_issue_discard(rdev->bdev,
			dev_start + zone->dev_start + rdev->data_offset,
			dev_end - dev_start, GFP_NOIO, 0, &discard_bio) ||
		    !discard_bio)
			continue;
		bio_chain(discard_bio, bio);
		bio_clone_blkg_association(discard_bio, bio);
		if (mddev->gendisk)
			trace_block_bio_remap(bdev_get_queue(rdev->bdev),
				discard_bio, disk_devt(mddev->gendisk),
				bio->bi_iter.bi_sector);
		submit_bio_noacct(discard_bio);
	}
	/*
	 * NOTE(review): presumably the chained discards keep @bio from
	 * completing until they have all finished - confirm against
	 * bio_chain() semantics.
	 */
	bio_endio(bio);
}
5658c2ecf20Sopenharmony_ci
5668c2ecf20Sopenharmony_cistatic bool raid0_make_request(struct mddev *mddev, struct bio *bio)
5678c2ecf20Sopenharmony_ci{
5688c2ecf20Sopenharmony_ci	struct r0conf *conf = mddev->private;
5698c2ecf20Sopenharmony_ci	struct strip_zone *zone;
5708c2ecf20Sopenharmony_ci	struct md_rdev *tmp_dev;
5718c2ecf20Sopenharmony_ci	sector_t bio_sector;
5728c2ecf20Sopenharmony_ci	sector_t sector;
5738c2ecf20Sopenharmony_ci	sector_t orig_sector;
5748c2ecf20Sopenharmony_ci	unsigned chunk_sects;
5758c2ecf20Sopenharmony_ci	unsigned sectors;
5768c2ecf20Sopenharmony_ci
5778c2ecf20Sopenharmony_ci	if (unlikely(bio->bi_opf & REQ_PREFLUSH)
5788c2ecf20Sopenharmony_ci	    && md_flush_request(mddev, bio))
5798c2ecf20Sopenharmony_ci		return true;
5808c2ecf20Sopenharmony_ci
5818c2ecf20Sopenharmony_ci	if (unlikely((bio_op(bio) == REQ_OP_DISCARD))) {
5828c2ecf20Sopenharmony_ci		raid0_handle_discard(mddev, bio);
5838c2ecf20Sopenharmony_ci		return true;
5848c2ecf20Sopenharmony_ci	}
5858c2ecf20Sopenharmony_ci
5868c2ecf20Sopenharmony_ci	bio_sector = bio->bi_iter.bi_sector;
5878c2ecf20Sopenharmony_ci	sector = bio_sector;
5888c2ecf20Sopenharmony_ci	chunk_sects = mddev->chunk_sectors;
5898c2ecf20Sopenharmony_ci
5908c2ecf20Sopenharmony_ci	sectors = chunk_sects -
5918c2ecf20Sopenharmony_ci		(likely(is_power_of_2(chunk_sects))
5928c2ecf20Sopenharmony_ci		 ? (sector & (chunk_sects-1))
5938c2ecf20Sopenharmony_ci		 : sector_div(sector, chunk_sects));
5948c2ecf20Sopenharmony_ci
5958c2ecf20Sopenharmony_ci	/* Restore due to sector_div */
5968c2ecf20Sopenharmony_ci	sector = bio_sector;
5978c2ecf20Sopenharmony_ci
5988c2ecf20Sopenharmony_ci	if (sectors < bio_sectors(bio)) {
5998c2ecf20Sopenharmony_ci		struct bio *split = bio_split(bio, sectors, GFP_NOIO,
6008c2ecf20Sopenharmony_ci					      &mddev->bio_set);
6018c2ecf20Sopenharmony_ci		bio_chain(split, bio);
6028c2ecf20Sopenharmony_ci		submit_bio_noacct(bio);
6038c2ecf20Sopenharmony_ci		bio = split;
6048c2ecf20Sopenharmony_ci	}
6058c2ecf20Sopenharmony_ci
6068c2ecf20Sopenharmony_ci	orig_sector = sector;
6078c2ecf20Sopenharmony_ci	zone = find_zone(mddev->private, &sector);
6088c2ecf20Sopenharmony_ci	switch (conf->layout) {
6098c2ecf20Sopenharmony_ci	case RAID0_ORIG_LAYOUT:
6108c2ecf20Sopenharmony_ci		tmp_dev = map_sector(mddev, zone, orig_sector, &sector);
6118c2ecf20Sopenharmony_ci		break;
6128c2ecf20Sopenharmony_ci	case RAID0_ALT_MULTIZONE_LAYOUT:
6138c2ecf20Sopenharmony_ci		tmp_dev = map_sector(mddev, zone, sector, &sector);
6148c2ecf20Sopenharmony_ci		break;
6158c2ecf20Sopenharmony_ci	default:
6168c2ecf20Sopenharmony_ci		WARN(1, "md/raid0:%s: Invalid layout\n", mdname(mddev));
6178c2ecf20Sopenharmony_ci		bio_io_error(bio);
6188c2ecf20Sopenharmony_ci		return true;
6198c2ecf20Sopenharmony_ci	}
6208c2ecf20Sopenharmony_ci
6218c2ecf20Sopenharmony_ci	if (unlikely(is_mddev_broken(tmp_dev, "raid0"))) {
6228c2ecf20Sopenharmony_ci		bio_io_error(bio);
6238c2ecf20Sopenharmony_ci		return true;
6248c2ecf20Sopenharmony_ci	}
6258c2ecf20Sopenharmony_ci
6268c2ecf20Sopenharmony_ci	bio_set_dev(bio, tmp_dev->bdev);
6278c2ecf20Sopenharmony_ci	bio->bi_iter.bi_sector = sector + zone->dev_start +
6288c2ecf20Sopenharmony_ci		tmp_dev->data_offset;
6298c2ecf20Sopenharmony_ci
6308c2ecf20Sopenharmony_ci	if (mddev->gendisk)
6318c2ecf20Sopenharmony_ci		trace_block_bio_remap(bio->bi_disk->queue, bio,
6328c2ecf20Sopenharmony_ci				disk_devt(mddev->gendisk), bio_sector);
6338c2ecf20Sopenharmony_ci	mddev_check_writesame(mddev, bio);
6348c2ecf20Sopenharmony_ci	mddev_check_write_zeroes(mddev, bio);
6358c2ecf20Sopenharmony_ci	submit_bio_noacct(bio);
6368c2ecf20Sopenharmony_ci	return true;
6378c2ecf20Sopenharmony_ci}
6388c2ecf20Sopenharmony_ci
6398c2ecf20Sopenharmony_cistatic void raid0_status(struct seq_file *seq, struct mddev *mddev)
6408c2ecf20Sopenharmony_ci{
6418c2ecf20Sopenharmony_ci	seq_printf(seq, " %dk chunks", mddev->chunk_sectors / 2);
6428c2ecf20Sopenharmony_ci	return;
6438c2ecf20Sopenharmony_ci}
6448c2ecf20Sopenharmony_ci
6458c2ecf20Sopenharmony_cistatic void *raid0_takeover_raid45(struct mddev *mddev)
6468c2ecf20Sopenharmony_ci{
6478c2ecf20Sopenharmony_ci	struct md_rdev *rdev;
6488c2ecf20Sopenharmony_ci	struct r0conf *priv_conf;
6498c2ecf20Sopenharmony_ci
6508c2ecf20Sopenharmony_ci	if (mddev->degraded != 1) {
6518c2ecf20Sopenharmony_ci		pr_warn("md/raid0:%s: raid5 must be degraded! Degraded disks: %d\n",
6528c2ecf20Sopenharmony_ci			mdname(mddev),
6538c2ecf20Sopenharmony_ci			mddev->degraded);
6548c2ecf20Sopenharmony_ci		return ERR_PTR(-EINVAL);
6558c2ecf20Sopenharmony_ci	}
6568c2ecf20Sopenharmony_ci
6578c2ecf20Sopenharmony_ci	rdev_for_each(rdev, mddev) {
6588c2ecf20Sopenharmony_ci		/* check slot number for a disk */
6598c2ecf20Sopenharmony_ci		if (rdev->raid_disk == mddev->raid_disks-1) {
6608c2ecf20Sopenharmony_ci			pr_warn("md/raid0:%s: raid5 must have missing parity disk!\n",
6618c2ecf20Sopenharmony_ci				mdname(mddev));
6628c2ecf20Sopenharmony_ci			return ERR_PTR(-EINVAL);
6638c2ecf20Sopenharmony_ci		}
6648c2ecf20Sopenharmony_ci		rdev->sectors = mddev->dev_sectors;
6658c2ecf20Sopenharmony_ci	}
6668c2ecf20Sopenharmony_ci
6678c2ecf20Sopenharmony_ci	/* Set new parameters */
6688c2ecf20Sopenharmony_ci	mddev->new_level = 0;
6698c2ecf20Sopenharmony_ci	mddev->new_layout = 0;
6708c2ecf20Sopenharmony_ci	mddev->new_chunk_sectors = mddev->chunk_sectors;
6718c2ecf20Sopenharmony_ci	mddev->raid_disks--;
6728c2ecf20Sopenharmony_ci	mddev->delta_disks = -1;
6738c2ecf20Sopenharmony_ci	/* make sure it will be not marked as dirty */
6748c2ecf20Sopenharmony_ci	mddev->recovery_cp = MaxSector;
6758c2ecf20Sopenharmony_ci	mddev_clear_unsupported_flags(mddev, UNSUPPORTED_MDDEV_FLAGS);
6768c2ecf20Sopenharmony_ci
6778c2ecf20Sopenharmony_ci	create_strip_zones(mddev, &priv_conf);
6788c2ecf20Sopenharmony_ci
6798c2ecf20Sopenharmony_ci	return priv_conf;
6808c2ecf20Sopenharmony_ci}
6818c2ecf20Sopenharmony_ci
6828c2ecf20Sopenharmony_cistatic void *raid0_takeover_raid10(struct mddev *mddev)
6838c2ecf20Sopenharmony_ci{
6848c2ecf20Sopenharmony_ci	struct r0conf *priv_conf;
6858c2ecf20Sopenharmony_ci
6868c2ecf20Sopenharmony_ci	/* Check layout:
6878c2ecf20Sopenharmony_ci	 *  - far_copies must be 1
6888c2ecf20Sopenharmony_ci	 *  - near_copies must be 2
6898c2ecf20Sopenharmony_ci	 *  - disks number must be even
6908c2ecf20Sopenharmony_ci	 *  - all mirrors must be already degraded
6918c2ecf20Sopenharmony_ci	 */
6928c2ecf20Sopenharmony_ci	if (mddev->layout != ((1 << 8) + 2)) {
6938c2ecf20Sopenharmony_ci		pr_warn("md/raid0:%s:: Raid0 cannot takeover layout: 0x%x\n",
6948c2ecf20Sopenharmony_ci			mdname(mddev),
6958c2ecf20Sopenharmony_ci			mddev->layout);
6968c2ecf20Sopenharmony_ci		return ERR_PTR(-EINVAL);
6978c2ecf20Sopenharmony_ci	}
6988c2ecf20Sopenharmony_ci	if (mddev->raid_disks & 1) {
6998c2ecf20Sopenharmony_ci		pr_warn("md/raid0:%s: Raid0 cannot takeover Raid10 with odd disk number.\n",
7008c2ecf20Sopenharmony_ci			mdname(mddev));
7018c2ecf20Sopenharmony_ci		return ERR_PTR(-EINVAL);
7028c2ecf20Sopenharmony_ci	}
7038c2ecf20Sopenharmony_ci	if (mddev->degraded != (mddev->raid_disks>>1)) {
7048c2ecf20Sopenharmony_ci		pr_warn("md/raid0:%s: All mirrors must be already degraded!\n",
7058c2ecf20Sopenharmony_ci			mdname(mddev));
7068c2ecf20Sopenharmony_ci		return ERR_PTR(-EINVAL);
7078c2ecf20Sopenharmony_ci	}
7088c2ecf20Sopenharmony_ci
7098c2ecf20Sopenharmony_ci	/* Set new parameters */
7108c2ecf20Sopenharmony_ci	mddev->new_level = 0;
7118c2ecf20Sopenharmony_ci	mddev->new_layout = 0;
7128c2ecf20Sopenharmony_ci	mddev->new_chunk_sectors = mddev->chunk_sectors;
7138c2ecf20Sopenharmony_ci	mddev->delta_disks = - mddev->raid_disks / 2;
7148c2ecf20Sopenharmony_ci	mddev->raid_disks += mddev->delta_disks;
7158c2ecf20Sopenharmony_ci	mddev->degraded = 0;
7168c2ecf20Sopenharmony_ci	/* make sure it will be not marked as dirty */
7178c2ecf20Sopenharmony_ci	mddev->recovery_cp = MaxSector;
7188c2ecf20Sopenharmony_ci	mddev_clear_unsupported_flags(mddev, UNSUPPORTED_MDDEV_FLAGS);
7198c2ecf20Sopenharmony_ci
7208c2ecf20Sopenharmony_ci	create_strip_zones(mddev, &priv_conf);
7218c2ecf20Sopenharmony_ci	return priv_conf;
7228c2ecf20Sopenharmony_ci}
7238c2ecf20Sopenharmony_ci
7248c2ecf20Sopenharmony_cistatic void *raid0_takeover_raid1(struct mddev *mddev)
7258c2ecf20Sopenharmony_ci{
7268c2ecf20Sopenharmony_ci	struct r0conf *priv_conf;
7278c2ecf20Sopenharmony_ci	int chunksect;
7288c2ecf20Sopenharmony_ci
7298c2ecf20Sopenharmony_ci	/* Check layout:
7308c2ecf20Sopenharmony_ci	 *  - (N - 1) mirror drives must be already faulty
7318c2ecf20Sopenharmony_ci	 */
7328c2ecf20Sopenharmony_ci	if ((mddev->raid_disks - 1) != mddev->degraded) {
7338c2ecf20Sopenharmony_ci		pr_err("md/raid0:%s: (N - 1) mirrors drives must be already faulty!\n",
7348c2ecf20Sopenharmony_ci		       mdname(mddev));
7358c2ecf20Sopenharmony_ci		return ERR_PTR(-EINVAL);
7368c2ecf20Sopenharmony_ci	}
7378c2ecf20Sopenharmony_ci
7388c2ecf20Sopenharmony_ci	/*
7398c2ecf20Sopenharmony_ci	 * a raid1 doesn't have the notion of chunk size, so
7408c2ecf20Sopenharmony_ci	 * figure out the largest suitable size we can use.
7418c2ecf20Sopenharmony_ci	 */
7428c2ecf20Sopenharmony_ci	chunksect = 64 * 2; /* 64K by default */
7438c2ecf20Sopenharmony_ci
7448c2ecf20Sopenharmony_ci	/* The array must be an exact multiple of chunksize */
7458c2ecf20Sopenharmony_ci	while (chunksect && (mddev->array_sectors & (chunksect - 1)))
7468c2ecf20Sopenharmony_ci		chunksect >>= 1;
7478c2ecf20Sopenharmony_ci
7488c2ecf20Sopenharmony_ci	if ((chunksect << 9) < PAGE_SIZE)
7498c2ecf20Sopenharmony_ci		/* array size does not allow a suitable chunk size */
7508c2ecf20Sopenharmony_ci		return ERR_PTR(-EINVAL);
7518c2ecf20Sopenharmony_ci
7528c2ecf20Sopenharmony_ci	/* Set new parameters */
7538c2ecf20Sopenharmony_ci	mddev->new_level = 0;
7548c2ecf20Sopenharmony_ci	mddev->new_layout = 0;
7558c2ecf20Sopenharmony_ci	mddev->new_chunk_sectors = chunksect;
7568c2ecf20Sopenharmony_ci	mddev->chunk_sectors = chunksect;
7578c2ecf20Sopenharmony_ci	mddev->delta_disks = 1 - mddev->raid_disks;
7588c2ecf20Sopenharmony_ci	mddev->raid_disks = 1;
7598c2ecf20Sopenharmony_ci	/* make sure it will be not marked as dirty */
7608c2ecf20Sopenharmony_ci	mddev->recovery_cp = MaxSector;
7618c2ecf20Sopenharmony_ci	mddev_clear_unsupported_flags(mddev, UNSUPPORTED_MDDEV_FLAGS);
7628c2ecf20Sopenharmony_ci
7638c2ecf20Sopenharmony_ci	create_strip_zones(mddev, &priv_conf);
7648c2ecf20Sopenharmony_ci	return priv_conf;
7658c2ecf20Sopenharmony_ci}
7668c2ecf20Sopenharmony_ci
7678c2ecf20Sopenharmony_cistatic void *raid0_takeover(struct mddev *mddev)
7688c2ecf20Sopenharmony_ci{
7698c2ecf20Sopenharmony_ci	/* raid0 can take over:
7708c2ecf20Sopenharmony_ci	 *  raid4 - if all data disks are active.
7718c2ecf20Sopenharmony_ci	 *  raid5 - providing it is Raid4 layout and one disk is faulty
7728c2ecf20Sopenharmony_ci	 *  raid10 - assuming we have all necessary active disks
7738c2ecf20Sopenharmony_ci	 *  raid1 - with (N -1) mirror drives faulty
7748c2ecf20Sopenharmony_ci	 */
7758c2ecf20Sopenharmony_ci
7768c2ecf20Sopenharmony_ci	if (mddev->bitmap) {
7778c2ecf20Sopenharmony_ci		pr_warn("md/raid0: %s: cannot takeover array with bitmap\n",
7788c2ecf20Sopenharmony_ci			mdname(mddev));
7798c2ecf20Sopenharmony_ci		return ERR_PTR(-EBUSY);
7808c2ecf20Sopenharmony_ci	}
7818c2ecf20Sopenharmony_ci	if (mddev->level == 4)
7828c2ecf20Sopenharmony_ci		return raid0_takeover_raid45(mddev);
7838c2ecf20Sopenharmony_ci
7848c2ecf20Sopenharmony_ci	if (mddev->level == 5) {
7858c2ecf20Sopenharmony_ci		if (mddev->layout == ALGORITHM_PARITY_N)
7868c2ecf20Sopenharmony_ci			return raid0_takeover_raid45(mddev);
7878c2ecf20Sopenharmony_ci
7888c2ecf20Sopenharmony_ci		pr_warn("md/raid0:%s: Raid can only takeover Raid5 with layout: %d\n",
7898c2ecf20Sopenharmony_ci			mdname(mddev), ALGORITHM_PARITY_N);
7908c2ecf20Sopenharmony_ci	}
7918c2ecf20Sopenharmony_ci
7928c2ecf20Sopenharmony_ci	if (mddev->level == 10)
7938c2ecf20Sopenharmony_ci		return raid0_takeover_raid10(mddev);
7948c2ecf20Sopenharmony_ci
7958c2ecf20Sopenharmony_ci	if (mddev->level == 1)
7968c2ecf20Sopenharmony_ci		return raid0_takeover_raid1(mddev);
7978c2ecf20Sopenharmony_ci
7988c2ecf20Sopenharmony_ci	pr_warn("Takeover from raid%i to raid0 not supported\n",
7998c2ecf20Sopenharmony_ci		mddev->level);
8008c2ecf20Sopenharmony_ci
8018c2ecf20Sopenharmony_ci	return ERR_PTR(-EINVAL);
8028c2ecf20Sopenharmony_ci}
8038c2ecf20Sopenharmony_ci
/*
 * raid0_quiesce - quiesce callback for the raid0 personality.
 * @mddev:   array being quiesced or resumed (unused)
 * @quiesce: requested state (unused)
 *
 * Intentionally empty: this personality performs no work here.
 */
static void raid0_quiesce(struct mddev *mddev, int quiesce)
{
	/* nothing to do */
}
8078c2ecf20Sopenharmony_ci
8088c2ecf20Sopenharmony_cistatic struct md_personality raid0_personality=
8098c2ecf20Sopenharmony_ci{
8108c2ecf20Sopenharmony_ci	.name		= "raid0",
8118c2ecf20Sopenharmony_ci	.level		= 0,
8128c2ecf20Sopenharmony_ci	.owner		= THIS_MODULE,
8138c2ecf20Sopenharmony_ci	.make_request	= raid0_make_request,
8148c2ecf20Sopenharmony_ci	.run		= raid0_run,
8158c2ecf20Sopenharmony_ci	.free		= raid0_free,
8168c2ecf20Sopenharmony_ci	.status		= raid0_status,
8178c2ecf20Sopenharmony_ci	.size		= raid0_size,
8188c2ecf20Sopenharmony_ci	.takeover	= raid0_takeover,
8198c2ecf20Sopenharmony_ci	.quiesce	= raid0_quiesce,
8208c2ecf20Sopenharmony_ci};
8218c2ecf20Sopenharmony_ci
8228c2ecf20Sopenharmony_cistatic int __init raid0_init (void)
8238c2ecf20Sopenharmony_ci{
8248c2ecf20Sopenharmony_ci	return register_md_personality (&raid0_personality);
8258c2ecf20Sopenharmony_ci}
8268c2ecf20Sopenharmony_ci
8278c2ecf20Sopenharmony_cistatic void raid0_exit (void)
8288c2ecf20Sopenharmony_ci{
8298c2ecf20Sopenharmony_ci	unregister_md_personality (&raid0_personality);
8308c2ecf20Sopenharmony_ci}
8318c2ecf20Sopenharmony_ci
8328c2ecf20Sopenharmony_cimodule_init(raid0_init);
8338c2ecf20Sopenharmony_cimodule_exit(raid0_exit);
8348c2ecf20Sopenharmony_ciMODULE_LICENSE("GPL");
8358c2ecf20Sopenharmony_ciMODULE_DESCRIPTION("RAID0 (striping) personality for MD");
8368c2ecf20Sopenharmony_ciMODULE_ALIAS("md-personality-2"); /* RAID0 */
8378c2ecf20Sopenharmony_ciMODULE_ALIAS("md-raid0");
8388c2ecf20Sopenharmony_ciMODULE_ALIAS("md-level-0");
839