xref: /OK3568_Linux_fs/kernel/drivers/md/raid0.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-or-later
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun    raid0.c : Multiple Devices driver for Linux
4*4882a593Smuzhiyun 	     Copyright (C) 1994-96 Marc ZYNGIER
5*4882a593Smuzhiyun 	     <zyngier@ufr-info-p7.ibp.fr> or
6*4882a593Smuzhiyun 	     <maz@gloups.fdn.fr>
7*4882a593Smuzhiyun 	     Copyright (C) 1999, 2000 Ingo Molnar, Red Hat
8*4882a593Smuzhiyun 
9*4882a593Smuzhiyun    RAID-0 management functions.
10*4882a593Smuzhiyun 
11*4882a593Smuzhiyun */
12*4882a593Smuzhiyun 
13*4882a593Smuzhiyun #include <linux/blkdev.h>
14*4882a593Smuzhiyun #include <linux/seq_file.h>
15*4882a593Smuzhiyun #include <linux/module.h>
16*4882a593Smuzhiyun #include <linux/slab.h>
17*4882a593Smuzhiyun #include <trace/events/block.h>
18*4882a593Smuzhiyun #include "md.h"
19*4882a593Smuzhiyun #include "raid0.h"
20*4882a593Smuzhiyun #include "raid5.h"
21*4882a593Smuzhiyun 
22*4882a593Smuzhiyun static int default_layout = 0;
23*4882a593Smuzhiyun module_param(default_layout, int, 0644);
24*4882a593Smuzhiyun 
/*
 * mddev flag bits that the takeover paths in this file hand to
 * mddev_clear_unsupported_flags() when an array is converted to raid0.
 */
#define UNSUPPORTED_MDDEV_FLAGS			\
	((1L << MD_HAS_JOURNAL)		|	\
	 (1L << MD_JOURNAL_CLEAN)	|	\
	 (1L << MD_FAILFAST_SUPPORTED)	|	\
	 (1L << MD_HAS_PPL)		|	\
	 (1L << MD_HAS_MULTIPLE_PPLS))
31*4882a593Smuzhiyun 
32*4882a593Smuzhiyun /*
33*4882a593Smuzhiyun  * inform the user of the raid configuration
34*4882a593Smuzhiyun */
dump_zones(struct mddev * mddev)35*4882a593Smuzhiyun static void dump_zones(struct mddev *mddev)
36*4882a593Smuzhiyun {
37*4882a593Smuzhiyun 	int j, k;
38*4882a593Smuzhiyun 	sector_t zone_size = 0;
39*4882a593Smuzhiyun 	sector_t zone_start = 0;
40*4882a593Smuzhiyun 	char b[BDEVNAME_SIZE];
41*4882a593Smuzhiyun 	struct r0conf *conf = mddev->private;
42*4882a593Smuzhiyun 	int raid_disks = conf->strip_zone[0].nb_dev;
43*4882a593Smuzhiyun 	pr_debug("md: RAID0 configuration for %s - %d zone%s\n",
44*4882a593Smuzhiyun 		 mdname(mddev),
45*4882a593Smuzhiyun 		 conf->nr_strip_zones, conf->nr_strip_zones==1?"":"s");
46*4882a593Smuzhiyun 	for (j = 0; j < conf->nr_strip_zones; j++) {
47*4882a593Smuzhiyun 		char line[200];
48*4882a593Smuzhiyun 		int len = 0;
49*4882a593Smuzhiyun 
50*4882a593Smuzhiyun 		for (k = 0; k < conf->strip_zone[j].nb_dev; k++)
51*4882a593Smuzhiyun 			len += scnprintf(line+len, 200-len, "%s%s", k?"/":"",
52*4882a593Smuzhiyun 					bdevname(conf->devlist[j*raid_disks
53*4882a593Smuzhiyun 							       + k]->bdev, b));
54*4882a593Smuzhiyun 		pr_debug("md: zone%d=[%s]\n", j, line);
55*4882a593Smuzhiyun 
56*4882a593Smuzhiyun 		zone_size  = conf->strip_zone[j].zone_end - zone_start;
57*4882a593Smuzhiyun 		pr_debug("      zone-offset=%10lluKB, device-offset=%10lluKB, size=%10lluKB\n",
58*4882a593Smuzhiyun 			(unsigned long long)zone_start>>1,
59*4882a593Smuzhiyun 			(unsigned long long)conf->strip_zone[j].dev_start>>1,
60*4882a593Smuzhiyun 			(unsigned long long)zone_size>>1);
61*4882a593Smuzhiyun 		zone_start = conf->strip_zone[j].zone_end;
62*4882a593Smuzhiyun 	}
63*4882a593Smuzhiyun }
64*4882a593Smuzhiyun 
create_strip_zones(struct mddev * mddev,struct r0conf ** private_conf)65*4882a593Smuzhiyun static int create_strip_zones(struct mddev *mddev, struct r0conf **private_conf)
66*4882a593Smuzhiyun {
67*4882a593Smuzhiyun 	int i, c, err;
68*4882a593Smuzhiyun 	sector_t curr_zone_end, sectors;
69*4882a593Smuzhiyun 	struct md_rdev *smallest, *rdev1, *rdev2, *rdev, **dev;
70*4882a593Smuzhiyun 	struct strip_zone *zone;
71*4882a593Smuzhiyun 	int cnt;
72*4882a593Smuzhiyun 	char b[BDEVNAME_SIZE];
73*4882a593Smuzhiyun 	char b2[BDEVNAME_SIZE];
74*4882a593Smuzhiyun 	struct r0conf *conf = kzalloc(sizeof(*conf), GFP_KERNEL);
75*4882a593Smuzhiyun 	unsigned blksize = 512;
76*4882a593Smuzhiyun 
77*4882a593Smuzhiyun 	*private_conf = ERR_PTR(-ENOMEM);
78*4882a593Smuzhiyun 	if (!conf)
79*4882a593Smuzhiyun 		return -ENOMEM;
80*4882a593Smuzhiyun 	rdev_for_each(rdev1, mddev) {
81*4882a593Smuzhiyun 		pr_debug("md/raid0:%s: looking at %s\n",
82*4882a593Smuzhiyun 			 mdname(mddev),
83*4882a593Smuzhiyun 			 bdevname(rdev1->bdev, b));
84*4882a593Smuzhiyun 		c = 0;
85*4882a593Smuzhiyun 
86*4882a593Smuzhiyun 		/* round size to chunk_size */
87*4882a593Smuzhiyun 		sectors = rdev1->sectors;
88*4882a593Smuzhiyun 		sector_div(sectors, mddev->chunk_sectors);
89*4882a593Smuzhiyun 		rdev1->sectors = sectors * mddev->chunk_sectors;
90*4882a593Smuzhiyun 
91*4882a593Smuzhiyun 		blksize = max(blksize, queue_logical_block_size(
92*4882a593Smuzhiyun 				      rdev1->bdev->bd_disk->queue));
93*4882a593Smuzhiyun 
94*4882a593Smuzhiyun 		rdev_for_each(rdev2, mddev) {
95*4882a593Smuzhiyun 			pr_debug("md/raid0:%s:   comparing %s(%llu)"
96*4882a593Smuzhiyun 				 " with %s(%llu)\n",
97*4882a593Smuzhiyun 				 mdname(mddev),
98*4882a593Smuzhiyun 				 bdevname(rdev1->bdev,b),
99*4882a593Smuzhiyun 				 (unsigned long long)rdev1->sectors,
100*4882a593Smuzhiyun 				 bdevname(rdev2->bdev,b2),
101*4882a593Smuzhiyun 				 (unsigned long long)rdev2->sectors);
102*4882a593Smuzhiyun 			if (rdev2 == rdev1) {
103*4882a593Smuzhiyun 				pr_debug("md/raid0:%s:   END\n",
104*4882a593Smuzhiyun 					 mdname(mddev));
105*4882a593Smuzhiyun 				break;
106*4882a593Smuzhiyun 			}
107*4882a593Smuzhiyun 			if (rdev2->sectors == rdev1->sectors) {
108*4882a593Smuzhiyun 				/*
109*4882a593Smuzhiyun 				 * Not unique, don't count it as a new
110*4882a593Smuzhiyun 				 * group
111*4882a593Smuzhiyun 				 */
112*4882a593Smuzhiyun 				pr_debug("md/raid0:%s:   EQUAL\n",
113*4882a593Smuzhiyun 					 mdname(mddev));
114*4882a593Smuzhiyun 				c = 1;
115*4882a593Smuzhiyun 				break;
116*4882a593Smuzhiyun 			}
117*4882a593Smuzhiyun 			pr_debug("md/raid0:%s:   NOT EQUAL\n",
118*4882a593Smuzhiyun 				 mdname(mddev));
119*4882a593Smuzhiyun 		}
120*4882a593Smuzhiyun 		if (!c) {
121*4882a593Smuzhiyun 			pr_debug("md/raid0:%s:   ==> UNIQUE\n",
122*4882a593Smuzhiyun 				 mdname(mddev));
123*4882a593Smuzhiyun 			conf->nr_strip_zones++;
124*4882a593Smuzhiyun 			pr_debug("md/raid0:%s: %d zones\n",
125*4882a593Smuzhiyun 				 mdname(mddev), conf->nr_strip_zones);
126*4882a593Smuzhiyun 		}
127*4882a593Smuzhiyun 	}
128*4882a593Smuzhiyun 	pr_debug("md/raid0:%s: FINAL %d zones\n",
129*4882a593Smuzhiyun 		 mdname(mddev), conf->nr_strip_zones);
130*4882a593Smuzhiyun 
131*4882a593Smuzhiyun 	/*
132*4882a593Smuzhiyun 	 * now since we have the hard sector sizes, we can make sure
133*4882a593Smuzhiyun 	 * chunk size is a multiple of that sector size
134*4882a593Smuzhiyun 	 */
135*4882a593Smuzhiyun 	if ((mddev->chunk_sectors << 9) % blksize) {
136*4882a593Smuzhiyun 		pr_warn("md/raid0:%s: chunk_size of %d not multiple of block size %d\n",
137*4882a593Smuzhiyun 			mdname(mddev),
138*4882a593Smuzhiyun 			mddev->chunk_sectors << 9, blksize);
139*4882a593Smuzhiyun 		err = -EINVAL;
140*4882a593Smuzhiyun 		goto abort;
141*4882a593Smuzhiyun 	}
142*4882a593Smuzhiyun 
143*4882a593Smuzhiyun 	err = -ENOMEM;
144*4882a593Smuzhiyun 	conf->strip_zone = kcalloc(conf->nr_strip_zones,
145*4882a593Smuzhiyun 				   sizeof(struct strip_zone),
146*4882a593Smuzhiyun 				   GFP_KERNEL);
147*4882a593Smuzhiyun 	if (!conf->strip_zone)
148*4882a593Smuzhiyun 		goto abort;
149*4882a593Smuzhiyun 	conf->devlist = kzalloc(array3_size(sizeof(struct md_rdev *),
150*4882a593Smuzhiyun 					    conf->nr_strip_zones,
151*4882a593Smuzhiyun 					    mddev->raid_disks),
152*4882a593Smuzhiyun 				GFP_KERNEL);
153*4882a593Smuzhiyun 	if (!conf->devlist)
154*4882a593Smuzhiyun 		goto abort;
155*4882a593Smuzhiyun 
156*4882a593Smuzhiyun 	/* The first zone must contain all devices, so here we check that
157*4882a593Smuzhiyun 	 * there is a proper alignment of slots to devices and find them all
158*4882a593Smuzhiyun 	 */
159*4882a593Smuzhiyun 	zone = &conf->strip_zone[0];
160*4882a593Smuzhiyun 	cnt = 0;
161*4882a593Smuzhiyun 	smallest = NULL;
162*4882a593Smuzhiyun 	dev = conf->devlist;
163*4882a593Smuzhiyun 	err = -EINVAL;
164*4882a593Smuzhiyun 	rdev_for_each(rdev1, mddev) {
165*4882a593Smuzhiyun 		int j = rdev1->raid_disk;
166*4882a593Smuzhiyun 
167*4882a593Smuzhiyun 		if (mddev->level == 10) {
168*4882a593Smuzhiyun 			/* taking over a raid10-n2 array */
169*4882a593Smuzhiyun 			j /= 2;
170*4882a593Smuzhiyun 			rdev1->new_raid_disk = j;
171*4882a593Smuzhiyun 		}
172*4882a593Smuzhiyun 
173*4882a593Smuzhiyun 		if (mddev->level == 1) {
174*4882a593Smuzhiyun 			/* taiking over a raid1 array-
175*4882a593Smuzhiyun 			 * we have only one active disk
176*4882a593Smuzhiyun 			 */
177*4882a593Smuzhiyun 			j = 0;
178*4882a593Smuzhiyun 			rdev1->new_raid_disk = j;
179*4882a593Smuzhiyun 		}
180*4882a593Smuzhiyun 
181*4882a593Smuzhiyun 		if (j < 0) {
182*4882a593Smuzhiyun 			pr_warn("md/raid0:%s: remove inactive devices before converting to RAID0\n",
183*4882a593Smuzhiyun 				mdname(mddev));
184*4882a593Smuzhiyun 			goto abort;
185*4882a593Smuzhiyun 		}
186*4882a593Smuzhiyun 		if (j >= mddev->raid_disks) {
187*4882a593Smuzhiyun 			pr_warn("md/raid0:%s: bad disk number %d - aborting!\n",
188*4882a593Smuzhiyun 				mdname(mddev), j);
189*4882a593Smuzhiyun 			goto abort;
190*4882a593Smuzhiyun 		}
191*4882a593Smuzhiyun 		if (dev[j]) {
192*4882a593Smuzhiyun 			pr_warn("md/raid0:%s: multiple devices for %d - aborting!\n",
193*4882a593Smuzhiyun 				mdname(mddev), j);
194*4882a593Smuzhiyun 			goto abort;
195*4882a593Smuzhiyun 		}
196*4882a593Smuzhiyun 		dev[j] = rdev1;
197*4882a593Smuzhiyun 
198*4882a593Smuzhiyun 		if (!smallest || (rdev1->sectors < smallest->sectors))
199*4882a593Smuzhiyun 			smallest = rdev1;
200*4882a593Smuzhiyun 		cnt++;
201*4882a593Smuzhiyun 	}
202*4882a593Smuzhiyun 	if (cnt != mddev->raid_disks) {
203*4882a593Smuzhiyun 		pr_warn("md/raid0:%s: too few disks (%d of %d) - aborting!\n",
204*4882a593Smuzhiyun 			mdname(mddev), cnt, mddev->raid_disks);
205*4882a593Smuzhiyun 		goto abort;
206*4882a593Smuzhiyun 	}
207*4882a593Smuzhiyun 	zone->nb_dev = cnt;
208*4882a593Smuzhiyun 	zone->zone_end = smallest->sectors * cnt;
209*4882a593Smuzhiyun 
210*4882a593Smuzhiyun 	curr_zone_end = zone->zone_end;
211*4882a593Smuzhiyun 
212*4882a593Smuzhiyun 	/* now do the other zones */
213*4882a593Smuzhiyun 	for (i = 1; i < conf->nr_strip_zones; i++)
214*4882a593Smuzhiyun 	{
215*4882a593Smuzhiyun 		int j;
216*4882a593Smuzhiyun 
217*4882a593Smuzhiyun 		zone = conf->strip_zone + i;
218*4882a593Smuzhiyun 		dev = conf->devlist + i * mddev->raid_disks;
219*4882a593Smuzhiyun 
220*4882a593Smuzhiyun 		pr_debug("md/raid0:%s: zone %d\n", mdname(mddev), i);
221*4882a593Smuzhiyun 		zone->dev_start = smallest->sectors;
222*4882a593Smuzhiyun 		smallest = NULL;
223*4882a593Smuzhiyun 		c = 0;
224*4882a593Smuzhiyun 
225*4882a593Smuzhiyun 		for (j=0; j<cnt; j++) {
226*4882a593Smuzhiyun 			rdev = conf->devlist[j];
227*4882a593Smuzhiyun 			if (rdev->sectors <= zone->dev_start) {
228*4882a593Smuzhiyun 				pr_debug("md/raid0:%s: checking %s ... nope\n",
229*4882a593Smuzhiyun 					 mdname(mddev),
230*4882a593Smuzhiyun 					 bdevname(rdev->bdev, b));
231*4882a593Smuzhiyun 				continue;
232*4882a593Smuzhiyun 			}
233*4882a593Smuzhiyun 			pr_debug("md/raid0:%s: checking %s ..."
234*4882a593Smuzhiyun 				 " contained as device %d\n",
235*4882a593Smuzhiyun 				 mdname(mddev),
236*4882a593Smuzhiyun 				 bdevname(rdev->bdev, b), c);
237*4882a593Smuzhiyun 			dev[c] = rdev;
238*4882a593Smuzhiyun 			c++;
239*4882a593Smuzhiyun 			if (!smallest || rdev->sectors < smallest->sectors) {
240*4882a593Smuzhiyun 				smallest = rdev;
241*4882a593Smuzhiyun 				pr_debug("md/raid0:%s:  (%llu) is smallest!.\n",
242*4882a593Smuzhiyun 					 mdname(mddev),
243*4882a593Smuzhiyun 					 (unsigned long long)rdev->sectors);
244*4882a593Smuzhiyun 			}
245*4882a593Smuzhiyun 		}
246*4882a593Smuzhiyun 
247*4882a593Smuzhiyun 		zone->nb_dev = c;
248*4882a593Smuzhiyun 		sectors = (smallest->sectors - zone->dev_start) * c;
249*4882a593Smuzhiyun 		pr_debug("md/raid0:%s: zone->nb_dev: %d, sectors: %llu\n",
250*4882a593Smuzhiyun 			 mdname(mddev),
251*4882a593Smuzhiyun 			 zone->nb_dev, (unsigned long long)sectors);
252*4882a593Smuzhiyun 
253*4882a593Smuzhiyun 		curr_zone_end += sectors;
254*4882a593Smuzhiyun 		zone->zone_end = curr_zone_end;
255*4882a593Smuzhiyun 
256*4882a593Smuzhiyun 		pr_debug("md/raid0:%s: current zone start: %llu\n",
257*4882a593Smuzhiyun 			 mdname(mddev),
258*4882a593Smuzhiyun 			 (unsigned long long)smallest->sectors);
259*4882a593Smuzhiyun 	}
260*4882a593Smuzhiyun 
261*4882a593Smuzhiyun 	if (conf->nr_strip_zones == 1 || conf->strip_zone[1].nb_dev == 1) {
262*4882a593Smuzhiyun 		conf->layout = RAID0_ORIG_LAYOUT;
263*4882a593Smuzhiyun 	} else if (mddev->layout == RAID0_ORIG_LAYOUT ||
264*4882a593Smuzhiyun 		   mddev->layout == RAID0_ALT_MULTIZONE_LAYOUT) {
265*4882a593Smuzhiyun 		conf->layout = mddev->layout;
266*4882a593Smuzhiyun 	} else if (default_layout == RAID0_ORIG_LAYOUT ||
267*4882a593Smuzhiyun 		   default_layout == RAID0_ALT_MULTIZONE_LAYOUT) {
268*4882a593Smuzhiyun 		conf->layout = default_layout;
269*4882a593Smuzhiyun 	} else {
270*4882a593Smuzhiyun 		pr_err("md/raid0:%s: cannot assemble multi-zone RAID0 with default_layout setting\n",
271*4882a593Smuzhiyun 		       mdname(mddev));
272*4882a593Smuzhiyun 		pr_err("md/raid0: please set raid0.default_layout to 1 or 2\n");
273*4882a593Smuzhiyun 		err = -EOPNOTSUPP;
274*4882a593Smuzhiyun 		goto abort;
275*4882a593Smuzhiyun 	}
276*4882a593Smuzhiyun 
277*4882a593Smuzhiyun 	pr_debug("md/raid0:%s: done.\n", mdname(mddev));
278*4882a593Smuzhiyun 	*private_conf = conf;
279*4882a593Smuzhiyun 
280*4882a593Smuzhiyun 	return 0;
281*4882a593Smuzhiyun abort:
282*4882a593Smuzhiyun 	kfree(conf->strip_zone);
283*4882a593Smuzhiyun 	kfree(conf->devlist);
284*4882a593Smuzhiyun 	kfree(conf);
285*4882a593Smuzhiyun 	*private_conf = ERR_PTR(err);
286*4882a593Smuzhiyun 	return err;
287*4882a593Smuzhiyun }
288*4882a593Smuzhiyun 
289*4882a593Smuzhiyun /* Find the zone which holds a particular offset
290*4882a593Smuzhiyun  * Update *sectorp to be an offset in that zone
291*4882a593Smuzhiyun  */
find_zone(struct r0conf * conf,sector_t * sectorp)292*4882a593Smuzhiyun static struct strip_zone *find_zone(struct r0conf *conf,
293*4882a593Smuzhiyun 				    sector_t *sectorp)
294*4882a593Smuzhiyun {
295*4882a593Smuzhiyun 	int i;
296*4882a593Smuzhiyun 	struct strip_zone *z = conf->strip_zone;
297*4882a593Smuzhiyun 	sector_t sector = *sectorp;
298*4882a593Smuzhiyun 
299*4882a593Smuzhiyun 	for (i = 0; i < conf->nr_strip_zones; i++)
300*4882a593Smuzhiyun 		if (sector < z[i].zone_end) {
301*4882a593Smuzhiyun 			if (i)
302*4882a593Smuzhiyun 				*sectorp = sector - z[i-1].zone_end;
303*4882a593Smuzhiyun 			return z + i;
304*4882a593Smuzhiyun 		}
305*4882a593Smuzhiyun 	BUG();
306*4882a593Smuzhiyun }
307*4882a593Smuzhiyun 
308*4882a593Smuzhiyun /*
309*4882a593Smuzhiyun  * remaps the bio to the target device. we separate two flows.
310*4882a593Smuzhiyun  * power 2 flow and a general flow for the sake of performance
311*4882a593Smuzhiyun */
map_sector(struct mddev * mddev,struct strip_zone * zone,sector_t sector,sector_t * sector_offset)312*4882a593Smuzhiyun static struct md_rdev *map_sector(struct mddev *mddev, struct strip_zone *zone,
313*4882a593Smuzhiyun 				sector_t sector, sector_t *sector_offset)
314*4882a593Smuzhiyun {
315*4882a593Smuzhiyun 	unsigned int sect_in_chunk;
316*4882a593Smuzhiyun 	sector_t chunk;
317*4882a593Smuzhiyun 	struct r0conf *conf = mddev->private;
318*4882a593Smuzhiyun 	int raid_disks = conf->strip_zone[0].nb_dev;
319*4882a593Smuzhiyun 	unsigned int chunk_sects = mddev->chunk_sectors;
320*4882a593Smuzhiyun 
321*4882a593Smuzhiyun 	if (is_power_of_2(chunk_sects)) {
322*4882a593Smuzhiyun 		int chunksect_bits = ffz(~chunk_sects);
323*4882a593Smuzhiyun 		/* find the sector offset inside the chunk */
324*4882a593Smuzhiyun 		sect_in_chunk  = sector & (chunk_sects - 1);
325*4882a593Smuzhiyun 		sector >>= chunksect_bits;
326*4882a593Smuzhiyun 		/* chunk in zone */
327*4882a593Smuzhiyun 		chunk = *sector_offset;
328*4882a593Smuzhiyun 		/* quotient is the chunk in real device*/
329*4882a593Smuzhiyun 		sector_div(chunk, zone->nb_dev << chunksect_bits);
330*4882a593Smuzhiyun 	} else{
331*4882a593Smuzhiyun 		sect_in_chunk = sector_div(sector, chunk_sects);
332*4882a593Smuzhiyun 		chunk = *sector_offset;
333*4882a593Smuzhiyun 		sector_div(chunk, chunk_sects * zone->nb_dev);
334*4882a593Smuzhiyun 	}
335*4882a593Smuzhiyun 	/*
336*4882a593Smuzhiyun 	*  position the bio over the real device
337*4882a593Smuzhiyun 	*  real sector = chunk in device + starting of zone
338*4882a593Smuzhiyun 	*	+ the position in the chunk
339*4882a593Smuzhiyun 	*/
340*4882a593Smuzhiyun 	*sector_offset = (chunk * chunk_sects) + sect_in_chunk;
341*4882a593Smuzhiyun 	return conf->devlist[(zone - conf->strip_zone)*raid_disks
342*4882a593Smuzhiyun 			     + sector_div(sector, zone->nb_dev)];
343*4882a593Smuzhiyun }
344*4882a593Smuzhiyun 
/*
 * Return the usable size of the array in sectors: the sum, over all member
 * devices, of the device size rounded down to a whole number of chunks.
 *
 * @sectors and @raid_disks must both be 0; raid0 has no generic reshape and
 * anything else only triggers a one-time warning.
 *
 * The rounding is done by division rather than by masking with
 * (chunk_sectors - 1): the mask is only correct for power-of-two chunk
 * sizes, and would otherwise report less than the zone table built by
 * create_strip_zones(), which rounds by division as well.
 */
static sector_t raid0_size(struct mddev *mddev, sector_t sectors, int raid_disks)
{
	sector_t array_sectors = 0;
	struct md_rdev *rdev;

	WARN_ONCE(sectors || raid_disks,
		  "%s does not support generic reshape\n", __func__);

	/* no chunk size yet: nothing is usable (and avoid dividing by zero) */
	if (!mddev->chunk_sectors)
		return 0;

	rdev_for_each(rdev, mddev) {
		sector_t chunks = rdev->sectors;

		/* sector_div() leaves the quotient in 'chunks' */
		sector_div(chunks, mddev->chunk_sectors);
		array_sectors += chunks * mddev->chunk_sectors;
	}

	return array_sectors;
}
359*4882a593Smuzhiyun 
360*4882a593Smuzhiyun static void raid0_free(struct mddev *mddev, void *priv);
361*4882a593Smuzhiyun 
raid0_run(struct mddev * mddev)362*4882a593Smuzhiyun static int raid0_run(struct mddev *mddev)
363*4882a593Smuzhiyun {
364*4882a593Smuzhiyun 	struct r0conf *conf;
365*4882a593Smuzhiyun 	int ret;
366*4882a593Smuzhiyun 
367*4882a593Smuzhiyun 	if (mddev->chunk_sectors == 0) {
368*4882a593Smuzhiyun 		pr_warn("md/raid0:%s: chunk size must be set.\n", mdname(mddev));
369*4882a593Smuzhiyun 		return -EINVAL;
370*4882a593Smuzhiyun 	}
371*4882a593Smuzhiyun 	if (md_check_no_bitmap(mddev))
372*4882a593Smuzhiyun 		return -EINVAL;
373*4882a593Smuzhiyun 
374*4882a593Smuzhiyun 	/* if private is not null, we are here after takeover */
375*4882a593Smuzhiyun 	if (mddev->private == NULL) {
376*4882a593Smuzhiyun 		ret = create_strip_zones(mddev, &conf);
377*4882a593Smuzhiyun 		if (ret < 0)
378*4882a593Smuzhiyun 			return ret;
379*4882a593Smuzhiyun 		mddev->private = conf;
380*4882a593Smuzhiyun 	}
381*4882a593Smuzhiyun 	conf = mddev->private;
382*4882a593Smuzhiyun 	if (mddev->queue) {
383*4882a593Smuzhiyun 		struct md_rdev *rdev;
384*4882a593Smuzhiyun 		bool discard_supported = false;
385*4882a593Smuzhiyun 
386*4882a593Smuzhiyun 		blk_queue_max_hw_sectors(mddev->queue, mddev->chunk_sectors);
387*4882a593Smuzhiyun 		blk_queue_max_write_same_sectors(mddev->queue, mddev->chunk_sectors);
388*4882a593Smuzhiyun 		blk_queue_max_write_zeroes_sectors(mddev->queue, mddev->chunk_sectors);
389*4882a593Smuzhiyun 		blk_queue_max_discard_sectors(mddev->queue, UINT_MAX);
390*4882a593Smuzhiyun 
391*4882a593Smuzhiyun 		blk_queue_io_min(mddev->queue, mddev->chunk_sectors << 9);
392*4882a593Smuzhiyun 		blk_queue_io_opt(mddev->queue,
393*4882a593Smuzhiyun 				 (mddev->chunk_sectors << 9) * mddev->raid_disks);
394*4882a593Smuzhiyun 
395*4882a593Smuzhiyun 		rdev_for_each(rdev, mddev) {
396*4882a593Smuzhiyun 			disk_stack_limits(mddev->gendisk, rdev->bdev,
397*4882a593Smuzhiyun 					  rdev->data_offset << 9);
398*4882a593Smuzhiyun 			if (blk_queue_discard(bdev_get_queue(rdev->bdev)))
399*4882a593Smuzhiyun 				discard_supported = true;
400*4882a593Smuzhiyun 		}
401*4882a593Smuzhiyun 		if (!discard_supported)
402*4882a593Smuzhiyun 			blk_queue_flag_clear(QUEUE_FLAG_DISCARD, mddev->queue);
403*4882a593Smuzhiyun 		else
404*4882a593Smuzhiyun 			blk_queue_flag_set(QUEUE_FLAG_DISCARD, mddev->queue);
405*4882a593Smuzhiyun 	}
406*4882a593Smuzhiyun 
407*4882a593Smuzhiyun 	/* calculate array device size */
408*4882a593Smuzhiyun 	md_set_array_sectors(mddev, raid0_size(mddev, 0, 0));
409*4882a593Smuzhiyun 
410*4882a593Smuzhiyun 	pr_debug("md/raid0:%s: md_size is %llu sectors.\n",
411*4882a593Smuzhiyun 		 mdname(mddev),
412*4882a593Smuzhiyun 		 (unsigned long long)mddev->array_sectors);
413*4882a593Smuzhiyun 
414*4882a593Smuzhiyun 	dump_zones(mddev);
415*4882a593Smuzhiyun 
416*4882a593Smuzhiyun 	ret = md_integrity_register(mddev);
417*4882a593Smuzhiyun 
418*4882a593Smuzhiyun 	return ret;
419*4882a593Smuzhiyun }
420*4882a593Smuzhiyun 
raid0_free(struct mddev * mddev,void * priv)421*4882a593Smuzhiyun static void raid0_free(struct mddev *mddev, void *priv)
422*4882a593Smuzhiyun {
423*4882a593Smuzhiyun 	struct r0conf *conf = priv;
424*4882a593Smuzhiyun 
425*4882a593Smuzhiyun 	kfree(conf->strip_zone);
426*4882a593Smuzhiyun 	kfree(conf->devlist);
427*4882a593Smuzhiyun 	kfree(conf);
428*4882a593Smuzhiyun }
429*4882a593Smuzhiyun 
raid0_handle_discard(struct mddev * mddev,struct bio * bio)430*4882a593Smuzhiyun static void raid0_handle_discard(struct mddev *mddev, struct bio *bio)
431*4882a593Smuzhiyun {
432*4882a593Smuzhiyun 	struct r0conf *conf = mddev->private;
433*4882a593Smuzhiyun 	struct strip_zone *zone;
434*4882a593Smuzhiyun 	sector_t start = bio->bi_iter.bi_sector;
435*4882a593Smuzhiyun 	sector_t end;
436*4882a593Smuzhiyun 	unsigned int stripe_size;
437*4882a593Smuzhiyun 	sector_t first_stripe_index, last_stripe_index;
438*4882a593Smuzhiyun 	sector_t start_disk_offset;
439*4882a593Smuzhiyun 	unsigned int start_disk_index;
440*4882a593Smuzhiyun 	sector_t end_disk_offset;
441*4882a593Smuzhiyun 	unsigned int end_disk_index;
442*4882a593Smuzhiyun 	unsigned int disk;
443*4882a593Smuzhiyun 
444*4882a593Smuzhiyun 	zone = find_zone(conf, &start);
445*4882a593Smuzhiyun 
446*4882a593Smuzhiyun 	if (bio_end_sector(bio) > zone->zone_end) {
447*4882a593Smuzhiyun 		struct bio *split = bio_split(bio,
448*4882a593Smuzhiyun 			zone->zone_end - bio->bi_iter.bi_sector, GFP_NOIO,
449*4882a593Smuzhiyun 			&mddev->bio_set);
450*4882a593Smuzhiyun 		bio_chain(split, bio);
451*4882a593Smuzhiyun 		submit_bio_noacct(bio);
452*4882a593Smuzhiyun 		bio = split;
453*4882a593Smuzhiyun 		end = zone->zone_end;
454*4882a593Smuzhiyun 	} else
455*4882a593Smuzhiyun 		end = bio_end_sector(bio);
456*4882a593Smuzhiyun 
457*4882a593Smuzhiyun 	if (zone != conf->strip_zone)
458*4882a593Smuzhiyun 		end = end - zone[-1].zone_end;
459*4882a593Smuzhiyun 
460*4882a593Smuzhiyun 	/* Now start and end is the offset in zone */
461*4882a593Smuzhiyun 	stripe_size = zone->nb_dev * mddev->chunk_sectors;
462*4882a593Smuzhiyun 
463*4882a593Smuzhiyun 	first_stripe_index = start;
464*4882a593Smuzhiyun 	sector_div(first_stripe_index, stripe_size);
465*4882a593Smuzhiyun 	last_stripe_index = end;
466*4882a593Smuzhiyun 	sector_div(last_stripe_index, stripe_size);
467*4882a593Smuzhiyun 
468*4882a593Smuzhiyun 	start_disk_index = (int)(start - first_stripe_index * stripe_size) /
469*4882a593Smuzhiyun 		mddev->chunk_sectors;
470*4882a593Smuzhiyun 	start_disk_offset = ((int)(start - first_stripe_index * stripe_size) %
471*4882a593Smuzhiyun 		mddev->chunk_sectors) +
472*4882a593Smuzhiyun 		first_stripe_index * mddev->chunk_sectors;
473*4882a593Smuzhiyun 	end_disk_index = (int)(end - last_stripe_index * stripe_size) /
474*4882a593Smuzhiyun 		mddev->chunk_sectors;
475*4882a593Smuzhiyun 	end_disk_offset = ((int)(end - last_stripe_index * stripe_size) %
476*4882a593Smuzhiyun 		mddev->chunk_sectors) +
477*4882a593Smuzhiyun 		last_stripe_index * mddev->chunk_sectors;
478*4882a593Smuzhiyun 
479*4882a593Smuzhiyun 	for (disk = 0; disk < zone->nb_dev; disk++) {
480*4882a593Smuzhiyun 		sector_t dev_start, dev_end;
481*4882a593Smuzhiyun 		struct bio *discard_bio = NULL;
482*4882a593Smuzhiyun 		struct md_rdev *rdev;
483*4882a593Smuzhiyun 
484*4882a593Smuzhiyun 		if (disk < start_disk_index)
485*4882a593Smuzhiyun 			dev_start = (first_stripe_index + 1) *
486*4882a593Smuzhiyun 				mddev->chunk_sectors;
487*4882a593Smuzhiyun 		else if (disk > start_disk_index)
488*4882a593Smuzhiyun 			dev_start = first_stripe_index * mddev->chunk_sectors;
489*4882a593Smuzhiyun 		else
490*4882a593Smuzhiyun 			dev_start = start_disk_offset;
491*4882a593Smuzhiyun 
492*4882a593Smuzhiyun 		if (disk < end_disk_index)
493*4882a593Smuzhiyun 			dev_end = (last_stripe_index + 1) * mddev->chunk_sectors;
494*4882a593Smuzhiyun 		else if (disk > end_disk_index)
495*4882a593Smuzhiyun 			dev_end = last_stripe_index * mddev->chunk_sectors;
496*4882a593Smuzhiyun 		else
497*4882a593Smuzhiyun 			dev_end = end_disk_offset;
498*4882a593Smuzhiyun 
499*4882a593Smuzhiyun 		if (dev_end <= dev_start)
500*4882a593Smuzhiyun 			continue;
501*4882a593Smuzhiyun 
502*4882a593Smuzhiyun 		rdev = conf->devlist[(zone - conf->strip_zone) *
503*4882a593Smuzhiyun 			conf->strip_zone[0].nb_dev + disk];
504*4882a593Smuzhiyun 		if (__blkdev_issue_discard(rdev->bdev,
505*4882a593Smuzhiyun 			dev_start + zone->dev_start + rdev->data_offset,
506*4882a593Smuzhiyun 			dev_end - dev_start, GFP_NOIO, 0, &discard_bio) ||
507*4882a593Smuzhiyun 		    !discard_bio)
508*4882a593Smuzhiyun 			continue;
509*4882a593Smuzhiyun 		bio_chain(discard_bio, bio);
510*4882a593Smuzhiyun 		bio_clone_blkg_association(discard_bio, bio);
511*4882a593Smuzhiyun 		if (mddev->gendisk)
512*4882a593Smuzhiyun 			trace_block_bio_remap(bdev_get_queue(rdev->bdev),
513*4882a593Smuzhiyun 				discard_bio, disk_devt(mddev->gendisk),
514*4882a593Smuzhiyun 				bio->bi_iter.bi_sector);
515*4882a593Smuzhiyun 		submit_bio_noacct(discard_bio);
516*4882a593Smuzhiyun 	}
517*4882a593Smuzhiyun 	bio_endio(bio);
518*4882a593Smuzhiyun }
519*4882a593Smuzhiyun 
raid0_make_request(struct mddev * mddev,struct bio * bio)520*4882a593Smuzhiyun static bool raid0_make_request(struct mddev *mddev, struct bio *bio)
521*4882a593Smuzhiyun {
522*4882a593Smuzhiyun 	struct r0conf *conf = mddev->private;
523*4882a593Smuzhiyun 	struct strip_zone *zone;
524*4882a593Smuzhiyun 	struct md_rdev *tmp_dev;
525*4882a593Smuzhiyun 	sector_t bio_sector;
526*4882a593Smuzhiyun 	sector_t sector;
527*4882a593Smuzhiyun 	sector_t orig_sector;
528*4882a593Smuzhiyun 	unsigned chunk_sects;
529*4882a593Smuzhiyun 	unsigned sectors;
530*4882a593Smuzhiyun 
531*4882a593Smuzhiyun 	if (unlikely(bio->bi_opf & REQ_PREFLUSH)
532*4882a593Smuzhiyun 	    && md_flush_request(mddev, bio))
533*4882a593Smuzhiyun 		return true;
534*4882a593Smuzhiyun 
535*4882a593Smuzhiyun 	if (unlikely((bio_op(bio) == REQ_OP_DISCARD))) {
536*4882a593Smuzhiyun 		raid0_handle_discard(mddev, bio);
537*4882a593Smuzhiyun 		return true;
538*4882a593Smuzhiyun 	}
539*4882a593Smuzhiyun 
540*4882a593Smuzhiyun 	bio_sector = bio->bi_iter.bi_sector;
541*4882a593Smuzhiyun 	sector = bio_sector;
542*4882a593Smuzhiyun 	chunk_sects = mddev->chunk_sectors;
543*4882a593Smuzhiyun 
544*4882a593Smuzhiyun 	sectors = chunk_sects -
545*4882a593Smuzhiyun 		(likely(is_power_of_2(chunk_sects))
546*4882a593Smuzhiyun 		 ? (sector & (chunk_sects-1))
547*4882a593Smuzhiyun 		 : sector_div(sector, chunk_sects));
548*4882a593Smuzhiyun 
549*4882a593Smuzhiyun 	/* Restore due to sector_div */
550*4882a593Smuzhiyun 	sector = bio_sector;
551*4882a593Smuzhiyun 
552*4882a593Smuzhiyun 	if (sectors < bio_sectors(bio)) {
553*4882a593Smuzhiyun 		struct bio *split = bio_split(bio, sectors, GFP_NOIO,
554*4882a593Smuzhiyun 					      &mddev->bio_set);
555*4882a593Smuzhiyun 		bio_chain(split, bio);
556*4882a593Smuzhiyun 		submit_bio_noacct(bio);
557*4882a593Smuzhiyun 		bio = split;
558*4882a593Smuzhiyun 	}
559*4882a593Smuzhiyun 
560*4882a593Smuzhiyun 	orig_sector = sector;
561*4882a593Smuzhiyun 	zone = find_zone(mddev->private, &sector);
562*4882a593Smuzhiyun 	switch (conf->layout) {
563*4882a593Smuzhiyun 	case RAID0_ORIG_LAYOUT:
564*4882a593Smuzhiyun 		tmp_dev = map_sector(mddev, zone, orig_sector, &sector);
565*4882a593Smuzhiyun 		break;
566*4882a593Smuzhiyun 	case RAID0_ALT_MULTIZONE_LAYOUT:
567*4882a593Smuzhiyun 		tmp_dev = map_sector(mddev, zone, sector, &sector);
568*4882a593Smuzhiyun 		break;
569*4882a593Smuzhiyun 	default:
570*4882a593Smuzhiyun 		WARN(1, "md/raid0:%s: Invalid layout\n", mdname(mddev));
571*4882a593Smuzhiyun 		bio_io_error(bio);
572*4882a593Smuzhiyun 		return true;
573*4882a593Smuzhiyun 	}
574*4882a593Smuzhiyun 
575*4882a593Smuzhiyun 	if (unlikely(is_mddev_broken(tmp_dev, "raid0"))) {
576*4882a593Smuzhiyun 		bio_io_error(bio);
577*4882a593Smuzhiyun 		return true;
578*4882a593Smuzhiyun 	}
579*4882a593Smuzhiyun 
580*4882a593Smuzhiyun 	bio_set_dev(bio, tmp_dev->bdev);
581*4882a593Smuzhiyun 	bio->bi_iter.bi_sector = sector + zone->dev_start +
582*4882a593Smuzhiyun 		tmp_dev->data_offset;
583*4882a593Smuzhiyun 
584*4882a593Smuzhiyun 	if (mddev->gendisk)
585*4882a593Smuzhiyun 		trace_block_bio_remap(bio->bi_disk->queue, bio,
586*4882a593Smuzhiyun 				disk_devt(mddev->gendisk), bio_sector);
587*4882a593Smuzhiyun 	mddev_check_writesame(mddev, bio);
588*4882a593Smuzhiyun 	mddev_check_write_zeroes(mddev, bio);
589*4882a593Smuzhiyun 	submit_bio_noacct(bio);
590*4882a593Smuzhiyun 	return true;
591*4882a593Smuzhiyun }
592*4882a593Smuzhiyun 
raid0_status(struct seq_file * seq,struct mddev * mddev)593*4882a593Smuzhiyun static void raid0_status(struct seq_file *seq, struct mddev *mddev)
594*4882a593Smuzhiyun {
595*4882a593Smuzhiyun 	seq_printf(seq, " %dk chunks", mddev->chunk_sectors / 2);
596*4882a593Smuzhiyun 	return;
597*4882a593Smuzhiyun }
598*4882a593Smuzhiyun 
raid0_takeover_raid45(struct mddev * mddev)599*4882a593Smuzhiyun static void *raid0_takeover_raid45(struct mddev *mddev)
600*4882a593Smuzhiyun {
601*4882a593Smuzhiyun 	struct md_rdev *rdev;
602*4882a593Smuzhiyun 	struct r0conf *priv_conf;
603*4882a593Smuzhiyun 
604*4882a593Smuzhiyun 	if (mddev->degraded != 1) {
605*4882a593Smuzhiyun 		pr_warn("md/raid0:%s: raid5 must be degraded! Degraded disks: %d\n",
606*4882a593Smuzhiyun 			mdname(mddev),
607*4882a593Smuzhiyun 			mddev->degraded);
608*4882a593Smuzhiyun 		return ERR_PTR(-EINVAL);
609*4882a593Smuzhiyun 	}
610*4882a593Smuzhiyun 
611*4882a593Smuzhiyun 	rdev_for_each(rdev, mddev) {
612*4882a593Smuzhiyun 		/* check slot number for a disk */
613*4882a593Smuzhiyun 		if (rdev->raid_disk == mddev->raid_disks-1) {
614*4882a593Smuzhiyun 			pr_warn("md/raid0:%s: raid5 must have missing parity disk!\n",
615*4882a593Smuzhiyun 				mdname(mddev));
616*4882a593Smuzhiyun 			return ERR_PTR(-EINVAL);
617*4882a593Smuzhiyun 		}
618*4882a593Smuzhiyun 		rdev->sectors = mddev->dev_sectors;
619*4882a593Smuzhiyun 	}
620*4882a593Smuzhiyun 
621*4882a593Smuzhiyun 	/* Set new parameters */
622*4882a593Smuzhiyun 	mddev->new_level = 0;
623*4882a593Smuzhiyun 	mddev->new_layout = 0;
624*4882a593Smuzhiyun 	mddev->new_chunk_sectors = mddev->chunk_sectors;
625*4882a593Smuzhiyun 	mddev->raid_disks--;
626*4882a593Smuzhiyun 	mddev->delta_disks = -1;
627*4882a593Smuzhiyun 	/* make sure it will be not marked as dirty */
628*4882a593Smuzhiyun 	mddev->recovery_cp = MaxSector;
629*4882a593Smuzhiyun 	mddev_clear_unsupported_flags(mddev, UNSUPPORTED_MDDEV_FLAGS);
630*4882a593Smuzhiyun 
631*4882a593Smuzhiyun 	create_strip_zones(mddev, &priv_conf);
632*4882a593Smuzhiyun 
633*4882a593Smuzhiyun 	return priv_conf;
634*4882a593Smuzhiyun }
635*4882a593Smuzhiyun 
raid0_takeover_raid10(struct mddev * mddev)636*4882a593Smuzhiyun static void *raid0_takeover_raid10(struct mddev *mddev)
637*4882a593Smuzhiyun {
638*4882a593Smuzhiyun 	struct r0conf *priv_conf;
639*4882a593Smuzhiyun 
640*4882a593Smuzhiyun 	/* Check layout:
641*4882a593Smuzhiyun 	 *  - far_copies must be 1
642*4882a593Smuzhiyun 	 *  - near_copies must be 2
643*4882a593Smuzhiyun 	 *  - disks number must be even
644*4882a593Smuzhiyun 	 *  - all mirrors must be already degraded
645*4882a593Smuzhiyun 	 */
646*4882a593Smuzhiyun 	if (mddev->layout != ((1 << 8) + 2)) {
647*4882a593Smuzhiyun 		pr_warn("md/raid0:%s:: Raid0 cannot takeover layout: 0x%x\n",
648*4882a593Smuzhiyun 			mdname(mddev),
649*4882a593Smuzhiyun 			mddev->layout);
650*4882a593Smuzhiyun 		return ERR_PTR(-EINVAL);
651*4882a593Smuzhiyun 	}
652*4882a593Smuzhiyun 	if (mddev->raid_disks & 1) {
653*4882a593Smuzhiyun 		pr_warn("md/raid0:%s: Raid0 cannot takeover Raid10 with odd disk number.\n",
654*4882a593Smuzhiyun 			mdname(mddev));
655*4882a593Smuzhiyun 		return ERR_PTR(-EINVAL);
656*4882a593Smuzhiyun 	}
657*4882a593Smuzhiyun 	if (mddev->degraded != (mddev->raid_disks>>1)) {
658*4882a593Smuzhiyun 		pr_warn("md/raid0:%s: All mirrors must be already degraded!\n",
659*4882a593Smuzhiyun 			mdname(mddev));
660*4882a593Smuzhiyun 		return ERR_PTR(-EINVAL);
661*4882a593Smuzhiyun 	}
662*4882a593Smuzhiyun 
663*4882a593Smuzhiyun 	/* Set new parameters */
664*4882a593Smuzhiyun 	mddev->new_level = 0;
665*4882a593Smuzhiyun 	mddev->new_layout = 0;
666*4882a593Smuzhiyun 	mddev->new_chunk_sectors = mddev->chunk_sectors;
667*4882a593Smuzhiyun 	mddev->delta_disks = - mddev->raid_disks / 2;
668*4882a593Smuzhiyun 	mddev->raid_disks += mddev->delta_disks;
669*4882a593Smuzhiyun 	mddev->degraded = 0;
670*4882a593Smuzhiyun 	/* make sure it will be not marked as dirty */
671*4882a593Smuzhiyun 	mddev->recovery_cp = MaxSector;
672*4882a593Smuzhiyun 	mddev_clear_unsupported_flags(mddev, UNSUPPORTED_MDDEV_FLAGS);
673*4882a593Smuzhiyun 
674*4882a593Smuzhiyun 	create_strip_zones(mddev, &priv_conf);
675*4882a593Smuzhiyun 	return priv_conf;
676*4882a593Smuzhiyun }
677*4882a593Smuzhiyun 
raid0_takeover_raid1(struct mddev * mddev)678*4882a593Smuzhiyun static void *raid0_takeover_raid1(struct mddev *mddev)
679*4882a593Smuzhiyun {
680*4882a593Smuzhiyun 	struct r0conf *priv_conf;
681*4882a593Smuzhiyun 	int chunksect;
682*4882a593Smuzhiyun 
683*4882a593Smuzhiyun 	/* Check layout:
684*4882a593Smuzhiyun 	 *  - (N - 1) mirror drives must be already faulty
685*4882a593Smuzhiyun 	 */
686*4882a593Smuzhiyun 	if ((mddev->raid_disks - 1) != mddev->degraded) {
687*4882a593Smuzhiyun 		pr_err("md/raid0:%s: (N - 1) mirrors drives must be already faulty!\n",
688*4882a593Smuzhiyun 		       mdname(mddev));
689*4882a593Smuzhiyun 		return ERR_PTR(-EINVAL);
690*4882a593Smuzhiyun 	}
691*4882a593Smuzhiyun 
692*4882a593Smuzhiyun 	/*
693*4882a593Smuzhiyun 	 * a raid1 doesn't have the notion of chunk size, so
694*4882a593Smuzhiyun 	 * figure out the largest suitable size we can use.
695*4882a593Smuzhiyun 	 */
696*4882a593Smuzhiyun 	chunksect = 64 * 2; /* 64K by default */
697*4882a593Smuzhiyun 
698*4882a593Smuzhiyun 	/* The array must be an exact multiple of chunksize */
699*4882a593Smuzhiyun 	while (chunksect && (mddev->array_sectors & (chunksect - 1)))
700*4882a593Smuzhiyun 		chunksect >>= 1;
701*4882a593Smuzhiyun 
702*4882a593Smuzhiyun 	if ((chunksect << 9) < PAGE_SIZE)
703*4882a593Smuzhiyun 		/* array size does not allow a suitable chunk size */
704*4882a593Smuzhiyun 		return ERR_PTR(-EINVAL);
705*4882a593Smuzhiyun 
706*4882a593Smuzhiyun 	/* Set new parameters */
707*4882a593Smuzhiyun 	mddev->new_level = 0;
708*4882a593Smuzhiyun 	mddev->new_layout = 0;
709*4882a593Smuzhiyun 	mddev->new_chunk_sectors = chunksect;
710*4882a593Smuzhiyun 	mddev->chunk_sectors = chunksect;
711*4882a593Smuzhiyun 	mddev->delta_disks = 1 - mddev->raid_disks;
712*4882a593Smuzhiyun 	mddev->raid_disks = 1;
713*4882a593Smuzhiyun 	/* make sure it will be not marked as dirty */
714*4882a593Smuzhiyun 	mddev->recovery_cp = MaxSector;
715*4882a593Smuzhiyun 	mddev_clear_unsupported_flags(mddev, UNSUPPORTED_MDDEV_FLAGS);
716*4882a593Smuzhiyun 
717*4882a593Smuzhiyun 	create_strip_zones(mddev, &priv_conf);
718*4882a593Smuzhiyun 	return priv_conf;
719*4882a593Smuzhiyun }
720*4882a593Smuzhiyun 
raid0_takeover(struct mddev * mddev)721*4882a593Smuzhiyun static void *raid0_takeover(struct mddev *mddev)
722*4882a593Smuzhiyun {
723*4882a593Smuzhiyun 	/* raid0 can take over:
724*4882a593Smuzhiyun 	 *  raid4 - if all data disks are active.
725*4882a593Smuzhiyun 	 *  raid5 - providing it is Raid4 layout and one disk is faulty
726*4882a593Smuzhiyun 	 *  raid10 - assuming we have all necessary active disks
727*4882a593Smuzhiyun 	 *  raid1 - with (N -1) mirror drives faulty
728*4882a593Smuzhiyun 	 */
729*4882a593Smuzhiyun 
730*4882a593Smuzhiyun 	if (mddev->bitmap) {
731*4882a593Smuzhiyun 		pr_warn("md/raid0: %s: cannot takeover array with bitmap\n",
732*4882a593Smuzhiyun 			mdname(mddev));
733*4882a593Smuzhiyun 		return ERR_PTR(-EBUSY);
734*4882a593Smuzhiyun 	}
735*4882a593Smuzhiyun 	if (mddev->level == 4)
736*4882a593Smuzhiyun 		return raid0_takeover_raid45(mddev);
737*4882a593Smuzhiyun 
738*4882a593Smuzhiyun 	if (mddev->level == 5) {
739*4882a593Smuzhiyun 		if (mddev->layout == ALGORITHM_PARITY_N)
740*4882a593Smuzhiyun 			return raid0_takeover_raid45(mddev);
741*4882a593Smuzhiyun 
742*4882a593Smuzhiyun 		pr_warn("md/raid0:%s: Raid can only takeover Raid5 with layout: %d\n",
743*4882a593Smuzhiyun 			mdname(mddev), ALGORITHM_PARITY_N);
744*4882a593Smuzhiyun 	}
745*4882a593Smuzhiyun 
746*4882a593Smuzhiyun 	if (mddev->level == 10)
747*4882a593Smuzhiyun 		return raid0_takeover_raid10(mddev);
748*4882a593Smuzhiyun 
749*4882a593Smuzhiyun 	if (mddev->level == 1)
750*4882a593Smuzhiyun 		return raid0_takeover_raid1(mddev);
751*4882a593Smuzhiyun 
752*4882a593Smuzhiyun 	pr_warn("Takeover from raid%i to raid0 not supported\n",
753*4882a593Smuzhiyun 		mddev->level);
754*4882a593Smuzhiyun 
755*4882a593Smuzhiyun 	return ERR_PTR(-EINVAL);
756*4882a593Smuzhiyun }
757*4882a593Smuzhiyun 
/*
 * raid0_quiesce() - .quiesce hook of raid0_personality.
 *
 * Both @mddev and @quiesce are ignored; the function performs no work.
 */
static void raid0_quiesce(struct mddev *mddev, int quiesce)
{
	/* Intentionally empty. */
}
761*4882a593Smuzhiyun 
762*4882a593Smuzhiyun static struct md_personality raid0_personality=
763*4882a593Smuzhiyun {
764*4882a593Smuzhiyun 	.name		= "raid0",
765*4882a593Smuzhiyun 	.level		= 0,
766*4882a593Smuzhiyun 	.owner		= THIS_MODULE,
767*4882a593Smuzhiyun 	.make_request	= raid0_make_request,
768*4882a593Smuzhiyun 	.run		= raid0_run,
769*4882a593Smuzhiyun 	.free		= raid0_free,
770*4882a593Smuzhiyun 	.status		= raid0_status,
771*4882a593Smuzhiyun 	.size		= raid0_size,
772*4882a593Smuzhiyun 	.takeover	= raid0_takeover,
773*4882a593Smuzhiyun 	.quiesce	= raid0_quiesce,
774*4882a593Smuzhiyun };
775*4882a593Smuzhiyun 
raid0_init(void)776*4882a593Smuzhiyun static int __init raid0_init (void)
777*4882a593Smuzhiyun {
778*4882a593Smuzhiyun 	return register_md_personality (&raid0_personality);
779*4882a593Smuzhiyun }
780*4882a593Smuzhiyun 
raid0_exit(void)781*4882a593Smuzhiyun static void raid0_exit (void)
782*4882a593Smuzhiyun {
783*4882a593Smuzhiyun 	unregister_md_personality (&raid0_personality);
784*4882a593Smuzhiyun }
785*4882a593Smuzhiyun 
786*4882a593Smuzhiyun module_init(raid0_init);
787*4882a593Smuzhiyun module_exit(raid0_exit);
788*4882a593Smuzhiyun MODULE_LICENSE("GPL");
789*4882a593Smuzhiyun MODULE_DESCRIPTION("RAID0 (striping) personality for MD");
790*4882a593Smuzhiyun MODULE_ALIAS("md-personality-2"); /* RAID0 */
791*4882a593Smuzhiyun MODULE_ALIAS("md-raid0");
792*4882a593Smuzhiyun MODULE_ALIAS("md-level-0");
793