xref: /openbmc/linux/drivers/md/raid0.c (revision 726bd223)
1 /*
2    raid0.c : Multiple Devices driver for Linux
3 	     Copyright (C) 1994-96 Marc ZYNGIER
4 	     <zyngier@ufr-info-p7.ibp.fr> or
5 	     <maz@gloups.fdn.fr>
6 	     Copyright (C) 1999, 2000 Ingo Molnar, Red Hat
7 
8    RAID-0 management functions.
9 
10    This program is free software; you can redistribute it and/or modify
11    it under the terms of the GNU General Public License as published by
12    the Free Software Foundation; either version 2, or (at your option)
13    any later version.
14 
15    You should have received a copy of the GNU General Public License
16    (for example /usr/src/linux/COPYING); if not, write to the Free
17    Software Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
18 */
19 
20 #include <linux/blkdev.h>
21 #include <linux/seq_file.h>
22 #include <linux/module.h>
23 #include <linux/slab.h>
24 #include <trace/events/block.h>
25 #include "md.h"
26 #include "raid0.h"
27 #include "raid5.h"
28 
/*
 * Bits of the mddev flags word that this personality treats as unsupported.
 * The takeover helpers in this file hand the mask to
 * mddev_clear_unsupported_flags().
 */
#define UNSUPPORTED_MDDEV_FLAGS			\
	((1L << MD_HAS_JOURNAL)		|	\
	 (1L << MD_JOURNAL_CLEAN)	|	\
	 (1L << MD_FAILFAST_SUPPORTED))
33 
34 static int raid0_congested(struct mddev *mddev, int bits)
35 {
36 	struct r0conf *conf = mddev->private;
37 	struct md_rdev **devlist = conf->devlist;
38 	int raid_disks = conf->strip_zone[0].nb_dev;
39 	int i, ret = 0;
40 
41 	for (i = 0; i < raid_disks && !ret ; i++) {
42 		struct request_queue *q = bdev_get_queue(devlist[i]->bdev);
43 
44 		ret |= bdi_congested(q->backing_dev_info, bits);
45 	}
46 	return ret;
47 }
48 
49 /*
50  * inform the user of the raid configuration
51 */
52 static void dump_zones(struct mddev *mddev)
53 {
54 	int j, k;
55 	sector_t zone_size = 0;
56 	sector_t zone_start = 0;
57 	char b[BDEVNAME_SIZE];
58 	struct r0conf *conf = mddev->private;
59 	int raid_disks = conf->strip_zone[0].nb_dev;
60 	pr_debug("md: RAID0 configuration for %s - %d zone%s\n",
61 		 mdname(mddev),
62 		 conf->nr_strip_zones, conf->nr_strip_zones==1?"":"s");
63 	for (j = 0; j < conf->nr_strip_zones; j++) {
64 		char line[200];
65 		int len = 0;
66 
67 		for (k = 0; k < conf->strip_zone[j].nb_dev; k++)
68 			len += snprintf(line+len, 200-len, "%s%s", k?"/":"",
69 					bdevname(conf->devlist[j*raid_disks
70 							       + k]->bdev, b));
71 		pr_debug("md: zone%d=[%s]\n", j, line);
72 
73 		zone_size  = conf->strip_zone[j].zone_end - zone_start;
74 		pr_debug("      zone-offset=%10lluKB, device-offset=%10lluKB, size=%10lluKB\n",
75 			(unsigned long long)zone_start>>1,
76 			(unsigned long long)conf->strip_zone[j].dev_start>>1,
77 			(unsigned long long)zone_size>>1);
78 		zone_start = conf->strip_zone[j].zone_end;
79 	}
80 }
81 
82 static int create_strip_zones(struct mddev *mddev, struct r0conf **private_conf)
83 {
84 	int i, c, err;
85 	sector_t curr_zone_end, sectors;
86 	struct md_rdev *smallest, *rdev1, *rdev2, *rdev, **dev;
87 	struct strip_zone *zone;
88 	int cnt;
89 	char b[BDEVNAME_SIZE];
90 	char b2[BDEVNAME_SIZE];
91 	struct r0conf *conf = kzalloc(sizeof(*conf), GFP_KERNEL);
92 	unsigned short blksize = 512;
93 
94 	*private_conf = ERR_PTR(-ENOMEM);
95 	if (!conf)
96 		return -ENOMEM;
97 	rdev_for_each(rdev1, mddev) {
98 		pr_debug("md/raid0:%s: looking at %s\n",
99 			 mdname(mddev),
100 			 bdevname(rdev1->bdev, b));
101 		c = 0;
102 
103 		/* round size to chunk_size */
104 		sectors = rdev1->sectors;
105 		sector_div(sectors, mddev->chunk_sectors);
106 		rdev1->sectors = sectors * mddev->chunk_sectors;
107 
108 		blksize = max(blksize, queue_logical_block_size(
109 				      rdev1->bdev->bd_disk->queue));
110 
111 		rdev_for_each(rdev2, mddev) {
112 			pr_debug("md/raid0:%s:   comparing %s(%llu)"
113 				 " with %s(%llu)\n",
114 				 mdname(mddev),
115 				 bdevname(rdev1->bdev,b),
116 				 (unsigned long long)rdev1->sectors,
117 				 bdevname(rdev2->bdev,b2),
118 				 (unsigned long long)rdev2->sectors);
119 			if (rdev2 == rdev1) {
120 				pr_debug("md/raid0:%s:   END\n",
121 					 mdname(mddev));
122 				break;
123 			}
124 			if (rdev2->sectors == rdev1->sectors) {
125 				/*
126 				 * Not unique, don't count it as a new
127 				 * group
128 				 */
129 				pr_debug("md/raid0:%s:   EQUAL\n",
130 					 mdname(mddev));
131 				c = 1;
132 				break;
133 			}
134 			pr_debug("md/raid0:%s:   NOT EQUAL\n",
135 				 mdname(mddev));
136 		}
137 		if (!c) {
138 			pr_debug("md/raid0:%s:   ==> UNIQUE\n",
139 				 mdname(mddev));
140 			conf->nr_strip_zones++;
141 			pr_debug("md/raid0:%s: %d zones\n",
142 				 mdname(mddev), conf->nr_strip_zones);
143 		}
144 	}
145 	pr_debug("md/raid0:%s: FINAL %d zones\n",
146 		 mdname(mddev), conf->nr_strip_zones);
147 	/*
148 	 * now since we have the hard sector sizes, we can make sure
149 	 * chunk size is a multiple of that sector size
150 	 */
151 	if ((mddev->chunk_sectors << 9) % blksize) {
152 		pr_warn("md/raid0:%s: chunk_size of %d not multiple of block size %d\n",
153 			mdname(mddev),
154 			mddev->chunk_sectors << 9, blksize);
155 		err = -EINVAL;
156 		goto abort;
157 	}
158 
159 	err = -ENOMEM;
160 	conf->strip_zone = kzalloc(sizeof(struct strip_zone)*
161 				conf->nr_strip_zones, GFP_KERNEL);
162 	if (!conf->strip_zone)
163 		goto abort;
164 	conf->devlist = kzalloc(sizeof(struct md_rdev*)*
165 				conf->nr_strip_zones*mddev->raid_disks,
166 				GFP_KERNEL);
167 	if (!conf->devlist)
168 		goto abort;
169 
170 	/* The first zone must contain all devices, so here we check that
171 	 * there is a proper alignment of slots to devices and find them all
172 	 */
173 	zone = &conf->strip_zone[0];
174 	cnt = 0;
175 	smallest = NULL;
176 	dev = conf->devlist;
177 	err = -EINVAL;
178 	rdev_for_each(rdev1, mddev) {
179 		int j = rdev1->raid_disk;
180 
181 		if (mddev->level == 10) {
182 			/* taking over a raid10-n2 array */
183 			j /= 2;
184 			rdev1->new_raid_disk = j;
185 		}
186 
187 		if (mddev->level == 1) {
188 			/* taiking over a raid1 array-
189 			 * we have only one active disk
190 			 */
191 			j = 0;
192 			rdev1->new_raid_disk = j;
193 		}
194 
195 		if (j < 0) {
196 			pr_warn("md/raid0:%s: remove inactive devices before converting to RAID0\n",
197 				mdname(mddev));
198 			goto abort;
199 		}
200 		if (j >= mddev->raid_disks) {
201 			pr_warn("md/raid0:%s: bad disk number %d - aborting!\n",
202 				mdname(mddev), j);
203 			goto abort;
204 		}
205 		if (dev[j]) {
206 			pr_warn("md/raid0:%s: multiple devices for %d - aborting!\n",
207 				mdname(mddev), j);
208 			goto abort;
209 		}
210 		dev[j] = rdev1;
211 
212 		if (!smallest || (rdev1->sectors < smallest->sectors))
213 			smallest = rdev1;
214 		cnt++;
215 	}
216 	if (cnt != mddev->raid_disks) {
217 		pr_warn("md/raid0:%s: too few disks (%d of %d) - aborting!\n",
218 			mdname(mddev), cnt, mddev->raid_disks);
219 		goto abort;
220 	}
221 	zone->nb_dev = cnt;
222 	zone->zone_end = smallest->sectors * cnt;
223 
224 	curr_zone_end = zone->zone_end;
225 
226 	/* now do the other zones */
227 	for (i = 1; i < conf->nr_strip_zones; i++)
228 	{
229 		int j;
230 
231 		zone = conf->strip_zone + i;
232 		dev = conf->devlist + i * mddev->raid_disks;
233 
234 		pr_debug("md/raid0:%s: zone %d\n", mdname(mddev), i);
235 		zone->dev_start = smallest->sectors;
236 		smallest = NULL;
237 		c = 0;
238 
239 		for (j=0; j<cnt; j++) {
240 			rdev = conf->devlist[j];
241 			if (rdev->sectors <= zone->dev_start) {
242 				pr_debug("md/raid0:%s: checking %s ... nope\n",
243 					 mdname(mddev),
244 					 bdevname(rdev->bdev, b));
245 				continue;
246 			}
247 			pr_debug("md/raid0:%s: checking %s ..."
248 				 " contained as device %d\n",
249 				 mdname(mddev),
250 				 bdevname(rdev->bdev, b), c);
251 			dev[c] = rdev;
252 			c++;
253 			if (!smallest || rdev->sectors < smallest->sectors) {
254 				smallest = rdev;
255 				pr_debug("md/raid0:%s:  (%llu) is smallest!.\n",
256 					 mdname(mddev),
257 					 (unsigned long long)rdev->sectors);
258 			}
259 		}
260 
261 		zone->nb_dev = c;
262 		sectors = (smallest->sectors - zone->dev_start) * c;
263 		pr_debug("md/raid0:%s: zone->nb_dev: %d, sectors: %llu\n",
264 			 mdname(mddev),
265 			 zone->nb_dev, (unsigned long long)sectors);
266 
267 		curr_zone_end += sectors;
268 		zone->zone_end = curr_zone_end;
269 
270 		pr_debug("md/raid0:%s: current zone start: %llu\n",
271 			 mdname(mddev),
272 			 (unsigned long long)smallest->sectors);
273 	}
274 
275 	pr_debug("md/raid0:%s: done.\n", mdname(mddev));
276 	*private_conf = conf;
277 
278 	return 0;
279 abort:
280 	kfree(conf->strip_zone);
281 	kfree(conf->devlist);
282 	kfree(conf);
283 	*private_conf = ERR_PTR(err);
284 	return err;
285 }
286 
287 /* Find the zone which holds a particular offset
288  * Update *sectorp to be an offset in that zone
289  */
290 static struct strip_zone *find_zone(struct r0conf *conf,
291 				    sector_t *sectorp)
292 {
293 	int i;
294 	struct strip_zone *z = conf->strip_zone;
295 	sector_t sector = *sectorp;
296 
297 	for (i = 0; i < conf->nr_strip_zones; i++)
298 		if (sector < z[i].zone_end) {
299 			if (i)
300 				*sectorp = sector - z[i-1].zone_end;
301 			return z + i;
302 		}
303 	BUG();
304 }
305 
306 /*
307  * remaps the bio to the target device. we separate two flows.
308  * power 2 flow and a general flow for the sake of performance
309 */
310 static struct md_rdev *map_sector(struct mddev *mddev, struct strip_zone *zone,
311 				sector_t sector, sector_t *sector_offset)
312 {
313 	unsigned int sect_in_chunk;
314 	sector_t chunk;
315 	struct r0conf *conf = mddev->private;
316 	int raid_disks = conf->strip_zone[0].nb_dev;
317 	unsigned int chunk_sects = mddev->chunk_sectors;
318 
319 	if (is_power_of_2(chunk_sects)) {
320 		int chunksect_bits = ffz(~chunk_sects);
321 		/* find the sector offset inside the chunk */
322 		sect_in_chunk  = sector & (chunk_sects - 1);
323 		sector >>= chunksect_bits;
324 		/* chunk in zone */
325 		chunk = *sector_offset;
326 		/* quotient is the chunk in real device*/
327 		sector_div(chunk, zone->nb_dev << chunksect_bits);
328 	} else{
329 		sect_in_chunk = sector_div(sector, chunk_sects);
330 		chunk = *sector_offset;
331 		sector_div(chunk, chunk_sects * zone->nb_dev);
332 	}
333 	/*
334 	*  position the bio over the real device
335 	*  real sector = chunk in device + starting of zone
336 	*	+ the position in the chunk
337 	*/
338 	*sector_offset = (chunk * chunk_sects) + sect_in_chunk;
339 	return conf->devlist[(zone - conf->strip_zone)*raid_disks
340 			     + sector_div(sector, zone->nb_dev)];
341 }
342 
343 static sector_t raid0_size(struct mddev *mddev, sector_t sectors, int raid_disks)
344 {
345 	sector_t array_sectors = 0;
346 	struct md_rdev *rdev;
347 
348 	WARN_ONCE(sectors || raid_disks,
349 		  "%s does not support generic reshape\n", __func__);
350 
351 	rdev_for_each(rdev, mddev)
352 		array_sectors += (rdev->sectors &
353 				  ~(sector_t)(mddev->chunk_sectors-1));
354 
355 	return array_sectors;
356 }
357 
358 static void raid0_free(struct mddev *mddev, void *priv);
359 
360 static int raid0_run(struct mddev *mddev)
361 {
362 	struct r0conf *conf;
363 	int ret;
364 
365 	if (mddev->chunk_sectors == 0) {
366 		pr_warn("md/raid0:%s: chunk size must be set.\n", mdname(mddev));
367 		return -EINVAL;
368 	}
369 	if (md_check_no_bitmap(mddev))
370 		return -EINVAL;
371 
372 	/* if private is not null, we are here after takeover */
373 	if (mddev->private == NULL) {
374 		ret = create_strip_zones(mddev, &conf);
375 		if (ret < 0)
376 			return ret;
377 		mddev->private = conf;
378 	}
379 	conf = mddev->private;
380 	if (mddev->queue) {
381 		struct md_rdev *rdev;
382 		bool discard_supported = false;
383 
384 		blk_queue_max_hw_sectors(mddev->queue, mddev->chunk_sectors);
385 		blk_queue_max_write_same_sectors(mddev->queue, mddev->chunk_sectors);
386 		blk_queue_max_discard_sectors(mddev->queue, mddev->chunk_sectors);
387 
388 		blk_queue_io_min(mddev->queue, mddev->chunk_sectors << 9);
389 		blk_queue_io_opt(mddev->queue,
390 				 (mddev->chunk_sectors << 9) * mddev->raid_disks);
391 
392 		rdev_for_each(rdev, mddev) {
393 			disk_stack_limits(mddev->gendisk, rdev->bdev,
394 					  rdev->data_offset << 9);
395 			if (blk_queue_discard(bdev_get_queue(rdev->bdev)))
396 				discard_supported = true;
397 		}
398 		if (!discard_supported)
399 			queue_flag_clear_unlocked(QUEUE_FLAG_DISCARD, mddev->queue);
400 		else
401 			queue_flag_set_unlocked(QUEUE_FLAG_DISCARD, mddev->queue);
402 	}
403 
404 	/* calculate array device size */
405 	md_set_array_sectors(mddev, raid0_size(mddev, 0, 0));
406 
407 	pr_debug("md/raid0:%s: md_size is %llu sectors.\n",
408 		 mdname(mddev),
409 		 (unsigned long long)mddev->array_sectors);
410 
411 	if (mddev->queue) {
412 		/* calculate the max read-ahead size.
413 		 * For read-ahead of large files to be effective, we need to
414 		 * readahead at least twice a whole stripe. i.e. number of devices
415 		 * multiplied by chunk size times 2.
416 		 * If an individual device has an ra_pages greater than the
417 		 * chunk size, then we will not drive that device as hard as it
418 		 * wants.  We consider this a configuration error: a larger
419 		 * chunksize should be used in that case.
420 		 */
421 		int stripe = mddev->raid_disks *
422 			(mddev->chunk_sectors << 9) / PAGE_SIZE;
423 		if (mddev->queue->backing_dev_info->ra_pages < 2* stripe)
424 			mddev->queue->backing_dev_info->ra_pages = 2* stripe;
425 	}
426 
427 	dump_zones(mddev);
428 
429 	ret = md_integrity_register(mddev);
430 
431 	return ret;
432 }
433 
434 static void raid0_free(struct mddev *mddev, void *priv)
435 {
436 	struct r0conf *conf = priv;
437 
438 	kfree(conf->strip_zone);
439 	kfree(conf->devlist);
440 	kfree(conf);
441 }
442 
443 /*
444  * Is io distribute over 1 or more chunks ?
445 */
446 static inline int is_io_in_chunk_boundary(struct mddev *mddev,
447 			unsigned int chunk_sects, struct bio *bio)
448 {
449 	if (likely(is_power_of_2(chunk_sects))) {
450 		return chunk_sects >=
451 			((bio->bi_iter.bi_sector & (chunk_sects-1))
452 					+ bio_sectors(bio));
453 	} else{
454 		sector_t sector = bio->bi_iter.bi_sector;
455 		return chunk_sects >= (sector_div(sector, chunk_sects)
456 						+ bio_sectors(bio));
457 	}
458 }
459 
460 static void raid0_make_request(struct mddev *mddev, struct bio *bio)
461 {
462 	struct strip_zone *zone;
463 	struct md_rdev *tmp_dev;
464 	struct bio *split;
465 
466 	if (unlikely(bio->bi_opf & REQ_PREFLUSH)) {
467 		md_flush_request(mddev, bio);
468 		return;
469 	}
470 
471 	do {
472 		sector_t bio_sector = bio->bi_iter.bi_sector;
473 		sector_t sector = bio_sector;
474 		unsigned chunk_sects = mddev->chunk_sectors;
475 
476 		unsigned sectors = chunk_sects -
477 			(likely(is_power_of_2(chunk_sects))
478 			 ? (sector & (chunk_sects-1))
479 			 : sector_div(sector, chunk_sects));
480 
481 		/* Restore due to sector_div */
482 		sector = bio_sector;
483 
484 		if (sectors < bio_sectors(bio)) {
485 			split = bio_split(bio, sectors, GFP_NOIO, fs_bio_set);
486 			bio_chain(split, bio);
487 		} else {
488 			split = bio;
489 		}
490 
491 		zone = find_zone(mddev->private, &sector);
492 		tmp_dev = map_sector(mddev, zone, sector, &sector);
493 		split->bi_bdev = tmp_dev->bdev;
494 		split->bi_iter.bi_sector = sector + zone->dev_start +
495 			tmp_dev->data_offset;
496 
497 		if (unlikely((bio_op(split) == REQ_OP_DISCARD) &&
498 			 !blk_queue_discard(bdev_get_queue(split->bi_bdev)))) {
499 			/* Just ignore it */
500 			bio_endio(split);
501 		} else {
502 			if (mddev->gendisk)
503 				trace_block_bio_remap(bdev_get_queue(split->bi_bdev),
504 						      split, disk_devt(mddev->gendisk),
505 						      bio_sector);
506 			mddev_check_writesame(mddev, split);
507 			generic_make_request(split);
508 		}
509 	} while (split != bio);
510 }
511 
512 static void raid0_status(struct seq_file *seq, struct mddev *mddev)
513 {
514 	seq_printf(seq, " %dk chunks", mddev->chunk_sectors / 2);
515 	return;
516 }
517 
518 static void *raid0_takeover_raid45(struct mddev *mddev)
519 {
520 	struct md_rdev *rdev;
521 	struct r0conf *priv_conf;
522 
523 	if (mddev->degraded != 1) {
524 		pr_warn("md/raid0:%s: raid5 must be degraded! Degraded disks: %d\n",
525 			mdname(mddev),
526 			mddev->degraded);
527 		return ERR_PTR(-EINVAL);
528 	}
529 
530 	rdev_for_each(rdev, mddev) {
531 		/* check slot number for a disk */
532 		if (rdev->raid_disk == mddev->raid_disks-1) {
533 			pr_warn("md/raid0:%s: raid5 must have missing parity disk!\n",
534 				mdname(mddev));
535 			return ERR_PTR(-EINVAL);
536 		}
537 		rdev->sectors = mddev->dev_sectors;
538 	}
539 
540 	/* Set new parameters */
541 	mddev->new_level = 0;
542 	mddev->new_layout = 0;
543 	mddev->new_chunk_sectors = mddev->chunk_sectors;
544 	mddev->raid_disks--;
545 	mddev->delta_disks = -1;
546 	/* make sure it will be not marked as dirty */
547 	mddev->recovery_cp = MaxSector;
548 	mddev_clear_unsupported_flags(mddev, UNSUPPORTED_MDDEV_FLAGS);
549 
550 	create_strip_zones(mddev, &priv_conf);
551 
552 	return priv_conf;
553 }
554 
555 static void *raid0_takeover_raid10(struct mddev *mddev)
556 {
557 	struct r0conf *priv_conf;
558 
559 	/* Check layout:
560 	 *  - far_copies must be 1
561 	 *  - near_copies must be 2
562 	 *  - disks number must be even
563 	 *  - all mirrors must be already degraded
564 	 */
565 	if (mddev->layout != ((1 << 8) + 2)) {
566 		pr_warn("md/raid0:%s:: Raid0 cannot takeover layout: 0x%x\n",
567 			mdname(mddev),
568 			mddev->layout);
569 		return ERR_PTR(-EINVAL);
570 	}
571 	if (mddev->raid_disks & 1) {
572 		pr_warn("md/raid0:%s: Raid0 cannot takeover Raid10 with odd disk number.\n",
573 			mdname(mddev));
574 		return ERR_PTR(-EINVAL);
575 	}
576 	if (mddev->degraded != (mddev->raid_disks>>1)) {
577 		pr_warn("md/raid0:%s: All mirrors must be already degraded!\n",
578 			mdname(mddev));
579 		return ERR_PTR(-EINVAL);
580 	}
581 
582 	/* Set new parameters */
583 	mddev->new_level = 0;
584 	mddev->new_layout = 0;
585 	mddev->new_chunk_sectors = mddev->chunk_sectors;
586 	mddev->delta_disks = - mddev->raid_disks / 2;
587 	mddev->raid_disks += mddev->delta_disks;
588 	mddev->degraded = 0;
589 	/* make sure it will be not marked as dirty */
590 	mddev->recovery_cp = MaxSector;
591 	mddev_clear_unsupported_flags(mddev, UNSUPPORTED_MDDEV_FLAGS);
592 
593 	create_strip_zones(mddev, &priv_conf);
594 	return priv_conf;
595 }
596 
597 static void *raid0_takeover_raid1(struct mddev *mddev)
598 {
599 	struct r0conf *priv_conf;
600 	int chunksect;
601 
602 	/* Check layout:
603 	 *  - (N - 1) mirror drives must be already faulty
604 	 */
605 	if ((mddev->raid_disks - 1) != mddev->degraded) {
606 		pr_err("md/raid0:%s: (N - 1) mirrors drives must be already faulty!\n",
607 		       mdname(mddev));
608 		return ERR_PTR(-EINVAL);
609 	}
610 
611 	/*
612 	 * a raid1 doesn't have the notion of chunk size, so
613 	 * figure out the largest suitable size we can use.
614 	 */
615 	chunksect = 64 * 2; /* 64K by default */
616 
617 	/* The array must be an exact multiple of chunksize */
618 	while (chunksect && (mddev->array_sectors & (chunksect - 1)))
619 		chunksect >>= 1;
620 
621 	if ((chunksect << 9) < PAGE_SIZE)
622 		/* array size does not allow a suitable chunk size */
623 		return ERR_PTR(-EINVAL);
624 
625 	/* Set new parameters */
626 	mddev->new_level = 0;
627 	mddev->new_layout = 0;
628 	mddev->new_chunk_sectors = chunksect;
629 	mddev->chunk_sectors = chunksect;
630 	mddev->delta_disks = 1 - mddev->raid_disks;
631 	mddev->raid_disks = 1;
632 	/* make sure it will be not marked as dirty */
633 	mddev->recovery_cp = MaxSector;
634 	mddev_clear_unsupported_flags(mddev, UNSUPPORTED_MDDEV_FLAGS);
635 
636 	create_strip_zones(mddev, &priv_conf);
637 	return priv_conf;
638 }
639 
640 static void *raid0_takeover(struct mddev *mddev)
641 {
642 	/* raid0 can take over:
643 	 *  raid4 - if all data disks are active.
644 	 *  raid5 - providing it is Raid4 layout and one disk is faulty
645 	 *  raid10 - assuming we have all necessary active disks
646 	 *  raid1 - with (N -1) mirror drives faulty
647 	 */
648 
649 	if (mddev->bitmap) {
650 		pr_warn("md/raid0: %s: cannot takeover array with bitmap\n",
651 			mdname(mddev));
652 		return ERR_PTR(-EBUSY);
653 	}
654 	if (mddev->level == 4)
655 		return raid0_takeover_raid45(mddev);
656 
657 	if (mddev->level == 5) {
658 		if (mddev->layout == ALGORITHM_PARITY_N)
659 			return raid0_takeover_raid45(mddev);
660 
661 		pr_warn("md/raid0:%s: Raid can only takeover Raid5 with layout: %d\n",
662 			mdname(mddev), ALGORITHM_PARITY_N);
663 	}
664 
665 	if (mddev->level == 10)
666 		return raid0_takeover_raid10(mddev);
667 
668 	if (mddev->level == 1)
669 		return raid0_takeover_raid1(mddev);
670 
671 	pr_warn("Takeover from raid%i to raid0 not supported\n",
672 		mddev->level);
673 
674 	return ERR_PTR(-EINVAL);
675 }
676 
/* Quiesce hook of the personality; raid0 performs no work for any @state. */
static void raid0_quiesce(struct mddev *mddev, int state)
{
	/* intentionally empty */
}
680 
681 static struct md_personality raid0_personality=
682 {
683 	.name		= "raid0",
684 	.level		= 0,
685 	.owner		= THIS_MODULE,
686 	.make_request	= raid0_make_request,
687 	.run		= raid0_run,
688 	.free		= raid0_free,
689 	.status		= raid0_status,
690 	.size		= raid0_size,
691 	.takeover	= raid0_takeover,
692 	.quiesce	= raid0_quiesce,
693 	.congested	= raid0_congested,
694 };
695 
696 static int __init raid0_init (void)
697 {
698 	return register_md_personality (&raid0_personality);
699 }
700 
701 static void raid0_exit (void)
702 {
703 	unregister_md_personality (&raid0_personality);
704 }
705 
/* Module entry/exit hooks and metadata. */
module_init(raid0_init);
module_exit(raid0_exit);
MODULE_LICENSE("GPL");
MODULE_DESCRIPTION("RAID0 (striping) personality for MD");
/* Aliases under which this module can be requested. */
MODULE_ALIAS("md-personality-2"); /* RAID0 */
MODULE_ALIAS("md-raid0");
MODULE_ALIAS("md-level-0");
712 MODULE_ALIAS("md-level-0");
713