Loading...
1/*
2 raid0.c : Multiple Devices driver for Linux
3 Copyright (C) 1994-96 Marc ZYNGIER
4 <zyngier@ufr-info-p7.ibp.fr> or
5 <maz@gloups.fdn.fr>
6 Copyright (C) 1999, 2000 Ingo Molnar, Red Hat
7
8
9 RAID-0 management functions.
10
11 This program is free software; you can redistribute it and/or modify
12 it under the terms of the GNU General Public License as published by
13 the Free Software Foundation; either version 2, or (at your option)
14 any later version.
15
16 You should have received a copy of the GNU General Public License
17 (for example /usr/src/linux/COPYING); if not, write to the Free
18 Software Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
19*/
20
21#include <linux/blkdev.h>
22#include <linux/seq_file.h>
23#include <linux/slab.h>
24#include "md.h"
25#include "raid0.h"
26#include "raid5.h"
27
28static int raid0_congested(void *data, int bits)
29{
30 mddev_t *mddev = data;
31 raid0_conf_t *conf = mddev->private;
32 mdk_rdev_t **devlist = conf->devlist;
33 int raid_disks = conf->strip_zone[0].nb_dev;
34 int i, ret = 0;
35
36 if (mddev_congested(mddev, bits))
37 return 1;
38
39 for (i = 0; i < raid_disks && !ret ; i++) {
40 struct request_queue *q = bdev_get_queue(devlist[i]->bdev);
41
42 ret |= bdi_congested(&q->backing_dev_info, bits);
43 }
44 return ret;
45}
46
47/*
48 * inform the user of the raid configuration
49*/
50static void dump_zones(mddev_t *mddev)
51{
52 int j, k, h;
53 sector_t zone_size = 0;
54 sector_t zone_start = 0;
55 char b[BDEVNAME_SIZE];
56 raid0_conf_t *conf = mddev->private;
57 int raid_disks = conf->strip_zone[0].nb_dev;
58 printk(KERN_INFO "******* %s configuration *********\n",
59 mdname(mddev));
60 h = 0;
61 for (j = 0; j < conf->nr_strip_zones; j++) {
62 printk(KERN_INFO "zone%d=[", j);
63 for (k = 0; k < conf->strip_zone[j].nb_dev; k++)
64 printk(KERN_CONT "%s/",
65 bdevname(conf->devlist[j*raid_disks
66 + k]->bdev, b));
67 printk(KERN_CONT "]\n");
68
69 zone_size = conf->strip_zone[j].zone_end - zone_start;
70 printk(KERN_INFO " zone offset=%llukb "
71 "device offset=%llukb size=%llukb\n",
72 (unsigned long long)zone_start>>1,
73 (unsigned long long)conf->strip_zone[j].dev_start>>1,
74 (unsigned long long)zone_size>>1);
75 zone_start = conf->strip_zone[j].zone_end;
76 }
77 printk(KERN_INFO "**********************************\n\n");
78}
79
80static int create_strip_zones(mddev_t *mddev, raid0_conf_t **private_conf)
81{
82 int i, c, err;
83 sector_t curr_zone_end, sectors;
84 mdk_rdev_t *smallest, *rdev1, *rdev2, *rdev, **dev;
85 struct strip_zone *zone;
86 int cnt;
87 char b[BDEVNAME_SIZE];
88 raid0_conf_t *conf = kzalloc(sizeof(*conf), GFP_KERNEL);
89
90 if (!conf)
91 return -ENOMEM;
92 list_for_each_entry(rdev1, &mddev->disks, same_set) {
93 printk(KERN_INFO "md/raid0:%s: looking at %s\n",
94 mdname(mddev),
95 bdevname(rdev1->bdev, b));
96 c = 0;
97
98 /* round size to chunk_size */
99 sectors = rdev1->sectors;
100 sector_div(sectors, mddev->chunk_sectors);
101 rdev1->sectors = sectors * mddev->chunk_sectors;
102
103 list_for_each_entry(rdev2, &mddev->disks, same_set) {
104 printk(KERN_INFO "md/raid0:%s: comparing %s(%llu)",
105 mdname(mddev),
106 bdevname(rdev1->bdev,b),
107 (unsigned long long)rdev1->sectors);
108 printk(KERN_CONT " with %s(%llu)\n",
109 bdevname(rdev2->bdev,b),
110 (unsigned long long)rdev2->sectors);
111 if (rdev2 == rdev1) {
112 printk(KERN_INFO "md/raid0:%s: END\n",
113 mdname(mddev));
114 break;
115 }
116 if (rdev2->sectors == rdev1->sectors) {
117 /*
118 * Not unique, don't count it as a new
119 * group
120 */
121 printk(KERN_INFO "md/raid0:%s: EQUAL\n",
122 mdname(mddev));
123 c = 1;
124 break;
125 }
126 printk(KERN_INFO "md/raid0:%s: NOT EQUAL\n",
127 mdname(mddev));
128 }
129 if (!c) {
130 printk(KERN_INFO "md/raid0:%s: ==> UNIQUE\n",
131 mdname(mddev));
132 conf->nr_strip_zones++;
133 printk(KERN_INFO "md/raid0:%s: %d zones\n",
134 mdname(mddev), conf->nr_strip_zones);
135 }
136 }
137 printk(KERN_INFO "md/raid0:%s: FINAL %d zones\n",
138 mdname(mddev), conf->nr_strip_zones);
139 err = -ENOMEM;
140 conf->strip_zone = kzalloc(sizeof(struct strip_zone)*
141 conf->nr_strip_zones, GFP_KERNEL);
142 if (!conf->strip_zone)
143 goto abort;
144 conf->devlist = kzalloc(sizeof(mdk_rdev_t*)*
145 conf->nr_strip_zones*mddev->raid_disks,
146 GFP_KERNEL);
147 if (!conf->devlist)
148 goto abort;
149
150 /* The first zone must contain all devices, so here we check that
151 * there is a proper alignment of slots to devices and find them all
152 */
153 zone = &conf->strip_zone[0];
154 cnt = 0;
155 smallest = NULL;
156 dev = conf->devlist;
157 err = -EINVAL;
158 list_for_each_entry(rdev1, &mddev->disks, same_set) {
159 int j = rdev1->raid_disk;
160
161 if (mddev->level == 10) {
162 /* taking over a raid10-n2 array */
163 j /= 2;
164 rdev1->new_raid_disk = j;
165 }
166
167 if (mddev->level == 1) {
168 /* taiking over a raid1 array-
169 * we have only one active disk
170 */
171 j = 0;
172 rdev1->new_raid_disk = j;
173 }
174
175 if (j < 0 || j >= mddev->raid_disks) {
176 printk(KERN_ERR "md/raid0:%s: bad disk number %d - "
177 "aborting!\n", mdname(mddev), j);
178 goto abort;
179 }
180 if (dev[j]) {
181 printk(KERN_ERR "md/raid0:%s: multiple devices for %d - "
182 "aborting!\n", mdname(mddev), j);
183 goto abort;
184 }
185 dev[j] = rdev1;
186
187 disk_stack_limits(mddev->gendisk, rdev1->bdev,
188 rdev1->data_offset << 9);
189 /* as we don't honour merge_bvec_fn, we must never risk
190 * violating it, so limit ->max_segments to 1, lying within
191 * a single page.
192 */
193
194 if (rdev1->bdev->bd_disk->queue->merge_bvec_fn) {
195 blk_queue_max_segments(mddev->queue, 1);
196 blk_queue_segment_boundary(mddev->queue,
197 PAGE_CACHE_SIZE - 1);
198 }
199 if (!smallest || (rdev1->sectors < smallest->sectors))
200 smallest = rdev1;
201 cnt++;
202 }
203 if (cnt != mddev->raid_disks) {
204 printk(KERN_ERR "md/raid0:%s: too few disks (%d of %d) - "
205 "aborting!\n", mdname(mddev), cnt, mddev->raid_disks);
206 goto abort;
207 }
208 zone->nb_dev = cnt;
209 zone->zone_end = smallest->sectors * cnt;
210
211 curr_zone_end = zone->zone_end;
212
213 /* now do the other zones */
214 for (i = 1; i < conf->nr_strip_zones; i++)
215 {
216 int j;
217
218 zone = conf->strip_zone + i;
219 dev = conf->devlist + i * mddev->raid_disks;
220
221 printk(KERN_INFO "md/raid0:%s: zone %d\n",
222 mdname(mddev), i);
223 zone->dev_start = smallest->sectors;
224 smallest = NULL;
225 c = 0;
226
227 for (j=0; j<cnt; j++) {
228 rdev = conf->devlist[j];
229 printk(KERN_INFO "md/raid0:%s: checking %s ...",
230 mdname(mddev),
231 bdevname(rdev->bdev, b));
232 if (rdev->sectors <= zone->dev_start) {
233 printk(KERN_CONT " nope.\n");
234 continue;
235 }
236 printk(KERN_CONT " contained as device %d\n", c);
237 dev[c] = rdev;
238 c++;
239 if (!smallest || rdev->sectors < smallest->sectors) {
240 smallest = rdev;
241 printk(KERN_INFO "md/raid0:%s: (%llu) is smallest!.\n",
242 mdname(mddev),
243 (unsigned long long)rdev->sectors);
244 }
245 }
246
247 zone->nb_dev = c;
248 sectors = (smallest->sectors - zone->dev_start) * c;
249 printk(KERN_INFO "md/raid0:%s: zone->nb_dev: %d, sectors: %llu\n",
250 mdname(mddev),
251 zone->nb_dev, (unsigned long long)sectors);
252
253 curr_zone_end += sectors;
254 zone->zone_end = curr_zone_end;
255
256 printk(KERN_INFO "md/raid0:%s: current zone start: %llu\n",
257 mdname(mddev),
258 (unsigned long long)smallest->sectors);
259 }
260 mddev->queue->backing_dev_info.congested_fn = raid0_congested;
261 mddev->queue->backing_dev_info.congested_data = mddev;
262
263 /*
264 * now since we have the hard sector sizes, we can make sure
265 * chunk size is a multiple of that sector size
266 */
267 if ((mddev->chunk_sectors << 9) % queue_logical_block_size(mddev->queue)) {
268 printk(KERN_ERR "md/raid0:%s: chunk_size of %d not valid\n",
269 mdname(mddev),
270 mddev->chunk_sectors << 9);
271 goto abort;
272 }
273
274 blk_queue_io_min(mddev->queue, mddev->chunk_sectors << 9);
275 blk_queue_io_opt(mddev->queue,
276 (mddev->chunk_sectors << 9) * mddev->raid_disks);
277
278 printk(KERN_INFO "md/raid0:%s: done.\n", mdname(mddev));
279 *private_conf = conf;
280
281 return 0;
282abort:
283 kfree(conf->strip_zone);
284 kfree(conf->devlist);
285 kfree(conf);
286 *private_conf = NULL;
287 return err;
288}
289
290/**
291 * raid0_mergeable_bvec -- tell bio layer if a two requests can be merged
292 * @q: request queue
293 * @bvm: properties of new bio
294 * @biovec: the request that could be merged to it.
295 *
296 * Return amount of bytes we can accept at this offset
297 */
298static int raid0_mergeable_bvec(struct request_queue *q,
299 struct bvec_merge_data *bvm,
300 struct bio_vec *biovec)
301{
302 mddev_t *mddev = q->queuedata;
303 sector_t sector = bvm->bi_sector + get_start_sect(bvm->bi_bdev);
304 int max;
305 unsigned int chunk_sectors = mddev->chunk_sectors;
306 unsigned int bio_sectors = bvm->bi_size >> 9;
307
308 if (is_power_of_2(chunk_sectors))
309 max = (chunk_sectors - ((sector & (chunk_sectors-1))
310 + bio_sectors)) << 9;
311 else
312 max = (chunk_sectors - (sector_div(sector, chunk_sectors)
313 + bio_sectors)) << 9;
314 if (max < 0) max = 0; /* bio_add cannot handle a negative return */
315 if (max <= biovec->bv_len && bio_sectors == 0)
316 return biovec->bv_len;
317 else
318 return max;
319}
320
321static sector_t raid0_size(mddev_t *mddev, sector_t sectors, int raid_disks)
322{
323 sector_t array_sectors = 0;
324 mdk_rdev_t *rdev;
325
326 WARN_ONCE(sectors || raid_disks,
327 "%s does not support generic reshape\n", __func__);
328
329 list_for_each_entry(rdev, &mddev->disks, same_set)
330 array_sectors += rdev->sectors;
331
332 return array_sectors;
333}
334
335static int raid0_run(mddev_t *mddev)
336{
337 raid0_conf_t *conf;
338 int ret;
339
340 if (mddev->chunk_sectors == 0) {
341 printk(KERN_ERR "md/raid0:%s: chunk size must be set.\n",
342 mdname(mddev));
343 return -EINVAL;
344 }
345 if (md_check_no_bitmap(mddev))
346 return -EINVAL;
347 blk_queue_max_hw_sectors(mddev->queue, mddev->chunk_sectors);
348
349 /* if private is not null, we are here after takeover */
350 if (mddev->private == NULL) {
351 ret = create_strip_zones(mddev, &conf);
352 if (ret < 0)
353 return ret;
354 mddev->private = conf;
355 }
356 conf = mddev->private;
357
358 /* calculate array device size */
359 md_set_array_sectors(mddev, raid0_size(mddev, 0, 0));
360
361 printk(KERN_INFO "md/raid0:%s: md_size is %llu sectors.\n",
362 mdname(mddev),
363 (unsigned long long)mddev->array_sectors);
364 /* calculate the max read-ahead size.
365 * For read-ahead of large files to be effective, we need to
366 * readahead at least twice a whole stripe. i.e. number of devices
367 * multiplied by chunk size times 2.
368 * If an individual device has an ra_pages greater than the
369 * chunk size, then we will not drive that device as hard as it
370 * wants. We consider this a configuration error: a larger
371 * chunksize should be used in that case.
372 */
373 {
374 int stripe = mddev->raid_disks *
375 (mddev->chunk_sectors << 9) / PAGE_SIZE;
376 if (mddev->queue->backing_dev_info.ra_pages < 2* stripe)
377 mddev->queue->backing_dev_info.ra_pages = 2* stripe;
378 }
379
380 blk_queue_merge_bvec(mddev->queue, raid0_mergeable_bvec);
381 dump_zones(mddev);
382 return md_integrity_register(mddev);
383}
384
385static int raid0_stop(mddev_t *mddev)
386{
387 raid0_conf_t *conf = mddev->private;
388
389 blk_sync_queue(mddev->queue); /* the unplug fn references 'conf'*/
390 kfree(conf->strip_zone);
391 kfree(conf->devlist);
392 kfree(conf);
393 mddev->private = NULL;
394 return 0;
395}
396
397/* Find the zone which holds a particular offset
398 * Update *sectorp to be an offset in that zone
399 */
400static struct strip_zone *find_zone(struct raid0_private_data *conf,
401 sector_t *sectorp)
402{
403 int i;
404 struct strip_zone *z = conf->strip_zone;
405 sector_t sector = *sectorp;
406
407 for (i = 0; i < conf->nr_strip_zones; i++)
408 if (sector < z[i].zone_end) {
409 if (i)
410 *sectorp = sector - z[i-1].zone_end;
411 return z + i;
412 }
413 BUG();
414}
415
416/*
417 * remaps the bio to the target device. we separate two flows.
418 * power 2 flow and a general flow for the sake of perfromance
419*/
420static mdk_rdev_t *map_sector(mddev_t *mddev, struct strip_zone *zone,
421 sector_t sector, sector_t *sector_offset)
422{
423 unsigned int sect_in_chunk;
424 sector_t chunk;
425 raid0_conf_t *conf = mddev->private;
426 int raid_disks = conf->strip_zone[0].nb_dev;
427 unsigned int chunk_sects = mddev->chunk_sectors;
428
429 if (is_power_of_2(chunk_sects)) {
430 int chunksect_bits = ffz(~chunk_sects);
431 /* find the sector offset inside the chunk */
432 sect_in_chunk = sector & (chunk_sects - 1);
433 sector >>= chunksect_bits;
434 /* chunk in zone */
435 chunk = *sector_offset;
436 /* quotient is the chunk in real device*/
437 sector_div(chunk, zone->nb_dev << chunksect_bits);
438 } else{
439 sect_in_chunk = sector_div(sector, chunk_sects);
440 chunk = *sector_offset;
441 sector_div(chunk, chunk_sects * zone->nb_dev);
442 }
443 /*
444 * position the bio over the real device
445 * real sector = chunk in device + starting of zone
446 * + the position in the chunk
447 */
448 *sector_offset = (chunk * chunk_sects) + sect_in_chunk;
449 return conf->devlist[(zone - conf->strip_zone)*raid_disks
450 + sector_div(sector, zone->nb_dev)];
451}
452
453/*
454 * Is io distribute over 1 or more chunks ?
455*/
456static inline int is_io_in_chunk_boundary(mddev_t *mddev,
457 unsigned int chunk_sects, struct bio *bio)
458{
459 if (likely(is_power_of_2(chunk_sects))) {
460 return chunk_sects >= ((bio->bi_sector & (chunk_sects-1))
461 + (bio->bi_size >> 9));
462 } else{
463 sector_t sector = bio->bi_sector;
464 return chunk_sects >= (sector_div(sector, chunk_sects)
465 + (bio->bi_size >> 9));
466 }
467}
468
469static int raid0_make_request(mddev_t *mddev, struct bio *bio)
470{
471 unsigned int chunk_sects;
472 sector_t sector_offset;
473 struct strip_zone *zone;
474 mdk_rdev_t *tmp_dev;
475
476 if (unlikely(bio->bi_rw & REQ_FLUSH)) {
477 md_flush_request(mddev, bio);
478 return 0;
479 }
480
481 chunk_sects = mddev->chunk_sectors;
482 if (unlikely(!is_io_in_chunk_boundary(mddev, chunk_sects, bio))) {
483 sector_t sector = bio->bi_sector;
484 struct bio_pair *bp;
485 /* Sanity check -- queue functions should prevent this happening */
486 if (bio->bi_vcnt != 1 ||
487 bio->bi_idx != 0)
488 goto bad_map;
489 /* This is a one page bio that upper layers
490 * refuse to split for us, so we need to split it.
491 */
492 if (likely(is_power_of_2(chunk_sects)))
493 bp = bio_split(bio, chunk_sects - (sector &
494 (chunk_sects-1)));
495 else
496 bp = bio_split(bio, chunk_sects -
497 sector_div(sector, chunk_sects));
498 if (raid0_make_request(mddev, &bp->bio1))
499 generic_make_request(&bp->bio1);
500 if (raid0_make_request(mddev, &bp->bio2))
501 generic_make_request(&bp->bio2);
502
503 bio_pair_release(bp);
504 return 0;
505 }
506
507 sector_offset = bio->bi_sector;
508 zone = find_zone(mddev->private, §or_offset);
509 tmp_dev = map_sector(mddev, zone, bio->bi_sector,
510 §or_offset);
511 bio->bi_bdev = tmp_dev->bdev;
512 bio->bi_sector = sector_offset + zone->dev_start +
513 tmp_dev->data_offset;
514 /*
515 * Let the main block layer submit the IO and resolve recursion:
516 */
517 return 1;
518
519bad_map:
520 printk("md/raid0:%s: make_request bug: can't convert block across chunks"
521 " or bigger than %dk %llu %d\n",
522 mdname(mddev), chunk_sects / 2,
523 (unsigned long long)bio->bi_sector, bio->bi_size >> 10);
524
525 bio_io_error(bio);
526 return 0;
527}
528
529static void raid0_status(struct seq_file *seq, mddev_t *mddev)
530{
531#undef MD_DEBUG
532#ifdef MD_DEBUG
533 int j, k, h;
534 char b[BDEVNAME_SIZE];
535 raid0_conf_t *conf = mddev->private;
536 int raid_disks = conf->strip_zone[0].nb_dev;
537
538 sector_t zone_size;
539 sector_t zone_start = 0;
540 h = 0;
541
542 for (j = 0; j < conf->nr_strip_zones; j++) {
543 seq_printf(seq, " z%d", j);
544 seq_printf(seq, "=[");
545 for (k = 0; k < conf->strip_zone[j].nb_dev; k++)
546 seq_printf(seq, "%s/", bdevname(
547 conf->devlist[j*raid_disks + k]
548 ->bdev, b));
549
550 zone_size = conf->strip_zone[j].zone_end - zone_start;
551 seq_printf(seq, "] ze=%lld ds=%lld s=%lld\n",
552 (unsigned long long)zone_start>>1,
553 (unsigned long long)conf->strip_zone[j].dev_start>>1,
554 (unsigned long long)zone_size>>1);
555 zone_start = conf->strip_zone[j].zone_end;
556 }
557#endif
558 seq_printf(seq, " %dk chunks", mddev->chunk_sectors / 2);
559 return;
560}
561
562static void *raid0_takeover_raid45(mddev_t *mddev)
563{
564 mdk_rdev_t *rdev;
565 raid0_conf_t *priv_conf;
566
567 if (mddev->degraded != 1) {
568 printk(KERN_ERR "md/raid0:%s: raid5 must be degraded! Degraded disks: %d\n",
569 mdname(mddev),
570 mddev->degraded);
571 return ERR_PTR(-EINVAL);
572 }
573
574 list_for_each_entry(rdev, &mddev->disks, same_set) {
575 /* check slot number for a disk */
576 if (rdev->raid_disk == mddev->raid_disks-1) {
577 printk(KERN_ERR "md/raid0:%s: raid5 must have missing parity disk!\n",
578 mdname(mddev));
579 return ERR_PTR(-EINVAL);
580 }
581 }
582
583 /* Set new parameters */
584 mddev->new_level = 0;
585 mddev->new_layout = 0;
586 mddev->new_chunk_sectors = mddev->chunk_sectors;
587 mddev->raid_disks--;
588 mddev->delta_disks = -1;
589 /* make sure it will be not marked as dirty */
590 mddev->recovery_cp = MaxSector;
591
592 create_strip_zones(mddev, &priv_conf);
593 return priv_conf;
594}
595
596static void *raid0_takeover_raid10(mddev_t *mddev)
597{
598 raid0_conf_t *priv_conf;
599
600 /* Check layout:
601 * - far_copies must be 1
602 * - near_copies must be 2
603 * - disks number must be even
604 * - all mirrors must be already degraded
605 */
606 if (mddev->layout != ((1 << 8) + 2)) {
607 printk(KERN_ERR "md/raid0:%s:: Raid0 cannot takover layout: 0x%x\n",
608 mdname(mddev),
609 mddev->layout);
610 return ERR_PTR(-EINVAL);
611 }
612 if (mddev->raid_disks & 1) {
613 printk(KERN_ERR "md/raid0:%s: Raid0 cannot takover Raid10 with odd disk number.\n",
614 mdname(mddev));
615 return ERR_PTR(-EINVAL);
616 }
617 if (mddev->degraded != (mddev->raid_disks>>1)) {
618 printk(KERN_ERR "md/raid0:%s: All mirrors must be already degraded!\n",
619 mdname(mddev));
620 return ERR_PTR(-EINVAL);
621 }
622
623 /* Set new parameters */
624 mddev->new_level = 0;
625 mddev->new_layout = 0;
626 mddev->new_chunk_sectors = mddev->chunk_sectors;
627 mddev->delta_disks = - mddev->raid_disks / 2;
628 mddev->raid_disks += mddev->delta_disks;
629 mddev->degraded = 0;
630 /* make sure it will be not marked as dirty */
631 mddev->recovery_cp = MaxSector;
632
633 create_strip_zones(mddev, &priv_conf);
634 return priv_conf;
635}
636
637static void *raid0_takeover_raid1(mddev_t *mddev)
638{
639 raid0_conf_t *priv_conf;
640
641 /* Check layout:
642 * - (N - 1) mirror drives must be already faulty
643 */
644 if ((mddev->raid_disks - 1) != mddev->degraded) {
645 printk(KERN_ERR "md/raid0:%s: (N - 1) mirrors drives must be already faulty!\n",
646 mdname(mddev));
647 return ERR_PTR(-EINVAL);
648 }
649
650 /* Set new parameters */
651 mddev->new_level = 0;
652 mddev->new_layout = 0;
653 mddev->new_chunk_sectors = 128; /* by default set chunk size to 64k */
654 mddev->delta_disks = 1 - mddev->raid_disks;
655 mddev->raid_disks = 1;
656 /* make sure it will be not marked as dirty */
657 mddev->recovery_cp = MaxSector;
658
659 create_strip_zones(mddev, &priv_conf);
660 return priv_conf;
661}
662
663static void *raid0_takeover(mddev_t *mddev)
664{
665 /* raid0 can take over:
666 * raid4 - if all data disks are active.
667 * raid5 - providing it is Raid4 layout and one disk is faulty
668 * raid10 - assuming we have all necessary active disks
669 * raid1 - with (N -1) mirror drives faulty
670 */
671 if (mddev->level == 4)
672 return raid0_takeover_raid45(mddev);
673
674 if (mddev->level == 5) {
675 if (mddev->layout == ALGORITHM_PARITY_N)
676 return raid0_takeover_raid45(mddev);
677
678 printk(KERN_ERR "md/raid0:%s: Raid can only takeover Raid5 with layout: %d\n",
679 mdname(mddev), ALGORITHM_PARITY_N);
680 }
681
682 if (mddev->level == 10)
683 return raid0_takeover_raid10(mddev);
684
685 if (mddev->level == 1)
686 return raid0_takeover_raid1(mddev);
687
688 printk(KERN_ERR "Takeover from raid%i to raid0 not supported\n",
689 mddev->level);
690
691 return ERR_PTR(-EINVAL);
692}
693
694static void raid0_quiesce(mddev_t *mddev, int state)
695{
696}
697
698static struct mdk_personality raid0_personality=
699{
700 .name = "raid0",
701 .level = 0,
702 .owner = THIS_MODULE,
703 .make_request = raid0_make_request,
704 .run = raid0_run,
705 .stop = raid0_stop,
706 .status = raid0_status,
707 .size = raid0_size,
708 .takeover = raid0_takeover,
709 .quiesce = raid0_quiesce,
710};
711
712static int __init raid0_init (void)
713{
714 return register_md_personality (&raid0_personality);
715}
716
717static void raid0_exit (void)
718{
719 unregister_md_personality (&raid0_personality);
720}
721
722module_init(raid0_init);
723module_exit(raid0_exit);
724MODULE_LICENSE("GPL");
725MODULE_DESCRIPTION("RAID0 (striping) personality for MD");
726MODULE_ALIAS("md-personality-2"); /* RAID0 */
727MODULE_ALIAS("md-raid0");
728MODULE_ALIAS("md-level-0");
1/*
2 raid0.c : Multiple Devices driver for Linux
3 Copyright (C) 1994-96 Marc ZYNGIER
4 <zyngier@ufr-info-p7.ibp.fr> or
5 <maz@gloups.fdn.fr>
6 Copyright (C) 1999, 2000 Ingo Molnar, Red Hat
7
8 RAID-0 management functions.
9
10 This program is free software; you can redistribute it and/or modify
11 it under the terms of the GNU General Public License as published by
12 the Free Software Foundation; either version 2, or (at your option)
13 any later version.
14
15 You should have received a copy of the GNU General Public License
16 (for example /usr/src/linux/COPYING); if not, write to the Free
17 Software Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
18*/
19
20#include <linux/blkdev.h>
21#include <linux/seq_file.h>
22#include <linux/module.h>
23#include <linux/slab.h>
24#include "md.h"
25#include "raid0.h"
26#include "raid5.h"
27
28static int raid0_congested(struct mddev *mddev, int bits)
29{
30 struct r0conf *conf = mddev->private;
31 struct md_rdev **devlist = conf->devlist;
32 int raid_disks = conf->strip_zone[0].nb_dev;
33 int i, ret = 0;
34
35 for (i = 0; i < raid_disks && !ret ; i++) {
36 struct request_queue *q = bdev_get_queue(devlist[i]->bdev);
37
38 ret |= bdi_congested(&q->backing_dev_info, bits);
39 }
40 return ret;
41}
42
43/*
44 * inform the user of the raid configuration
45*/
46static void dump_zones(struct mddev *mddev)
47{
48 int j, k;
49 sector_t zone_size = 0;
50 sector_t zone_start = 0;
51 char b[BDEVNAME_SIZE];
52 struct r0conf *conf = mddev->private;
53 int raid_disks = conf->strip_zone[0].nb_dev;
54 printk(KERN_INFO "md: RAID0 configuration for %s - %d zone%s\n",
55 mdname(mddev),
56 conf->nr_strip_zones, conf->nr_strip_zones==1?"":"s");
57 for (j = 0; j < conf->nr_strip_zones; j++) {
58 printk(KERN_INFO "md: zone%d=[", j);
59 for (k = 0; k < conf->strip_zone[j].nb_dev; k++)
60 printk(KERN_CONT "%s%s", k?"/":"",
61 bdevname(conf->devlist[j*raid_disks
62 + k]->bdev, b));
63 printk(KERN_CONT "]\n");
64
65 zone_size = conf->strip_zone[j].zone_end - zone_start;
66 printk(KERN_INFO " zone-offset=%10lluKB, "
67 "device-offset=%10lluKB, size=%10lluKB\n",
68 (unsigned long long)zone_start>>1,
69 (unsigned long long)conf->strip_zone[j].dev_start>>1,
70 (unsigned long long)zone_size>>1);
71 zone_start = conf->strip_zone[j].zone_end;
72 }
73}
74
75static int create_strip_zones(struct mddev *mddev, struct r0conf **private_conf)
76{
77 int i, c, err;
78 sector_t curr_zone_end, sectors;
79 struct md_rdev *smallest, *rdev1, *rdev2, *rdev, **dev;
80 struct strip_zone *zone;
81 int cnt;
82 char b[BDEVNAME_SIZE];
83 char b2[BDEVNAME_SIZE];
84 struct r0conf *conf = kzalloc(sizeof(*conf), GFP_KERNEL);
85 unsigned short blksize = 512;
86
87 *private_conf = ERR_PTR(-ENOMEM);
88 if (!conf)
89 return -ENOMEM;
90 rdev_for_each(rdev1, mddev) {
91 pr_debug("md/raid0:%s: looking at %s\n",
92 mdname(mddev),
93 bdevname(rdev1->bdev, b));
94 c = 0;
95
96 /* round size to chunk_size */
97 sectors = rdev1->sectors;
98 sector_div(sectors, mddev->chunk_sectors);
99 rdev1->sectors = sectors * mddev->chunk_sectors;
100
101 blksize = max(blksize, queue_logical_block_size(
102 rdev1->bdev->bd_disk->queue));
103
104 rdev_for_each(rdev2, mddev) {
105 pr_debug("md/raid0:%s: comparing %s(%llu)"
106 " with %s(%llu)\n",
107 mdname(mddev),
108 bdevname(rdev1->bdev,b),
109 (unsigned long long)rdev1->sectors,
110 bdevname(rdev2->bdev,b2),
111 (unsigned long long)rdev2->sectors);
112 if (rdev2 == rdev1) {
113 pr_debug("md/raid0:%s: END\n",
114 mdname(mddev));
115 break;
116 }
117 if (rdev2->sectors == rdev1->sectors) {
118 /*
119 * Not unique, don't count it as a new
120 * group
121 */
122 pr_debug("md/raid0:%s: EQUAL\n",
123 mdname(mddev));
124 c = 1;
125 break;
126 }
127 pr_debug("md/raid0:%s: NOT EQUAL\n",
128 mdname(mddev));
129 }
130 if (!c) {
131 pr_debug("md/raid0:%s: ==> UNIQUE\n",
132 mdname(mddev));
133 conf->nr_strip_zones++;
134 pr_debug("md/raid0:%s: %d zones\n",
135 mdname(mddev), conf->nr_strip_zones);
136 }
137 }
138 pr_debug("md/raid0:%s: FINAL %d zones\n",
139 mdname(mddev), conf->nr_strip_zones);
140 /*
141 * now since we have the hard sector sizes, we can make sure
142 * chunk size is a multiple of that sector size
143 */
144 if ((mddev->chunk_sectors << 9) % blksize) {
145 printk(KERN_ERR "md/raid0:%s: chunk_size of %d not multiple of block size %d\n",
146 mdname(mddev),
147 mddev->chunk_sectors << 9, blksize);
148 err = -EINVAL;
149 goto abort;
150 }
151
152 err = -ENOMEM;
153 conf->strip_zone = kzalloc(sizeof(struct strip_zone)*
154 conf->nr_strip_zones, GFP_KERNEL);
155 if (!conf->strip_zone)
156 goto abort;
157 conf->devlist = kzalloc(sizeof(struct md_rdev*)*
158 conf->nr_strip_zones*mddev->raid_disks,
159 GFP_KERNEL);
160 if (!conf->devlist)
161 goto abort;
162
163 /* The first zone must contain all devices, so here we check that
164 * there is a proper alignment of slots to devices and find them all
165 */
166 zone = &conf->strip_zone[0];
167 cnt = 0;
168 smallest = NULL;
169 dev = conf->devlist;
170 err = -EINVAL;
171 rdev_for_each(rdev1, mddev) {
172 int j = rdev1->raid_disk;
173
174 if (mddev->level == 10) {
175 /* taking over a raid10-n2 array */
176 j /= 2;
177 rdev1->new_raid_disk = j;
178 }
179
180 if (mddev->level == 1) {
181 /* taiking over a raid1 array-
182 * we have only one active disk
183 */
184 j = 0;
185 rdev1->new_raid_disk = j;
186 }
187
188 if (j < 0) {
189 printk(KERN_ERR
190 "md/raid0:%s: remove inactive devices before converting to RAID0\n",
191 mdname(mddev));
192 goto abort;
193 }
194 if (j >= mddev->raid_disks) {
195 printk(KERN_ERR "md/raid0:%s: bad disk number %d - "
196 "aborting!\n", mdname(mddev), j);
197 goto abort;
198 }
199 if (dev[j]) {
200 printk(KERN_ERR "md/raid0:%s: multiple devices for %d - "
201 "aborting!\n", mdname(mddev), j);
202 goto abort;
203 }
204 dev[j] = rdev1;
205
206 if (!smallest || (rdev1->sectors < smallest->sectors))
207 smallest = rdev1;
208 cnt++;
209 }
210 if (cnt != mddev->raid_disks) {
211 printk(KERN_ERR "md/raid0:%s: too few disks (%d of %d) - "
212 "aborting!\n", mdname(mddev), cnt, mddev->raid_disks);
213 goto abort;
214 }
215 zone->nb_dev = cnt;
216 zone->zone_end = smallest->sectors * cnt;
217
218 curr_zone_end = zone->zone_end;
219
220 /* now do the other zones */
221 for (i = 1; i < conf->nr_strip_zones; i++)
222 {
223 int j;
224
225 zone = conf->strip_zone + i;
226 dev = conf->devlist + i * mddev->raid_disks;
227
228 pr_debug("md/raid0:%s: zone %d\n", mdname(mddev), i);
229 zone->dev_start = smallest->sectors;
230 smallest = NULL;
231 c = 0;
232
233 for (j=0; j<cnt; j++) {
234 rdev = conf->devlist[j];
235 if (rdev->sectors <= zone->dev_start) {
236 pr_debug("md/raid0:%s: checking %s ... nope\n",
237 mdname(mddev),
238 bdevname(rdev->bdev, b));
239 continue;
240 }
241 pr_debug("md/raid0:%s: checking %s ..."
242 " contained as device %d\n",
243 mdname(mddev),
244 bdevname(rdev->bdev, b), c);
245 dev[c] = rdev;
246 c++;
247 if (!smallest || rdev->sectors < smallest->sectors) {
248 smallest = rdev;
249 pr_debug("md/raid0:%s: (%llu) is smallest!.\n",
250 mdname(mddev),
251 (unsigned long long)rdev->sectors);
252 }
253 }
254
255 zone->nb_dev = c;
256 sectors = (smallest->sectors - zone->dev_start) * c;
257 pr_debug("md/raid0:%s: zone->nb_dev: %d, sectors: %llu\n",
258 mdname(mddev),
259 zone->nb_dev, (unsigned long long)sectors);
260
261 curr_zone_end += sectors;
262 zone->zone_end = curr_zone_end;
263
264 pr_debug("md/raid0:%s: current zone start: %llu\n",
265 mdname(mddev),
266 (unsigned long long)smallest->sectors);
267 }
268
269 pr_debug("md/raid0:%s: done.\n", mdname(mddev));
270 *private_conf = conf;
271
272 return 0;
273abort:
274 kfree(conf->strip_zone);
275 kfree(conf->devlist);
276 kfree(conf);
277 *private_conf = ERR_PTR(err);
278 return err;
279}
280
281/* Find the zone which holds a particular offset
282 * Update *sectorp to be an offset in that zone
283 */
284static struct strip_zone *find_zone(struct r0conf *conf,
285 sector_t *sectorp)
286{
287 int i;
288 struct strip_zone *z = conf->strip_zone;
289 sector_t sector = *sectorp;
290
291 for (i = 0; i < conf->nr_strip_zones; i++)
292 if (sector < z[i].zone_end) {
293 if (i)
294 *sectorp = sector - z[i-1].zone_end;
295 return z + i;
296 }
297 BUG();
298}
299
300/*
301 * remaps the bio to the target device. we separate two flows.
302 * power 2 flow and a general flow for the sake of performance
303*/
304static struct md_rdev *map_sector(struct mddev *mddev, struct strip_zone *zone,
305 sector_t sector, sector_t *sector_offset)
306{
307 unsigned int sect_in_chunk;
308 sector_t chunk;
309 struct r0conf *conf = mddev->private;
310 int raid_disks = conf->strip_zone[0].nb_dev;
311 unsigned int chunk_sects = mddev->chunk_sectors;
312
313 if (is_power_of_2(chunk_sects)) {
314 int chunksect_bits = ffz(~chunk_sects);
315 /* find the sector offset inside the chunk */
316 sect_in_chunk = sector & (chunk_sects - 1);
317 sector >>= chunksect_bits;
318 /* chunk in zone */
319 chunk = *sector_offset;
320 /* quotient is the chunk in real device*/
321 sector_div(chunk, zone->nb_dev << chunksect_bits);
322 } else{
323 sect_in_chunk = sector_div(sector, chunk_sects);
324 chunk = *sector_offset;
325 sector_div(chunk, chunk_sects * zone->nb_dev);
326 }
327 /*
328 * position the bio over the real device
329 * real sector = chunk in device + starting of zone
330 * + the position in the chunk
331 */
332 *sector_offset = (chunk * chunk_sects) + sect_in_chunk;
333 return conf->devlist[(zone - conf->strip_zone)*raid_disks
334 + sector_div(sector, zone->nb_dev)];
335}
336
337static sector_t raid0_size(struct mddev *mddev, sector_t sectors, int raid_disks)
338{
339 sector_t array_sectors = 0;
340 struct md_rdev *rdev;
341
342 WARN_ONCE(sectors || raid_disks,
343 "%s does not support generic reshape\n", __func__);
344
345 rdev_for_each(rdev, mddev)
346 array_sectors += (rdev->sectors &
347 ~(sector_t)(mddev->chunk_sectors-1));
348
349 return array_sectors;
350}
351
352static void raid0_free(struct mddev *mddev, void *priv);
353
354static int raid0_run(struct mddev *mddev)
355{
356 struct r0conf *conf;
357 int ret;
358
359 if (mddev->chunk_sectors == 0) {
360 printk(KERN_ERR "md/raid0:%s: chunk size must be set.\n",
361 mdname(mddev));
362 return -EINVAL;
363 }
364 if (md_check_no_bitmap(mddev))
365 return -EINVAL;
366
367 /* if private is not null, we are here after takeover */
368 if (mddev->private == NULL) {
369 ret = create_strip_zones(mddev, &conf);
370 if (ret < 0)
371 return ret;
372 mddev->private = conf;
373 }
374 conf = mddev->private;
375 if (mddev->queue) {
376 struct md_rdev *rdev;
377 bool discard_supported = false;
378
379 blk_queue_max_hw_sectors(mddev->queue, mddev->chunk_sectors);
380 blk_queue_max_write_same_sectors(mddev->queue, mddev->chunk_sectors);
381 blk_queue_max_discard_sectors(mddev->queue, mddev->chunk_sectors);
382
383 blk_queue_io_min(mddev->queue, mddev->chunk_sectors << 9);
384 blk_queue_io_opt(mddev->queue,
385 (mddev->chunk_sectors << 9) * mddev->raid_disks);
386
387 rdev_for_each(rdev, mddev) {
388 disk_stack_limits(mddev->gendisk, rdev->bdev,
389 rdev->data_offset << 9);
390 if (blk_queue_discard(bdev_get_queue(rdev->bdev)))
391 discard_supported = true;
392 }
393 if (!discard_supported)
394 queue_flag_clear_unlocked(QUEUE_FLAG_DISCARD, mddev->queue);
395 else
396 queue_flag_set_unlocked(QUEUE_FLAG_DISCARD, mddev->queue);
397 }
398
399 /* calculate array device size */
400 md_set_array_sectors(mddev, raid0_size(mddev, 0, 0));
401
402 printk(KERN_INFO "md/raid0:%s: md_size is %llu sectors.\n",
403 mdname(mddev),
404 (unsigned long long)mddev->array_sectors);
405
406 if (mddev->queue) {
407 /* calculate the max read-ahead size.
408 * For read-ahead of large files to be effective, we need to
409 * readahead at least twice a whole stripe. i.e. number of devices
410 * multiplied by chunk size times 2.
411 * If an individual device has an ra_pages greater than the
412 * chunk size, then we will not drive that device as hard as it
413 * wants. We consider this a configuration error: a larger
414 * chunksize should be used in that case.
415 */
416 int stripe = mddev->raid_disks *
417 (mddev->chunk_sectors << 9) / PAGE_SIZE;
418 if (mddev->queue->backing_dev_info.ra_pages < 2* stripe)
419 mddev->queue->backing_dev_info.ra_pages = 2* stripe;
420 }
421
422 dump_zones(mddev);
423
424 ret = md_integrity_register(mddev);
425
426 return ret;
427}
428
429static void raid0_free(struct mddev *mddev, void *priv)
430{
431 struct r0conf *conf = priv;
432
433 kfree(conf->strip_zone);
434 kfree(conf->devlist);
435 kfree(conf);
436}
437
438/*
439 * Is io distribute over 1 or more chunks ?
440*/
441static inline int is_io_in_chunk_boundary(struct mddev *mddev,
442 unsigned int chunk_sects, struct bio *bio)
443{
444 if (likely(is_power_of_2(chunk_sects))) {
445 return chunk_sects >=
446 ((bio->bi_iter.bi_sector & (chunk_sects-1))
447 + bio_sectors(bio));
448 } else{
449 sector_t sector = bio->bi_iter.bi_sector;
450 return chunk_sects >= (sector_div(sector, chunk_sects)
451 + bio_sectors(bio));
452 }
453}
454
455static void raid0_make_request(struct mddev *mddev, struct bio *bio)
456{
457 struct strip_zone *zone;
458 struct md_rdev *tmp_dev;
459 struct bio *split;
460
461 if (unlikely(bio->bi_rw & REQ_FLUSH)) {
462 md_flush_request(mddev, bio);
463 return;
464 }
465
466 do {
467 sector_t sector = bio->bi_iter.bi_sector;
468 unsigned chunk_sects = mddev->chunk_sectors;
469
470 unsigned sectors = chunk_sects -
471 (likely(is_power_of_2(chunk_sects))
472 ? (sector & (chunk_sects-1))
473 : sector_div(sector, chunk_sects));
474
475 /* Restore due to sector_div */
476 sector = bio->bi_iter.bi_sector;
477
478 if (sectors < bio_sectors(bio)) {
479 split = bio_split(bio, sectors, GFP_NOIO, fs_bio_set);
480 bio_chain(split, bio);
481 } else {
482 split = bio;
483 }
484
485 zone = find_zone(mddev->private, §or);
486 tmp_dev = map_sector(mddev, zone, sector, §or);
487 split->bi_bdev = tmp_dev->bdev;
488 split->bi_iter.bi_sector = sector + zone->dev_start +
489 tmp_dev->data_offset;
490
491 if (unlikely((split->bi_rw & REQ_DISCARD) &&
492 !blk_queue_discard(bdev_get_queue(split->bi_bdev)))) {
493 /* Just ignore it */
494 bio_endio(split);
495 } else
496 generic_make_request(split);
497 } while (split != bio);
498}
499
500static void raid0_status(struct seq_file *seq, struct mddev *mddev)
501{
502 seq_printf(seq, " %dk chunks", mddev->chunk_sectors / 2);
503 return;
504}
505
506static void *raid0_takeover_raid45(struct mddev *mddev)
507{
508 struct md_rdev *rdev;
509 struct r0conf *priv_conf;
510
511 if (mddev->degraded != 1) {
512 printk(KERN_ERR "md/raid0:%s: raid5 must be degraded! Degraded disks: %d\n",
513 mdname(mddev),
514 mddev->degraded);
515 return ERR_PTR(-EINVAL);
516 }
517
518 rdev_for_each(rdev, mddev) {
519 /* check slot number for a disk */
520 if (rdev->raid_disk == mddev->raid_disks-1) {
521 printk(KERN_ERR "md/raid0:%s: raid5 must have missing parity disk!\n",
522 mdname(mddev));
523 return ERR_PTR(-EINVAL);
524 }
525 rdev->sectors = mddev->dev_sectors;
526 }
527
528 /* Set new parameters */
529 mddev->new_level = 0;
530 mddev->new_layout = 0;
531 mddev->new_chunk_sectors = mddev->chunk_sectors;
532 mddev->raid_disks--;
533 mddev->delta_disks = -1;
534 /* make sure it will be not marked as dirty */
535 mddev->recovery_cp = MaxSector;
536
537 create_strip_zones(mddev, &priv_conf);
538 return priv_conf;
539}
540
541static void *raid0_takeover_raid10(struct mddev *mddev)
542{
543 struct r0conf *priv_conf;
544
545 /* Check layout:
546 * - far_copies must be 1
547 * - near_copies must be 2
548 * - disks number must be even
549 * - all mirrors must be already degraded
550 */
551 if (mddev->layout != ((1 << 8) + 2)) {
552 printk(KERN_ERR "md/raid0:%s:: Raid0 cannot takeover layout: 0x%x\n",
553 mdname(mddev),
554 mddev->layout);
555 return ERR_PTR(-EINVAL);
556 }
557 if (mddev->raid_disks & 1) {
558 printk(KERN_ERR "md/raid0:%s: Raid0 cannot takeover Raid10 with odd disk number.\n",
559 mdname(mddev));
560 return ERR_PTR(-EINVAL);
561 }
562 if (mddev->degraded != (mddev->raid_disks>>1)) {
563 printk(KERN_ERR "md/raid0:%s: All mirrors must be already degraded!\n",
564 mdname(mddev));
565 return ERR_PTR(-EINVAL);
566 }
567
568 /* Set new parameters */
569 mddev->new_level = 0;
570 mddev->new_layout = 0;
571 mddev->new_chunk_sectors = mddev->chunk_sectors;
572 mddev->delta_disks = - mddev->raid_disks / 2;
573 mddev->raid_disks += mddev->delta_disks;
574 mddev->degraded = 0;
575 /* make sure it will be not marked as dirty */
576 mddev->recovery_cp = MaxSector;
577
578 create_strip_zones(mddev, &priv_conf);
579 return priv_conf;
580}
581
582static void *raid0_takeover_raid1(struct mddev *mddev)
583{
584 struct r0conf *priv_conf;
585 int chunksect;
586
587 /* Check layout:
588 * - (N - 1) mirror drives must be already faulty
589 */
590 if ((mddev->raid_disks - 1) != mddev->degraded) {
591 printk(KERN_ERR "md/raid0:%s: (N - 1) mirrors drives must be already faulty!\n",
592 mdname(mddev));
593 return ERR_PTR(-EINVAL);
594 }
595
596 /*
597 * a raid1 doesn't have the notion of chunk size, so
598 * figure out the largest suitable size we can use.
599 */
600 chunksect = 64 * 2; /* 64K by default */
601
602 /* The array must be an exact multiple of chunksize */
603 while (chunksect && (mddev->array_sectors & (chunksect - 1)))
604 chunksect >>= 1;
605
606 if ((chunksect << 9) < PAGE_SIZE)
607 /* array size does not allow a suitable chunk size */
608 return ERR_PTR(-EINVAL);
609
610 /* Set new parameters */
611 mddev->new_level = 0;
612 mddev->new_layout = 0;
613 mddev->new_chunk_sectors = chunksect;
614 mddev->chunk_sectors = chunksect;
615 mddev->delta_disks = 1 - mddev->raid_disks;
616 mddev->raid_disks = 1;
617 /* make sure it will be not marked as dirty */
618 mddev->recovery_cp = MaxSector;
619
620 create_strip_zones(mddev, &priv_conf);
621 return priv_conf;
622}
623
624static void *raid0_takeover(struct mddev *mddev)
625{
626 /* raid0 can take over:
627 * raid4 - if all data disks are active.
628 * raid5 - providing it is Raid4 layout and one disk is faulty
629 * raid10 - assuming we have all necessary active disks
630 * raid1 - with (N -1) mirror drives faulty
631 */
632
633 if (mddev->bitmap) {
634 printk(KERN_ERR "md/raid0: %s: cannot takeover array with bitmap\n",
635 mdname(mddev));
636 return ERR_PTR(-EBUSY);
637 }
638 if (mddev->level == 4)
639 return raid0_takeover_raid45(mddev);
640
641 if (mddev->level == 5) {
642 if (mddev->layout == ALGORITHM_PARITY_N)
643 return raid0_takeover_raid45(mddev);
644
645 printk(KERN_ERR "md/raid0:%s: Raid can only takeover Raid5 with layout: %d\n",
646 mdname(mddev), ALGORITHM_PARITY_N);
647 }
648
649 if (mddev->level == 10)
650 return raid0_takeover_raid10(mddev);
651
652 if (mddev->level == 1)
653 return raid0_takeover_raid1(mddev);
654
655 printk(KERN_ERR "Takeover from raid%i to raid0 not supported\n",
656 mddev->level);
657
658 return ERR_PTR(-EINVAL);
659}
660
661static void raid0_quiesce(struct mddev *mddev, int state)
662{
663}
664
665static struct md_personality raid0_personality=
666{
667 .name = "raid0",
668 .level = 0,
669 .owner = THIS_MODULE,
670 .make_request = raid0_make_request,
671 .run = raid0_run,
672 .free = raid0_free,
673 .status = raid0_status,
674 .size = raid0_size,
675 .takeover = raid0_takeover,
676 .quiesce = raid0_quiesce,
677 .congested = raid0_congested,
678};
679
680static int __init raid0_init (void)
681{
682 return register_md_personality (&raid0_personality);
683}
684
685static void raid0_exit (void)
686{
687 unregister_md_personality (&raid0_personality);
688}
689
690module_init(raid0_init);
691module_exit(raid0_exit);
692MODULE_LICENSE("GPL");
693MODULE_DESCRIPTION("RAID0 (striping) personality for MD");
694MODULE_ALIAS("md-personality-2"); /* RAID0 */
695MODULE_ALIAS("md-raid0");
696MODULE_ALIAS("md-level-0");