raid5.c
来自「Linux Kernel 2.6.9 for OMAP1710」· C语言 代码 · 共 1,920 行 · 第 1/4 页
C
1,920 行
spin_unlock_irq(&conf->device_lock); return 0;}/* FIXME go_faster isn't used */static int sync_request (mddev_t *mddev, sector_t sector_nr, int go_faster){ raid5_conf_t *conf = (raid5_conf_t *) mddev->private; struct stripe_head *sh; int sectors_per_chunk = conf->chunk_size >> 9; sector_t x; unsigned long stripe; int chunk_offset; int dd_idx, pd_idx; sector_t first_sector; int raid_disks = conf->raid_disks; int data_disks = raid_disks-1; if (sector_nr >= mddev->size <<1) { /* just being told to finish up .. nothing much to do */ unplug_slaves(mddev); return 0; } x = sector_nr; chunk_offset = sector_div(x, sectors_per_chunk); stripe = x; BUG_ON(x != stripe); first_sector = raid5_compute_sector((sector_t)stripe*data_disks*sectors_per_chunk + chunk_offset, raid_disks, data_disks, &dd_idx, &pd_idx, conf); sh = get_active_stripe(conf, sector_nr, pd_idx, 1); if (sh == NULL) { sh = get_active_stripe(conf, sector_nr, pd_idx, 0); /* make sure we don't swamp the stripe cache if someone else * is trying to get access */ set_current_state(TASK_UNINTERRUPTIBLE); schedule_timeout(1); } spin_lock(&sh->lock); set_bit(STRIPE_SYNCING, &sh->state); clear_bit(STRIPE_INSYNC, &sh->state); spin_unlock(&sh->lock); handle_stripe(sh); release_stripe(sh); return STRIPE_SECTORS;}/* * This is our raid5 kernel thread. * * We scan the hash table for stripes which can be handled now. * During the scan, completed stripes are saved for us by the interrupt * handler, so that they will not have to wait for our next wakeup. */static void raid5d (mddev_t *mddev){ struct stripe_head *sh; raid5_conf_t *conf = mddev_to_conf(mddev); int handled; PRINTK("+++ raid5d active\n"); md_check_recovery(mddev); md_handle_safemode(mddev); handled = 0; spin_lock_irq(&conf->device_lock); while (1) { struct list_head *first; if (list_empty(&conf->handle_list) && atomic_read(&conf->preread_active_stripes) < IO_THRESHOLD && !blk_queue_plugged(mddev->queue) && !list_empty(&conf->delayed_list)) raid5_activate_delayed(conf); if (list_empty(&conf->handle_list)) break; first = conf->handle_list.next; sh = list_entry(first, struct stripe_head, lru); list_del_init(first); atomic_inc(&sh->count); if (atomic_read(&sh->count)!= 1) BUG(); spin_unlock_irq(&conf->device_lock); handled++; handle_stripe(sh); release_stripe(sh); spin_lock_irq(&conf->device_lock); } PRINTK("%d stripes handled\n", handled); spin_unlock_irq(&conf->device_lock); unplug_slaves(mddev); PRINTK("--- raid5d inactive\n");}static int run (mddev_t *mddev){ raid5_conf_t *conf; int raid_disk, memory; mdk_rdev_t *rdev; struct disk_info *disk; struct list_head *tmp; if (mddev->level != 5 && mddev->level != 4) { printk("raid5: %s: raid level not set to 4/5 (%d)\n", mdname(mddev), mddev->level); return -EIO; } mddev->private = kmalloc (sizeof (raid5_conf_t) + mddev->raid_disks * sizeof(struct disk_info), GFP_KERNEL); if ((conf = mddev->private) == NULL) goto abort; memset (conf, 0, sizeof (*conf) + mddev->raid_disks * sizeof(struct disk_info) ); conf->mddev = mddev; if ((conf->stripe_hashtbl = (struct stripe_head **) __get_free_pages(GFP_ATOMIC, HASH_PAGES_ORDER)) == NULL) goto abort; memset(conf->stripe_hashtbl, 0, HASH_PAGES * PAGE_SIZE); conf->device_lock = SPIN_LOCK_UNLOCKED; init_waitqueue_head(&conf->wait_for_stripe); INIT_LIST_HEAD(&conf->handle_list); INIT_LIST_HEAD(&conf->delayed_list); INIT_LIST_HEAD(&conf->inactive_list); atomic_set(&conf->active_stripes, 0); atomic_set(&conf->preread_active_stripes, 0); mddev->queue->unplug_fn = raid5_unplug_device; mddev->queue->issue_flush_fn = raid5_issue_flush; PRINTK("raid5: run(%s) called.\n", mdname(mddev)); ITERATE_RDEV(mddev,rdev,tmp) { raid_disk = rdev->raid_disk; if (raid_disk >= mddev->raid_disks || raid_disk < 0) continue; disk = conf->disks + raid_disk; disk->rdev = rdev; if (rdev->in_sync) { char b[BDEVNAME_SIZE]; printk(KERN_INFO "raid5: device %s operational as raid" " disk %d\n", bdevname(rdev->bdev,b), raid_disk); conf->working_disks++; } } conf->raid_disks = mddev->raid_disks; /* * 0 for a fully functional array, 1 for a degraded array. */ mddev->degraded = conf->failed_disks = conf->raid_disks - conf->working_disks; conf->mddev = mddev; conf->chunk_size = mddev->chunk_size; conf->level = mddev->level; conf->algorithm = mddev->layout; conf->max_nr_stripes = NR_STRIPES; /* device size must be a multiple of chunk size */ mddev->size &= ~(mddev->chunk_size/1024 -1); if (!conf->chunk_size || conf->chunk_size % 4) { printk(KERN_ERR "raid5: invalid chunk size %d for %s\n", conf->chunk_size, mdname(mddev)); goto abort; } if (conf->algorithm > ALGORITHM_RIGHT_SYMMETRIC) { printk(KERN_ERR "raid5: unsupported parity algorithm %d for %s\n", conf->algorithm, mdname(mddev)); goto abort; } if (mddev->degraded > 1) { printk(KERN_ERR "raid5: not enough operational devices for %s" " (%d/%d failed)\n", mdname(mddev), conf->failed_disks, conf->raid_disks); goto abort; } if (mddev->degraded == 1 && mddev->recovery_cp != MaxSector) { printk(KERN_ERR "raid5: cannot start dirty degraded array for %s\n", mdname(mddev)); goto abort; } { mddev->thread = md_register_thread(raid5d, mddev, "%s_raid5"); if (!mddev->thread) { printk(KERN_ERR "raid5: couldn't allocate thread for %s\n", mdname(mddev)); goto abort; } }memory = conf->max_nr_stripes * (sizeof(struct stripe_head) + conf->raid_disks * ((sizeof(struct bio) + PAGE_SIZE))) / 1024; if (grow_stripes(conf, conf->max_nr_stripes)) { printk(KERN_ERR "raid5: couldn't allocate %dkB for buffers\n", memory); shrink_stripes(conf); md_unregister_thread(mddev->thread); goto abort; } else printk(KERN_INFO "raid5: allocated %dkB for %s\n", memory, mdname(mddev)); if (mddev->degraded == 0) printk("raid5: raid level %d set %s active with %d out of %d" " devices, algorithm %d\n", conf->level, mdname(mddev), mddev->raid_disks-mddev->degraded, mddev->raid_disks, conf->algorithm); else printk(KERN_ALERT "raid5: raid level %d set %s active with %d" " out of %d devices, algorithm %d\n", conf->level, mdname(mddev), mddev->raid_disks - mddev->degraded, mddev->raid_disks, conf->algorithm); print_raid5_conf(conf); /* read-ahead size must cover two whole stripes, which is * 2 * (n-1) * chunksize where 'n' is the number of raid devices */ { int stripe = (mddev->raid_disks-1) * mddev->chunk_size / PAGE_CACHE_SIZE; if (mddev->queue->backing_dev_info.ra_pages < 2 * stripe) mddev->queue->backing_dev_info.ra_pages = 2 * stripe; } /* Ok, everything is just fine now */ mddev->array_size = mddev->size * (mddev->raid_disks - 1); return 0;abort: if (conf) { print_raid5_conf(conf); if (conf->stripe_hashtbl) free_pages((unsigned long) conf->stripe_hashtbl, HASH_PAGES_ORDER); kfree(conf); } mddev->private = NULL; printk(KERN_ALERT "raid5: failed to run raid set %s\n", mdname(mddev)); return -EIO;}static int stop (mddev_t *mddev){ raid5_conf_t *conf = (raid5_conf_t *) mddev->private; md_unregister_thread(mddev->thread); mddev->thread = NULL; shrink_stripes(conf); free_pages((unsigned long) conf->stripe_hashtbl, HASH_PAGES_ORDER); kfree(conf); mddev->private = NULL; return 0;}#if RAID5_DEBUGstatic void print_sh (struct stripe_head *sh){ int i; printk("sh %llu, pd_idx %d, state %ld.\n", (unsigned long long)sh->sector, sh->pd_idx, sh->state); printk("sh %llu, count %d.\n", (unsigned long long)sh->sector, atomic_read(&sh->count)); printk("sh %llu, ", (unsigned long long)sh->sector); for (i = 0; i < sh->raid_conf->raid_disks; i++) { printk("(cache%d: %p %ld) ", i, sh->dev[i].page, sh->dev[i].flags); } printk("\n");}static void printall (raid5_conf_t *conf){ struct stripe_head *sh; int i; spin_lock_irq(&conf->device_lock); for (i = 0; i < NR_HASH; i++) { sh = conf->stripe_hashtbl[i]; for (; sh; sh = sh->hash_next) { if (sh->raid_conf != conf) continue; print_sh(sh); } } spin_unlock_irq(&conf->device_lock);}#endifstatic void status (struct seq_file *seq, mddev_t *mddev){ raid5_conf_t *conf = (raid5_conf_t *) mddev->private; int i; seq_printf (seq, " level %d, %dk chunk, algorithm %d", mddev->level, mddev->chunk_size >> 10, mddev->layout); seq_printf (seq, " [%d/%d] [", conf->raid_disks, conf->working_disks); for (i = 0; i < conf->raid_disks; i++) seq_printf (seq, "%s", conf->disks[i].rdev && conf->disks[i].rdev->in_sync ? "U" : "_"); seq_printf (seq, "]");#if RAID5_DEBUG#define D(x) \ seq_printf (seq, "<"#x":%d>", atomic_read(&conf->x)) printall(conf);#endif}static void print_raid5_conf (raid5_conf_t *conf){ int i; struct disk_info *tmp; printk("RAID5 conf printout:\n"); if (!conf) { printk("(conf==NULL)\n"); return; } printk(" --- rd:%d wd:%d fd:%d\n", conf->raid_disks, conf->working_disks, conf->failed_disks); for (i = 0; i < conf->raid_disks; i++) { char b[BDEVNAME_SIZE]; tmp = conf->disks + i; if (tmp->rdev) printk(" disk %d, o:%d, dev:%s\n", i, !tmp->rdev->faulty, bdevname(tmp->rdev->bdev,b)); }}static int raid5_spare_active(mddev_t *mddev){ int i; raid5_conf_t *conf = mddev->private; struct disk_info *tmp; spin_lock_irq(&conf->device_lock); for (i = 0; i < conf->raid_disks; i++) { tmp = conf->disks + i; if (tmp->rdev && !tmp->rdev->faulty && !tmp->rdev->in_sync) { mddev->degraded--; conf->failed_disks--; conf->working_disks++; tmp->rdev->in_sync = 1; } } spin_unlock_irq(&conf->device_lock); print_raid5_conf(conf); return 0;}static int raid5_remove_disk(mddev_t *mddev, int number){ raid5_conf_t *conf = mddev->private; int err = 1; struct disk_info *p = conf->disks + number; print_raid5_conf(conf); spin_lock_irq(&conf->device_lock); if (p->rdev) { if (p->rdev->in_sync || atomic_read(&p->rdev->nr_pending)) { err = -EBUSY; goto abort; } p->rdev = NULL; err = 0; } if (err) MD_BUG();abort: spin_unlock_irq(&conf->device_lock); print_raid5_conf(conf); return err;}static int raid5_add_disk(mddev_t *mddev, mdk_rdev_t *rdev){ raid5_conf_t *conf = mddev->private; int found = 0; int disk; struct disk_info *p; spin_lock_irq(&conf->device_lock); /* * find the disk ... */ for (disk=0; disk < mddev->raid_disks; disk++) if ((p=conf->disks + disk)->rdev == NULL) { p->rdev = rdev; rdev->in_sync = 0; rdev->raid_disk = disk; found = 1; break; } spin_unlock_irq(&conf->device_lock); print_raid5_conf(conf); return found;}static int raid5_resize(mddev_t *mddev, sector_t sectors){ /* no resync is happening, and there is enough space * on all devices, so we can resize. * We need to make sure resync covers any new space. * If the array is shrinking we should possibly wait until * any io in the removed space completes, but it hardly seems * worth it. */ sectors &= ~((sector_t)mddev->chunk_size/512 - 1); mddev->array_size = (sectors * (mddev->raid_disks-1))>>1; set_capacity(mddev->gendisk, mddev->array_size << 1); mddev->changed = 1; if (sectors/2 > mddev->size && mddev->recovery_cp == MaxSector) { mddev->recovery_cp = mddev->size << 1; set_bit(MD_RECOVERY_NEEDED, &mddev->recovery); } mddev->size = sectors /2; return 0;}static mdk_personality_t raid5_personality={ .name = "raid5", .owner = THIS_MODULE, .make_request = make_request, .run = run, .stop = stop, .status = status, .error_handler = error, .hot_add_disk = raid5_add_disk, .hot_remove_disk= raid5_remove_disk, .spare_active = raid5_spare_active, .sync_request = sync_request, .resize = raid5_resize,};static int __init raid5_init (void){ return register_md_personality (RAID5, &raid5_personality);}static void raid5_exit (void){ unregister_md_personality (RAID5);}module_init(raid5_init);module_exit(raid5_exit);MODULE_LICENSE("GPL");MODULE_ALIAS("md-personality-4"); /* RAID5 */
⌨️ 快捷键说明
复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?