raid6main.c

来自「Linux Kernel 2.6.9 for OMAP1710」· C语言 代码 · 共 2,095 行 · 第 1/4 页

C
2,095
字号
		new_sector = raid6_compute_sector(logical_sector,						  raid_disks, data_disks, &dd_idx, &pd_idx, conf);		PRINTK("raid6: make_request, sector %Lu logical %Lu\n",		       (unsigned long long)new_sector,		       (unsigned long long)logical_sector);		sh = get_active_stripe(conf, new_sector, pd_idx, (bi->bi_rw&RWA_MASK));		if (sh) {			add_stripe_bio(sh, bi, dd_idx, (bi->bi_rw&RW_MASK));			raid6_plug_device(conf);			handle_stripe(sh);			release_stripe(sh);		} else {			/* cannot get stripe for read-ahead, just give-up */			clear_bit(BIO_UPTODATE, &bi->bi_flags);			break;		}	}	spin_lock_irq(&conf->device_lock);	if (--bi->bi_phys_segments == 0) {		int bytes = bi->bi_size;		if ( bio_data_dir(bi) == WRITE )			md_write_end(mddev);		bi->bi_size = 0;		bi->bi_end_io(bi, bytes, 0);	}	spin_unlock_irq(&conf->device_lock);	return 0;}/* FIXME go_faster isn't used */static int sync_request (mddev_t *mddev, sector_t sector_nr, int go_faster){	raid6_conf_t *conf = (raid6_conf_t *) mddev->private;	struct stripe_head *sh;	int sectors_per_chunk = conf->chunk_size >> 9;	sector_t x;	unsigned long stripe;	int chunk_offset;	int dd_idx, pd_idx;	sector_t first_sector;	int raid_disks = conf->raid_disks;	int data_disks = raid_disks - 2;	if (sector_nr >= mddev->size <<1) {		/* just being told to finish up .. nothing much to do */		unplug_slaves(mddev);		return 0;	}	x = sector_nr;	chunk_offset = sector_div(x, sectors_per_chunk);	stripe = x;	BUG_ON(x != stripe);	first_sector = raid6_compute_sector((sector_t)stripe*data_disks*sectors_per_chunk		+ chunk_offset, raid_disks, data_disks, &dd_idx, &pd_idx, conf);	sh = get_active_stripe(conf, sector_nr, pd_idx, 1);	if (sh == NULL) {		sh = get_active_stripe(conf, sector_nr, pd_idx, 0);		/* make sure we don't swamp the stripe cache if someone else		 * is trying to get access		 */		set_current_state(TASK_UNINTERRUPTIBLE);		schedule_timeout(1);	}	spin_lock(&sh->lock);	set_bit(STRIPE_SYNCING, &sh->state);	clear_bit(STRIPE_INSYNC, &sh->state);	spin_unlock(&sh->lock);	handle_stripe(sh);	release_stripe(sh);	return STRIPE_SECTORS;}/* * This is our raid6 kernel thread. * * We scan the hash table for stripes which can be handled now. * During the scan, completed stripes are saved for us by the interrupt * handler, so that they will not have to wait for our next wakeup. */static void raid6d (mddev_t *mddev){	struct stripe_head *sh;	raid6_conf_t *conf = mddev_to_conf(mddev);	int handled;	PRINTK("+++ raid6d active\n");	md_check_recovery(mddev);	md_handle_safemode(mddev);	handled = 0;	spin_lock_irq(&conf->device_lock);	while (1) {		struct list_head *first;		if (list_empty(&conf->handle_list) &&		    atomic_read(&conf->preread_active_stripes) < IO_THRESHOLD &&		    !blk_queue_plugged(mddev->queue) &&		    !list_empty(&conf->delayed_list))			raid6_activate_delayed(conf);		if (list_empty(&conf->handle_list))			break;		first = conf->handle_list.next;		sh = list_entry(first, struct stripe_head, lru);		list_del_init(first);		atomic_inc(&sh->count);		if (atomic_read(&sh->count)!= 1)			BUG();		spin_unlock_irq(&conf->device_lock);		handled++;		handle_stripe(sh);		release_stripe(sh);		spin_lock_irq(&conf->device_lock);	}	PRINTK("%d stripes handled\n", handled);	spin_unlock_irq(&conf->device_lock);	unplug_slaves(mddev);	PRINTK("--- raid6d inactive\n");}static int run (mddev_t *mddev){	raid6_conf_t *conf;	int raid_disk, memory;	mdk_rdev_t *rdev;	struct disk_info *disk;	struct list_head *tmp;	if (mddev->level != 6) {		PRINTK("raid6: %s: raid level not set to 6 (%d)\n", mdname(mddev), mddev->level);		return -EIO;	}	mddev->private = kmalloc (sizeof (raid6_conf_t)				  + mddev->raid_disks * sizeof(struct disk_info),				  GFP_KERNEL);	if ((conf = mddev->private) == NULL)		goto abort;	memset (conf, 0, sizeof (*conf) + mddev->raid_disks * sizeof(struct disk_info) );	conf->mddev = mddev;	if ((conf->stripe_hashtbl = (struct stripe_head **) __get_free_pages(GFP_ATOMIC, HASH_PAGES_ORDER)) == NULL)		goto abort;	memset(conf->stripe_hashtbl, 0, HASH_PAGES * PAGE_SIZE);	conf->device_lock = SPIN_LOCK_UNLOCKED;	init_waitqueue_head(&conf->wait_for_stripe);	INIT_LIST_HEAD(&conf->handle_list);	INIT_LIST_HEAD(&conf->delayed_list);	INIT_LIST_HEAD(&conf->inactive_list);	atomic_set(&conf->active_stripes, 0);	atomic_set(&conf->preread_active_stripes, 0);	mddev->queue->unplug_fn = raid6_unplug_device;	mddev->queue->issue_flush_fn = raid6_issue_flush;	PRINTK("raid6: run(%s) called.\n", mdname(mddev));	ITERATE_RDEV(mddev,rdev,tmp) {		raid_disk = rdev->raid_disk;		if (raid_disk >= mddev->raid_disks		    || raid_disk < 0)			continue;		disk = conf->disks + raid_disk;		disk->rdev = rdev;		if (rdev->in_sync) {			char b[BDEVNAME_SIZE];			printk(KERN_INFO "raid6: device %s operational as raid"			       " disk %d\n", bdevname(rdev->bdev,b),			       raid_disk);			conf->working_disks++;		}	}	conf->raid_disks = mddev->raid_disks;	/*	 * 0 for a fully functional array, 1 or 2 for a degraded array.	 */	mddev->degraded = conf->failed_disks = conf->raid_disks - conf->working_disks;	conf->mddev = mddev;	conf->chunk_size = mddev->chunk_size;	conf->level = mddev->level;	conf->algorithm = mddev->layout;	conf->max_nr_stripes = NR_STRIPES;	/* device size must be a multiple of chunk size */	mddev->size &= ~(mddev->chunk_size/1024 -1);	if (conf->raid_disks < 4) {		printk(KERN_ERR "raid6: not enough configured devices for %s (%d, minimum 4)\n",		       mdname(mddev), conf->raid_disks);		goto abort;	}	if (!conf->chunk_size || conf->chunk_size % 4) {		printk(KERN_ERR "raid6: invalid chunk size %d for %s\n",		       conf->chunk_size, mdname(mddev));		goto abort;	}	if (conf->algorithm > ALGORITHM_RIGHT_SYMMETRIC) {		printk(KERN_ERR		       "raid6: unsupported parity algorithm %d for %s\n",		       conf->algorithm, mdname(mddev));		goto abort;	}	if (mddev->degraded > 2) {		printk(KERN_ERR "raid6: not enough operational devices for %s"		       " (%d/%d failed)\n",		       mdname(mddev), conf->failed_disks, conf->raid_disks);		goto abort;	}#if 0				/* FIX: For now */	if (mddev->degraded > 0 &&	    mddev->recovery_cp != MaxSector) {		printk(KERN_ERR "raid6: cannot start dirty degraded array for %s\n", mdname(mddev));		goto abort;	}#endif	{		mddev->thread = md_register_thread(raid6d, mddev, "%s_raid6");		if (!mddev->thread) {			printk(KERN_ERR			       "raid6: couldn't allocate thread for %s\n",			       mdname(mddev));			goto abort;		}	}	memory = conf->max_nr_stripes * (sizeof(struct stripe_head) +		 conf->raid_disks * ((sizeof(struct bio) + PAGE_SIZE))) / 1024;	if (grow_stripes(conf, conf->max_nr_stripes)) {		printk(KERN_ERR		       "raid6: couldn't allocate %dkB for buffers\n", memory);		shrink_stripes(conf);		md_unregister_thread(mddev->thread);		goto abort;	} else		printk(KERN_INFO "raid6: allocated %dkB for %s\n",		       memory, mdname(mddev));	if (mddev->degraded == 0)		printk(KERN_INFO "raid6: raid level %d set %s active with %d out of %d"		       " devices, algorithm %d\n", conf->level, mdname(mddev),		       mddev->raid_disks-mddev->degraded, mddev->raid_disks,		       conf->algorithm);	else		printk(KERN_ALERT "raid6: raid level %d set %s active with %d"		       " out of %d devices, algorithm %d\n", conf->level,		       mdname(mddev), mddev->raid_disks - mddev->degraded,		       mddev->raid_disks, conf->algorithm);	print_raid6_conf(conf);	/* read-ahead size must cover two whole stripes, which is	 * 2 * (n-2) * chunksize where 'n' is the number of raid devices	 */	{		int stripe = (mddev->raid_disks-2) * mddev->chunk_size			/ PAGE_CACHE_SIZE;		if (mddev->queue->backing_dev_info.ra_pages < 2 * stripe)			mddev->queue->backing_dev_info.ra_pages = 2 * stripe;	}	/* Ok, everything is just fine now */	mddev->array_size =  mddev->size * (mddev->raid_disks - 2);	return 0;abort:	if (conf) {		print_raid6_conf(conf);		if (conf->stripe_hashtbl)			free_pages((unsigned long) conf->stripe_hashtbl,							HASH_PAGES_ORDER);		kfree(conf);	}	mddev->private = NULL;	printk(KERN_ALERT "raid6: failed to run raid set %s\n", mdname(mddev));	return -EIO;}static int stop (mddev_t *mddev){	raid6_conf_t *conf = (raid6_conf_t *) mddev->private;	md_unregister_thread(mddev->thread);	mddev->thread = NULL;	shrink_stripes(conf);	free_pages((unsigned long) conf->stripe_hashtbl, HASH_PAGES_ORDER);	kfree(conf);	mddev->private = NULL;	return 0;}#if RAID6_DUMPSTATEstatic void print_sh (struct seq_file *seq, struct stripe_head *sh){	int i;	seq_printf(seq, "sh %llu, pd_idx %d, state %ld.\n",		   (unsigned long long)sh->sector, sh->pd_idx, sh->state);	seq_printf(seq, "sh %llu,  count %d.\n",		   (unsigned long long)sh->sector, atomic_read(&sh->count));	seq_printf(seq, "sh %llu, ", (unsigned long long)sh->sector);	for (i = 0; i < sh->raid_conf->raid_disks; i++) {		seq_printf(seq, "(cache%d: %p %ld) ",			   i, sh->dev[i].page, sh->dev[i].flags);	}	seq_printf(seq, "\n");}static void printall (struct seq_file *seq, raid6_conf_t *conf){	struct stripe_head *sh;	int i;	spin_lock_irq(&conf->device_lock);	for (i = 0; i < NR_HASH; i++) {		sh = conf->stripe_hashtbl[i];		for (; sh; sh = sh->hash_next) {			if (sh->raid_conf != conf)				continue;			print_sh(seq, sh);		}	}	spin_unlock_irq(&conf->device_lock);}#endifstatic void status (struct seq_file *seq, mddev_t *mddev){	raid6_conf_t *conf = (raid6_conf_t *) mddev->private;	int i;	seq_printf (seq, " level %d, %dk chunk, algorithm %d", mddev->level, mddev->chunk_size >> 10, mddev->layout);	seq_printf (seq, " [%d/%d] [", conf->raid_disks, conf->working_disks);	for (i = 0; i < conf->raid_disks; i++) 		seq_printf (seq, "%s",			    conf->disks[i].rdev &&			    conf->disks[i].rdev->in_sync ? "U" : "_");	seq_printf (seq, "]");#if RAID6_DUMPSTATE	seq_printf (seq, "\n");	printall(seq, conf);#endif}static void print_raid6_conf (raid6_conf_t *conf){	int i;	struct disk_info *tmp;	printk("RAID6 conf printout:\n");	if (!conf) {		printk("(conf==NULL)\n");		return;	}	printk(" --- rd:%d wd:%d fd:%d\n", conf->raid_disks,		 conf->working_disks, conf->failed_disks);	for (i = 0; i < conf->raid_disks; i++) {		char b[BDEVNAME_SIZE];		tmp = conf->disks + i;		if (tmp->rdev)		printk(" disk %d, o:%d, dev:%s\n",			i, !tmp->rdev->faulty,			bdevname(tmp->rdev->bdev,b));	}}static int raid6_spare_active(mddev_t *mddev){	int i;	raid6_conf_t *conf = mddev->private;	struct disk_info *tmp;	spin_lock_irq(&conf->device_lock);	for (i = 0; i < conf->raid_disks; i++) {		tmp = conf->disks + i;		if (tmp->rdev		    && !tmp->rdev->faulty		    && !tmp->rdev->in_sync) {			mddev->degraded--;			conf->failed_disks--;			conf->working_disks++;			tmp->rdev->in_sync = 1;		}	}	spin_unlock_irq(&conf->device_lock);	print_raid6_conf(conf);	return 0;}static int raid6_remove_disk(mddev_t *mddev, int number){	raid6_conf_t *conf = mddev->private;	int err = 1;	struct disk_info *p = conf->disks + number;	print_raid6_conf(conf);	spin_lock_irq(&conf->device_lock);	if (p->rdev) {		if (p->rdev->in_sync ||		    atomic_read(&p->rdev->nr_pending)) {			err = -EBUSY;			goto abort;		}		p->rdev = NULL;		err = 0;	}	if (err)		MD_BUG();abort:	spin_unlock_irq(&conf->device_lock);	print_raid6_conf(conf);	return err;}static int raid6_add_disk(mddev_t *mddev, mdk_rdev_t *rdev){	raid6_conf_t *conf = mddev->private;	int found = 0;	int disk;	struct disk_info *p;	spin_lock_irq(&conf->device_lock);	/*	 * find the disk ...	 */	for (disk=0; disk < mddev->raid_disks; disk++)		if ((p=conf->disks + disk)->rdev == NULL) {			p->rdev = rdev;			rdev->in_sync = 0;			rdev->raid_disk = disk;			found = 1;			break;		}	spin_unlock_irq(&conf->device_lock);	print_raid6_conf(conf);	return found;}static int raid6_resize(mddev_t *mddev, sector_t sectors){	/* no resync is happening, and there is enough space	 * on all devices, so we can resize.	 * We need to make sure resync covers any new space.	 * If the array is shrinking we should possibly wait until	 * any io in the removed space completes, but it hardly seems	 * worth it.	 */	sectors &= ~((sector_t)mddev->chunk_size/512 - 1);	mddev->array_size = (sectors * (mddev->raid_disks-2))>>1;	set_capacity(mddev->gendisk, mddev->array_size << 1);	mddev->changed = 1;	if (sectors/2  > mddev->size && mddev->recovery_cp == MaxSector) {		mddev->recovery_cp = mddev->size << 1;		set_bit(MD_RECOVERY_NEEDED, &mddev->recovery);	}	mddev->size = sectors /2;	return 0;}static mdk_personality_t raid6_personality={	.name		= "raid6",	.owner		= THIS_MODULE,	.make_request	= make_request,	.run		= run,	.stop		= stop,	.status		= status,	.error_handler	= error,	.hot_add_disk	= raid6_add_disk,	.hot_remove_disk= raid6_remove_disk,	.spare_active	= raid6_spare_active,	.sync_request	= sync_request,	.resize		= raid6_resize,};static int __init raid6_init (void){	int e;	e = raid6_select_algo();	if ( e )		return e;	return register_md_personality (RAID6, &raid6_personality);}static void raid6_exit (void){	unregister_md_personality (RAID6);}module_init(raid6_init);module_exit(raid6_exit);MODULE_LICENSE("GPL");MODULE_ALIAS("md-personality-8"); /* RAID6 */

⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?