patch-2.3.43 linux/drivers/block/raid0.c
Next file: linux/drivers/block/rd.c
Previous file: linux/drivers/block/paride/pt.c
Back to the patch index
Back to the overall index
- Lines: 580
- Date:
Tue Feb 8 11:39:00 2000
- Orig file:
v2.3.42/linux/drivers/block/raid0.c
- Orig date:
Fri Jan 21 18:19:16 2000
diff -u --recursive --new-file v2.3.42/linux/drivers/block/raid0.c linux/drivers/block/raid0.c
@@ -1,9 +1,10 @@
-
/*
raid0.c : Multiple Devices driver for Linux
Copyright (C) 1994-96 Marc ZYNGIER
<zyngier@ufr-info-p7.ibp.fr> or
<maz@gloups.fdn.fr>
+ Copyright (C) 1999, 2000 Ingo Molnar, Red Hat
+
RAID-0 management functions.
@@ -18,146 +19,201 @@
*/
#include <linux/module.h>
-#include <linux/md.h>
-#include <linux/raid0.h>
-#include <linux/vmalloc.h>
+#include <linux/raid/raid0.h>
#define MAJOR_NR MD_MAJOR
#define MD_DRIVER
#define MD_PERSONALITY
-static int create_strip_zones (int minor, struct md_dev *mddev)
+static int create_strip_zones (mddev_t *mddev)
{
- int i, j, c=0;
- int current_offset=0;
- struct real_dev *smallest_by_zone;
- struct raid0_data *data=(struct raid0_data *) mddev->private;
-
- data->nr_strip_zones=1;
-
- for (i=1; i<mddev->nb_dev; i++)
- {
- for (j=0; j<i; j++)
- if (mddev->devices[i].size==mddev->devices[j].size)
- {
- c=1;
- break;
- }
-
- if (!c)
- data->nr_strip_zones++;
-
- c=0;
- }
-
- if ((data->strip_zone=vmalloc(sizeof(struct strip_zone)*data->nr_strip_zones)) == NULL)
- return 1;
-
- data->smallest=NULL;
-
- for (i=0; i<data->nr_strip_zones; i++)
- {
- data->strip_zone[i].dev_offset=current_offset;
- smallest_by_zone=NULL;
- c=0;
-
- for (j=0; j<mddev->nb_dev; j++)
- if (mddev->devices[j].size>current_offset)
- {
- data->strip_zone[i].dev[c++]=mddev->devices+j;
- if (!smallest_by_zone ||
- smallest_by_zone->size > mddev->devices[j].size)
- smallest_by_zone=mddev->devices+j;
- }
-
- data->strip_zone[i].nb_dev=c;
- data->strip_zone[i].size=(smallest_by_zone->size-current_offset)*c;
-
- if (!data->smallest ||
- data->smallest->size > data->strip_zone[i].size)
- data->smallest=data->strip_zone+i;
-
- data->strip_zone[i].zone_offset=i ? (data->strip_zone[i-1].zone_offset+
- data->strip_zone[i-1].size) : 0;
- current_offset=smallest_by_zone->size;
- }
- return 0;
+ int i, c, j, j1, j2;
+ int current_offset, curr_zone_offset;
+ raid0_conf_t *conf = mddev_to_conf(mddev);
+ mdk_rdev_t *smallest, *rdev1, *rdev2, *rdev;
+
+ /*
+ * The number of 'same size groups'
+ */
+ conf->nr_strip_zones = 0;
+
+ ITERATE_RDEV_ORDERED(mddev,rdev1,j1) {
+ printk("raid0: looking at %s\n", partition_name(rdev1->dev));
+ c = 0;
+ ITERATE_RDEV_ORDERED(mddev,rdev2,j2) {
+ printk("raid0: comparing %s(%d) with %s(%d)\n", partition_name(rdev1->dev), rdev1->size, partition_name(rdev2->dev), rdev2->size);
+ if (rdev2 == rdev1) {
+ printk("raid0: END\n");
+ break;
+ }
+ if (rdev2->size == rdev1->size)
+ {
+ /*
+ * Not unique, dont count it as a new
+ * group
+ */
+ printk("raid0: EQUAL\n");
+ c = 1;
+ break;
+ }
+ printk("raid0: NOT EQUAL\n");
+ }
+ if (!c) {
+ printk("raid0: ==> UNIQUE\n");
+ conf->nr_strip_zones++;
+ printk("raid0: %d zones\n", conf->nr_strip_zones);
+ }
+ }
+ printk("raid0: FINAL %d zones\n", conf->nr_strip_zones);
+
+ conf->strip_zone = vmalloc(sizeof(struct strip_zone)*
+ conf->nr_strip_zones);
+ if (!conf->strip_zone)
+ return 1;
+
+
+ conf->smallest = NULL;
+ current_offset = 0;
+ curr_zone_offset = 0;
+
+ for (i = 0; i < conf->nr_strip_zones; i++)
+ {
+ struct strip_zone *zone = conf->strip_zone + i;
+
+ printk("zone %d\n", i);
+ zone->dev_offset = current_offset;
+ smallest = NULL;
+ c = 0;
+
+ ITERATE_RDEV_ORDERED(mddev,rdev,j) {
+
+ printk(" checking %s ...", partition_name(rdev->dev));
+ if (rdev->size > current_offset)
+ {
+ printk(" contained as device %d\n", c);
+ zone->dev[c] = rdev;
+ c++;
+ if (!smallest || (rdev->size <smallest->size)) {
+ smallest = rdev;
+ printk(" (%d) is smallest!.\n", rdev->size);
+ }
+ } else
+ printk(" nope.\n");
+ }
+
+ zone->nb_dev = c;
+ zone->size = (smallest->size - current_offset) * c;
+ printk(" zone->nb_dev: %d, size: %d\n",zone->nb_dev,zone->size);
+
+ if (!conf->smallest || (zone->size < conf->smallest->size))
+ conf->smallest = zone;
+
+ zone->zone_offset = curr_zone_offset;
+ curr_zone_offset += zone->size;
+
+ current_offset = smallest->size;
+ printk("current zone offset: %d\n", current_offset);
+ }
+ printk("done.\n");
+ return 0;
}
-static int raid0_run (int minor, struct md_dev *mddev)
+static int raid0_run (mddev_t *mddev)
{
- int cur=0, i=0, size, zone0_size, nb_zone;
- struct raid0_data *data;
+ int cur=0, i=0, size, zone0_size, nb_zone;
+ raid0_conf_t *conf;
- MOD_INC_USE_COUNT;
-
- if ((mddev->private=vmalloc (sizeof (struct raid0_data))) == NULL) return 1;
- data=(struct raid0_data *) mddev->private;
-
- if (create_strip_zones (minor, mddev))
- {
- vfree(data);
- return 1;
- }
-
- nb_zone=data->nr_zones=
- md_size[minor]/data->smallest->size +
- (md_size[minor]%data->smallest->size ? 1 : 0);
-
- printk ("raid0 : Allocating %ld bytes for hash.\n",(long)sizeof(struct raid0_hash)*nb_zone);
- if ((data->hash_table=vmalloc (sizeof (struct raid0_hash)*nb_zone)) == NULL)
- {
- vfree(data->strip_zone);
- vfree(data);
- return 1;
- }
- size=data->strip_zone[cur].size;
-
- i=0;
- while (cur<data->nr_strip_zones)
- {
- data->hash_table[i].zone0=data->strip_zone+cur;
-
- if (size>=data->smallest->size)/* If we completely fill the slot */
- {
- data->hash_table[i++].zone1=NULL;
- size-=data->smallest->size;
-
- if (!size)
- {
- if (++cur==data->nr_strip_zones) continue;
- size=data->strip_zone[cur].size;
- }
-
- continue;
- }
-
- if (++cur==data->nr_strip_zones) /* Last dev, set unit1 as NULL */
- {
- data->hash_table[i].zone1=NULL;
- continue;
- }
-
- zone0_size=size; /* Here, we use a 2nd dev to fill the slot */
- size=data->strip_zone[cur].size;
- data->hash_table[i++].zone1=data->strip_zone+cur;
- size-=(data->smallest->size - zone0_size);
- }
+ MOD_INC_USE_COUNT;
- return (0);
+ conf = vmalloc(sizeof (raid0_conf_t));
+ if (!conf)
+ goto out;
+ mddev->private = (void *)conf;
+
+ if (md_check_ordering(mddev)) {
+ printk("raid0: disks are not ordered, aborting!\n");
+ goto out_free_conf;
+ }
+
+ if (create_strip_zones (mddev))
+ goto out_free_conf;
+
+ printk("raid0 : md_size is %d blocks.\n", md_size[mdidx(mddev)]);
+ printk("raid0 : conf->smallest->size is %d blocks.\n", conf->smallest->size);
+ nb_zone = md_size[mdidx(mddev)]/conf->smallest->size +
+ (md_size[mdidx(mddev)] % conf->smallest->size ? 1 : 0);
+ printk("raid0 : nb_zone is %d.\n", nb_zone);
+ conf->nr_zones = nb_zone;
+
+ printk("raid0 : Allocating %d bytes for hash.\n",
+ sizeof(struct raid0_hash)*nb_zone);
+
+ conf->hash_table = vmalloc (sizeof (struct raid0_hash)*nb_zone);
+ if (!conf->hash_table)
+ goto out_free_zone_conf;
+ size = conf->strip_zone[cur].size;
+
+ i = 0;
+ while (cur < conf->nr_strip_zones) {
+ conf->hash_table[i].zone0 = conf->strip_zone + cur;
+
+ /*
+ * If we completely fill the slot
+ */
+ if (size >= conf->smallest->size) {
+ conf->hash_table[i++].zone1 = NULL;
+ size -= conf->smallest->size;
+
+ if (!size) {
+ if (++cur == conf->nr_strip_zones)
+ continue;
+ size = conf->strip_zone[cur].size;
+ }
+ continue;
+ }
+ if (++cur == conf->nr_strip_zones) {
+ /*
+ * Last dev, set unit1 as NULL
+ */
+ conf->hash_table[i].zone1=NULL;
+ continue;
+ }
+
+ /*
+ * Here we use a 2nd dev to fill the slot
+ */
+ zone0_size = size;
+ size = conf->strip_zone[cur].size;
+ conf->hash_table[i++].zone1 = conf->strip_zone + cur;
+ size -= (conf->smallest->size - zone0_size);
+ }
+ return 0;
+
+out_free_zone_conf:
+ vfree(conf->strip_zone);
+ conf->strip_zone = NULL;
+
+out_free_conf:
+ vfree(conf);
+ mddev->private = NULL;
+out:
+ MOD_DEC_USE_COUNT;
+ return 1;
}
-
-static int raid0_stop (int minor, struct md_dev *mddev)
+static int raid0_stop (mddev_t *mddev)
{
- struct raid0_data *data=(struct raid0_data *) mddev->private;
+ raid0_conf_t *conf = mddev_to_conf(mddev);
- vfree (data->hash_table);
- vfree (data->strip_zone);
- vfree (data);
+ vfree (conf->hash_table);
+ conf->hash_table = NULL;
+ vfree (conf->strip_zone);
+ conf->strip_zone = NULL;
+ vfree (conf);
+ mddev->private = NULL;
- MOD_DEC_USE_COUNT;
- return 0;
+ MOD_DEC_USE_COUNT;
+ return 0;
}
/*
@@ -167,135 +223,142 @@
* Of course, those facts may not be valid anymore (and surely won't...)
* Hey guys, there's some work out there ;-)
*/
-static int raid0_map (struct md_dev *mddev, kdev_t *rdev,
- unsigned long *rsector, unsigned long size)
+static int raid0_make_request (mddev_t *mddev, int rw, struct buffer_head * bh)
{
- struct raid0_data *data=(struct raid0_data *) mddev->private;
- static struct raid0_hash *hash;
- struct strip_zone *zone;
- struct real_dev *tmp_dev;
- int blk_in_chunk, factor, chunk, chunk_size;
- long block, rblock;
-
- factor=FACTOR(mddev);
- chunk_size=(1UL << FACTOR_SHIFT(factor));
- block=*rsector >> 1;
- hash=data->hash_table+(block/data->smallest->size);
-
- if (hash - data->hash_table > data->nr_zones)
- {
- printk(KERN_DEBUG "raid0_map: invalid block %ul\n", block);
- return -1;
- }
-
- /* Sanity check */
- if ((chunk_size*2)<(*rsector % (chunk_size*2))+size)
- {
- printk ("raid0_convert : can't convert block across chunks or bigger than %dk %ld %ld\n", chunk_size, *rsector, size);
- return (-1);
- }
-
- if (block >= (hash->zone0->size +
- hash->zone0->zone_offset))
- {
- if (!hash->zone1)
- {
- printk ("raid0_convert : hash->zone1==NULL for block %ld\n", block);
- return (-1);
- }
-
- zone=hash->zone1;
- }
- else
- zone=hash->zone0;
+ unsigned long size = bh->b_size >> 10;
+ raid0_conf_t *conf = mddev_to_conf(mddev);
+ struct raid0_hash *hash;
+ struct strip_zone *zone;
+ mdk_rdev_t *tmp_dev;
+ int blk_in_chunk, chunksize_bits, chunk, chunk_size;
+ long block, rblock;
+
+ chunk_size = mddev->param.chunk_size >> 10;
+ chunksize_bits = ffz(~chunk_size);
+ block = bh->b_blocknr * size;
+ hash = conf->hash_table + block / conf->smallest->size;
+
+ /* Sanity check */
+ if (chunk_size < (block % chunk_size) + size)
+ goto bad_map;
+
+ if (!hash)
+ goto bad_hash;
+
+ if (!hash->zone0)
+ goto bad_zone0;
+
+ if (block >= (hash->zone0->size + hash->zone0->zone_offset)) {
+ if (!hash->zone1)
+ goto bad_zone1;
+ zone = hash->zone1;
+ } else
+ zone = hash->zone0;
- blk_in_chunk=block & (chunk_size -1);
- chunk=(block - zone->zone_offset) / (zone->nb_dev<<FACTOR_SHIFT(factor));
- tmp_dev=zone->dev[(block >> FACTOR_SHIFT(factor)) % zone->nb_dev];
- rblock=(chunk << FACTOR_SHIFT(factor)) + blk_in_chunk + zone->dev_offset;
-
- *rdev=tmp_dev->dev;
- *rsector=rblock<<1;
-
- return (0);
+ blk_in_chunk = block & (chunk_size -1);
+ chunk = (block - zone->zone_offset) / (zone->nb_dev << chunksize_bits);
+ tmp_dev = zone->dev[(block >> chunksize_bits) % zone->nb_dev];
+ rblock = (chunk << chunksize_bits) + blk_in_chunk + zone->dev_offset;
+
+ /*
+ * Important, at this point we are not guaranteed to be the only
+ * CPU modifying b_rdev and b_rsector! Only __make_request() later
+ * on serializes the IO. So in 2.4 we must never write temporary
+ * values to bh->b_rdev, like 2.2 and 2.0 did.
+ */
+ bh->b_rdev = tmp_dev->dev;
+ bh->b_rsector = rblock << 1;
+
+ generic_make_request(rw, bh);
+
+ return 0;
+
+bad_map:
+ printk ("raid0_make_request bug: can't convert block across chunks or bigger than %dk %ld %ld\n", chunk_size, bh->b_rsector, size);
+ return -1;
+bad_hash:
+ printk("raid0_make_request bug: hash==NULL for block %ld\n", block);
+ return -1;
+bad_zone0:
+ printk ("raid0_make_request bug: hash->zone0==NULL for block %ld\n", block);
+ return -1;
+bad_zone1:
+ printk ("raid0_make_request bug: hash->zone1==NULL for block %ld\n", block);
+ return -1;
}
-
-static int raid0_status (char *page, int minor, struct md_dev *mddev)
+static int raid0_status (char *page, mddev_t *mddev)
{
- int sz=0;
+ int sz = 0;
#undef MD_DEBUG
#ifdef MD_DEBUG
- int j, k;
- struct raid0_data *data=(struct raid0_data *) mddev->private;
+ int j, k;
+ raid0_conf_t *conf = mddev_to_conf(mddev);
- sz+=sprintf (page+sz, " ");
- for (j=0; j<data->nr_zones; j++)
- {
- sz+=sprintf (page+sz, "[z%d",
- data->hash_table[j].zone0-data->strip_zone);
- if (data->hash_table[j].zone1)
- sz+=sprintf (page+sz, "/z%d] ",
- data->hash_table[j].zone1-data->strip_zone);
- else
- sz+=sprintf (page+sz, "] ");
- }
+ sz += sprintf(page + sz, " ");
+ for (j = 0; j < conf->nr_zones; j++) {
+ sz += sprintf(page + sz, "[z%d",
+ conf->hash_table[j].zone0 - conf->strip_zone);
+ if (conf->hash_table[j].zone1)
+ sz += sprintf(page+sz, "/z%d] ",
+ conf->hash_table[j].zone1 - conf->strip_zone);
+ else
+ sz += sprintf(page+sz, "] ");
+ }
- sz+=sprintf (page+sz, "\n");
+ sz += sprintf(page + sz, "\n");
- for (j=0; j<data->nr_strip_zones; j++)
- {
- sz+=sprintf (page+sz, " z%d=[", j);
- for (k=0; k<data->strip_zone[j].nb_dev; k++)
- sz+=sprintf (page+sz, "%s/",
- partition_name(data->strip_zone[j].dev[k]->dev));
- sz--;
- sz+=sprintf (page+sz, "] zo=%d do=%d s=%d\n",
- data->strip_zone[j].zone_offset,
- data->strip_zone[j].dev_offset,
- data->strip_zone[j].size);
- }
+ for (j = 0; j < conf->nr_strip_zones; j++) {
+ sz += sprintf(page + sz, " z%d=[", j);
+ for (k = 0; k < conf->strip_zone[j].nb_dev; k++)
+ sz += sprintf (page+sz, "%s/", partition_name(
+ conf->strip_zone[j].dev[k]->dev));
+ sz--;
+ sz += sprintf (page+sz, "] zo=%d do=%d s=%d\n",
+ conf->strip_zone[j].zone_offset,
+ conf->strip_zone[j].dev_offset,
+ conf->strip_zone[j].size);
+ }
#endif
- sz+=sprintf (page+sz, " %dk chunks", 1<<FACTOR_SHIFT(FACTOR(mddev)));
- return sz;
+ sz += sprintf(page + sz, " %dk chunks", mddev->param.chunk_size/1024);
+ return sz;
}
-
-static struct md_personality raid0_personality=
+static mdk_personality_t raid0_personality=
{
- "raid0",
- raid0_map,
- NULL, /* no special make_request */
- NULL, /* no special end_request */
- raid0_run,
- raid0_stop,
- raid0_status,
- NULL, /* no ioctls */
- 0,
- NULL, /* no error_handler */
- NULL, /* hot_add_disk */
- NULL, /* hot_remove_disk */
- NULL /* mark_spare */
+ "raid0",
+ NULL, /* no special map */
+ raid0_make_request,
+ NULL, /* no special end_request */
+ raid0_run,
+ raid0_stop,
+ raid0_status,
+ NULL, /* no ioctls */
+ 0,
+ NULL, /* no error_handler */
+ NULL, /* no diskop */
+ NULL, /* no stop resync */
+ NULL /* no restart resync */
};
-
#ifndef MODULE
void raid0_init (void)
{
- register_md_personality (RAID0, &raid0_personality);
+ register_md_personality (RAID0, &raid0_personality);
}
#else
int init_module (void)
{
- return (register_md_personality (RAID0, &raid0_personality));
+ return (register_md_personality (RAID0, &raid0_personality));
}
void cleanup_module (void)
{
- unregister_md_personality (RAID0);
+ unregister_md_personality (RAID0);
}
#endif
+
FUNET's LINUX-ADM group, linux-adm@nic.funet.fi
TCL-scripts by Sam Shen (who was at: slshen@lbl.gov)