1 /*
2 raid0.c : Multiple Devices driver for Linux
3 Copyright (C) 1994-96 Marc ZYNGIER
4 <zyngier@ufr-info-p7.ibp.fr> or
5 <maz@gloups.fdn.fr>
6 Copyright (C) 1999, 2000 Ingo Molnar, Red Hat
7
8
9 RAID-0 management functions.
10
11 This program is free software; you can redistribute it and/or modify
12 it under the terms of the GNU General Public License as published by
13 the Free Software Foundation; either version 2, or (at your option)
14 any later version.
15
16 You should have received a copy of the GNU General Public License
17 (for example /usr/src/linux/COPYING); if not, write to the Free
18 Software Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
19 */
20
21 #include <linux/module.h>
22 #include <linux/raid/raid0.h>
23
24 #define MAJOR_NR MD_MAJOR
25 #define MD_DRIVER
26 #define MD_PERSONALITY
27
create_strip_zones(mddev_t * mddev)28 static int create_strip_zones (mddev_t *mddev)
29 {
30 int i, c, j, j1, j2;
31 unsigned long current_offset, curr_zone_offset;
32 raid0_conf_t *conf = mddev_to_conf(mddev);
33 mdk_rdev_t *smallest, *rdev1, *rdev2, *rdev;
34
35 /*
36 * The number of 'same size groups'
37 */
38 conf->nr_strip_zones = 0;
39
40 ITERATE_RDEV_ORDERED(mddev,rdev1,j1) {
41 printk("raid0: looking at %s\n", partition_name(rdev1->dev));
42 c = 0;
43 ITERATE_RDEV_ORDERED(mddev,rdev2,j2) {
44 printk("raid0: comparing %s(%ld) with %s(%ld)\n", partition_name(rdev1->dev), rdev1->size, partition_name(rdev2->dev), rdev2->size);
45 if (rdev2 == rdev1) {
46 printk("raid0: END\n");
47 break;
48 }
49 if (rdev2->size == rdev1->size)
50 {
51 /*
52 * Not unique, dont count it as a new
53 * group
54 */
55 printk("raid0: EQUAL\n");
56 c = 1;
57 break;
58 }
59 printk("raid0: NOT EQUAL\n");
60 }
61 if (!c) {
62 printk("raid0: ==> UNIQUE\n");
63 conf->nr_strip_zones++;
64 printk("raid0: %d zones\n", conf->nr_strip_zones);
65 }
66 }
67 printk("raid0: FINAL %d zones\n", conf->nr_strip_zones);
68
69 conf->strip_zone = vmalloc(sizeof(struct strip_zone)*
70 conf->nr_strip_zones);
71 if (!conf->strip_zone)
72 return 1;
73
74
75 conf->smallest = NULL;
76 current_offset = 0;
77 curr_zone_offset = 0;
78
79 for (i = 0; i < conf->nr_strip_zones; i++)
80 {
81 struct strip_zone *zone = conf->strip_zone + i;
82
83 printk("raid0: zone %d\n", i);
84 zone->dev_offset = current_offset;
85 smallest = NULL;
86 c = 0;
87
88 ITERATE_RDEV_ORDERED(mddev,rdev,j) {
89
90 printk("raid0: checking %s ...", partition_name(rdev->dev));
91 if (rdev->size > current_offset)
92 {
93 printk(" contained as device %d\n", c);
94 zone->dev[c] = rdev;
95 c++;
96 if (!smallest || (rdev->size <smallest->size)) {
97 smallest = rdev;
98 printk(" (%ld) is smallest!.\n", rdev->size);
99 }
100 } else
101 printk(" nope.\n");
102 }
103
104 zone->nb_dev = c;
105 zone->size = (smallest->size - current_offset) * c;
106 printk("raid0: zone->nb_dev: %d, size: %ld\n",zone->nb_dev,zone->size);
107
108 if (!conf->smallest || (zone->size < conf->smallest->size))
109 conf->smallest = zone;
110
111 zone->zone_offset = curr_zone_offset;
112 curr_zone_offset += zone->size;
113
114 current_offset = smallest->size;
115 printk("raid0: current zone offset: %ld\n", current_offset);
116 }
117 printk("raid0: done.\n");
118 return 0;
119 }
120
raid0_run(mddev_t * mddev)121 static int raid0_run (mddev_t *mddev)
122 {
123 unsigned long cur=0, i=0, size, zone0_size, nb_zone;
124 raid0_conf_t *conf;
125
126 MOD_INC_USE_COUNT;
127
128 conf = vmalloc(sizeof (raid0_conf_t));
129 if (!conf)
130 goto out;
131 mddev->private = (void *)conf;
132
133 if (md_check_ordering(mddev)) {
134 printk("raid0: disks are not ordered, aborting!\n");
135 goto out_free_conf;
136 }
137
138 if (create_strip_zones (mddev))
139 goto out_free_conf;
140
141 printk("raid0 : md_size is %d blocks.\n", md_size[mdidx(mddev)]);
142 printk("raid0 : conf->smallest->size is %ld blocks.\n", conf->smallest->size);
143 nb_zone = md_size[mdidx(mddev)]/conf->smallest->size +
144 (md_size[mdidx(mddev)] % conf->smallest->size ? 1 : 0);
145 printk("raid0 : nb_zone is %ld.\n", nb_zone);
146 conf->nr_zones = nb_zone;
147
148 printk("raid0 : Allocating %ld bytes for hash.\n",
149 nb_zone*sizeof(struct raid0_hash));
150
151 conf->hash_table = vmalloc (sizeof (struct raid0_hash)*nb_zone);
152 if (!conf->hash_table)
153 goto out_free_zone_conf;
154 size = conf->strip_zone[cur].size;
155
156 i = 0;
157 while (cur < conf->nr_strip_zones) {
158 conf->hash_table[i].zone0 = conf->strip_zone + cur;
159
160 /*
161 * If we completely fill the slot
162 */
163 if (size >= conf->smallest->size) {
164 conf->hash_table[i++].zone1 = NULL;
165 size -= conf->smallest->size;
166
167 if (!size) {
168 if (++cur == conf->nr_strip_zones)
169 continue;
170 size = conf->strip_zone[cur].size;
171 }
172 continue;
173 }
174 if (++cur == conf->nr_strip_zones) {
175 /*
176 * Last dev, set unit1 as NULL
177 */
178 conf->hash_table[i].zone1=NULL;
179 continue;
180 }
181
182 /*
183 * Here we use a 2nd dev to fill the slot
184 */
185 zone0_size = size;
186 size = conf->strip_zone[cur].size;
187 conf->hash_table[i++].zone1 = conf->strip_zone + cur;
188 size -= (conf->smallest->size - zone0_size);
189 }
190 return 0;
191
192 out_free_zone_conf:
193 vfree(conf->strip_zone);
194 conf->strip_zone = NULL;
195
196 out_free_conf:
197 vfree(conf);
198 mddev->private = NULL;
199 out:
200 MOD_DEC_USE_COUNT;
201 return 1;
202 }
203
raid0_stop(mddev_t * mddev)204 static int raid0_stop (mddev_t *mddev)
205 {
206 raid0_conf_t *conf = mddev_to_conf(mddev);
207
208 vfree (conf->hash_table);
209 conf->hash_table = NULL;
210 vfree (conf->strip_zone);
211 conf->strip_zone = NULL;
212 vfree (conf);
213 mddev->private = NULL;
214
215 MOD_DEC_USE_COUNT;
216 return 0;
217 }
218
219 /*
220 * FIXME - We assume some things here :
221 * - requested buffers NEVER bigger than chunk size,
222 * - requested buffers NEVER cross stripes limits.
223 * Of course, those facts may not be valid anymore (and surely won't...)
224 * Hey guys, there's some work out there ;-)
225 */
raid0_make_request(mddev_t * mddev,int rw,struct buffer_head * bh)226 static int raid0_make_request (mddev_t *mddev,
227 int rw, struct buffer_head * bh)
228 {
229 unsigned int sect_in_chunk, chunksize_bits, chunk_size;
230 raid0_conf_t *conf = mddev_to_conf(mddev);
231 struct raid0_hash *hash;
232 struct strip_zone *zone;
233 mdk_rdev_t *tmp_dev;
234 unsigned long chunk, block, rsect;
235
236 chunk_size = mddev->param.chunk_size >> 10;
237 chunksize_bits = ffz(~chunk_size);
238 block = bh->b_rsector >> 1;
239 hash = conf->hash_table + block / conf->smallest->size;
240
241 /* Sanity check */
242 if (chunk_size < (block % chunk_size) + (bh->b_size >> 10))
243 goto bad_map;
244
245 if (!hash)
246 goto bad_hash;
247
248 if (!hash->zone0)
249 goto bad_zone0;
250
251 if (block >= (hash->zone0->size + hash->zone0->zone_offset)) {
252 if (!hash->zone1)
253 goto bad_zone1;
254 zone = hash->zone1;
255 } else
256 zone = hash->zone0;
257
258 sect_in_chunk = bh->b_rsector & ((chunk_size<<1) -1);
259 chunk = (block - zone->zone_offset) / (zone->nb_dev << chunksize_bits);
260 tmp_dev = zone->dev[(block >> chunksize_bits) % zone->nb_dev];
261 rsect = (((chunk << chunksize_bits) + zone->dev_offset)<<1)
262 + sect_in_chunk;
263
264 /*
265 * The new BH_Lock semantics in ll_rw_blk.c guarantee that this
266 * is the only IO operation happening on this bh.
267 */
268 bh->b_rdev = tmp_dev->dev;
269 bh->b_rsector = rsect;
270
271 /*
272 * Let the main block layer submit the IO and resolve recursion:
273 */
274 return 1;
275
276 bad_map:
277 printk ("raid0_make_request bug: can't convert block across chunks or bigger than %dk %ld %d\n", chunk_size, bh->b_rsector, bh->b_size >> 10);
278 goto outerr;
279 bad_hash:
280 printk("raid0_make_request bug: hash==NULL for block %ld\n", block);
281 goto outerr;
282 bad_zone0:
283 printk ("raid0_make_request bug: hash->zone0==NULL for block %ld\n", block);
284 goto outerr;
285 bad_zone1:
286 printk ("raid0_make_request bug: hash->zone1==NULL for block %ld\n", block);
287 outerr:
288 buffer_IO_error(bh);
289 return 0;
290 }
291
raid0_status(struct seq_file * seq,mddev_t * mddev)292 static void raid0_status (struct seq_file *seq, mddev_t *mddev)
293 {
294 #undef MD_DEBUG
295 #ifdef MD_DEBUG
296 int j, k;
297 raid0_conf_t *conf = mddev_to_conf(mddev);
298
299 seq_printf(seq, " ");
300 for (j = 0; j < conf->nr_zones; j++) {
301 seq_printf(seq, "[z%d",
302 conf->hash_table[j].zone0 - conf->strip_zone);
303 if (conf->hash_table[j].zone1)
304 seq_printf(seq, "/z%d] ",
305 conf->hash_table[j].zone1 - conf->strip_zone);
306 else
307 seq_printf(seq, "] ");
308 }
309
310 seq_printf(seq, "\n");
311
312 for (j = 0; j < conf->nr_strip_zones; j++) {
313 seq_printf(seq, " z%d=[", j);
314 for (k = 0; k < conf->strip_zone[j].nb_dev; k++)
315 seq_printf (seq, "%s/", partition_name(
316 conf->strip_zone[j].dev[k]->dev));
317
318 seq_printf (seq, "] zo=%d do=%d s=%d\n",
319 conf->strip_zone[j].zone_offset,
320 conf->strip_zone[j].dev_offset,
321 conf->strip_zone[j].size);
322 }
323 #endif
324 seq_printf(seq, " %dk chunks", mddev->param.chunk_size/1024);
325 return;
326 }
327
328 static mdk_personality_t raid0_personality=
329 {
330 name: "raid0",
331 make_request: raid0_make_request,
332 run: raid0_run,
333 stop: raid0_stop,
334 status: raid0_status,
335 };
336
raid0_init(void)337 static int md__init raid0_init (void)
338 {
339 return register_md_personality (RAID0, &raid0_personality);
340 }
341
raid0_exit(void)342 static void raid0_exit (void)
343 {
344 unregister_md_personality (RAID0);
345 }
346
347 module_init(raid0_init);
348 module_exit(raid0_exit);
349 MODULE_LICENSE("GPL");
350