2 linear.c : Multiple Devices driver for Linux
3 Copyright (C) 1994-96 Marc ZYNGIER
4 <zyngier@ufr-info-p7.ibp.fr> or
7 Linear mode management functions.
9 This program is free software; you can redistribute it and/or modify
10 it under the terms of the GNU General Public License as published by
11 the Free Software Foundation; either version 2, or (at your option)
14 You should have received a copy of the GNU General Public License
15 (for example /usr/src/linux/COPYING); if not, write to the Free
16 Software Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
19 #include <linux/raid/linear.h>
22 * find which device holds a particular offset
24 static inline dev_info_t
*which_dev(mddev_t
*mddev
, sector_t sector
)
27 linear_conf_t
*conf
= mddev_to_conf(mddev
);
30 * sector_div(a,b) returns the remainer and sets a to a/b
32 sector
>>= conf
->sector_shift
;
33 (void)sector_div(sector
, conf
->spacing
);
34 hash
= conf
->hash_table
[sector
];
36 while (sector
>= hash
->num_sectors
+ hash
->start_sector
)
42 * linear_mergeable_bvec -- tell bio layer if two requests can be merged
44 * @bvm: properties of new bio
45 * @biovec: the request that could be merged to it.
47 * Return amount of bytes we can take at this offset
49 static int linear_mergeable_bvec(struct request_queue
*q
,
50 struct bvec_merge_data
*bvm
,
51 struct bio_vec
*biovec
)
53 mddev_t
*mddev
= q
->queuedata
;
55 unsigned long maxsectors
, bio_sectors
= bvm
->bi_size
>> 9;
56 sector_t sector
= bvm
->bi_sector
+ get_start_sect(bvm
->bi_bdev
);
58 dev0
= which_dev(mddev
, sector
);
59 maxsectors
= dev0
->num_sectors
- (sector
- dev0
->start_sector
);
61 if (maxsectors
< bio_sectors
)
64 maxsectors
-= bio_sectors
;
66 if (maxsectors
<= (PAGE_SIZE
>> 9 ) && bio_sectors
== 0)
67 return biovec
->bv_len
;
68 /* The bytes available at this offset could be really big,
69 * so we cap at 2^31 to avoid overflow */
70 if (maxsectors
> (1 << (31-9)))
72 return maxsectors
<< 9;
75 static void linear_unplug(struct request_queue
*q
)
77 mddev_t
*mddev
= q
->queuedata
;
78 linear_conf_t
*conf
= mddev_to_conf(mddev
);
81 for (i
=0; i
< mddev
->raid_disks
; i
++) {
82 struct request_queue
*r_queue
= bdev_get_queue(conf
->disks
[i
].rdev
->bdev
);
87 static int linear_congested(void *data
, int bits
)
89 mddev_t
*mddev
= data
;
90 linear_conf_t
*conf
= mddev_to_conf(mddev
);
93 for (i
= 0; i
< mddev
->raid_disks
&& !ret
; i
++) {
94 struct request_queue
*q
= bdev_get_queue(conf
->disks
[i
].rdev
->bdev
);
95 ret
|= bdi_congested(&q
->backing_dev_info
, bits
);
100 static linear_conf_t
*linear_conf(mddev_t
*mddev
, int raid_disks
)
106 sector_t min_sectors
;
107 sector_t curr_sector
;
108 struct list_head
*tmp
;
110 conf
= kzalloc (sizeof (*conf
) + raid_disks
*sizeof(dev_info_t
),
116 conf
->array_sectors
= 0;
118 rdev_for_each(rdev
, tmp
, mddev
) {
119 int j
= rdev
->raid_disk
;
120 dev_info_t
*disk
= conf
->disks
+ j
;
122 if (j
< 0 || j
>= raid_disks
|| disk
->rdev
) {
123 printk("linear: disk numbering problem. Aborting!\n");
129 blk_queue_stack_limits(mddev
->queue
,
130 rdev
->bdev
->bd_disk
->queue
);
131 /* as we don't honour merge_bvec_fn, we must never risk
132 * violating it, so limit ->max_sector to one PAGE, as
133 * a one page request is never in violation.
135 if (rdev
->bdev
->bd_disk
->queue
->merge_bvec_fn
&&
136 mddev
->queue
->max_sectors
> (PAGE_SIZE
>>9))
137 blk_queue_max_sectors(mddev
->queue
, PAGE_SIZE
>>9);
139 disk
->num_sectors
= rdev
->size
* 2;
140 conf
->array_sectors
+= rdev
->size
* 2;
144 if (cnt
!= raid_disks
) {
145 printk("linear: not enough drives present. Aborting!\n");
149 min_sectors
= conf
->array_sectors
;
150 sector_div(min_sectors
, PAGE_SIZE
/sizeof(struct dev_info
*));
152 /* min_sectors is the minimum spacing that will fit the hash
153 * table in one PAGE. This may be much smaller than needed.
154 * We find the smallest non-terminal set of consecutive devices
155 * that is larger than min_sectors and use the size of that as
158 conf
->spacing
= conf
->array_sectors
;
159 for (i
=0; i
< cnt
-1 ; i
++) {
162 for (j
= i
; j
< cnt
- 1 && tmp
< min_sectors
; j
++)
163 tmp
+= conf
->disks
[j
].num_sectors
;
164 if (tmp
>= min_sectors
&& tmp
< conf
->spacing
)
168 /* spacing may be too large for sector_div to work with,
169 * so we might need to pre-shift
171 conf
->sector_shift
= 0;
172 if (sizeof(sector_t
) > sizeof(u32
)) {
173 sector_t space
= conf
->spacing
;
174 while (space
> (sector_t
)(~(u32
)0)) {
176 conf
->sector_shift
++;
180 * This code was restructured to work around a gcc-2.95.3 internal
181 * compiler error. Alter it with care.
188 sz
= conf
->array_sectors
>> conf
->sector_shift
;
189 sz
+= 1; /* force round-up */
190 base
= conf
->spacing
>> conf
->sector_shift
;
191 round
= sector_div(sz
, base
);
192 nb_zone
= sz
+ (round
? 1 : 0);
194 BUG_ON(nb_zone
> PAGE_SIZE
/ sizeof(struct dev_info
*));
196 conf
->hash_table
= kmalloc (sizeof (struct dev_info
*) * nb_zone
,
198 if (!conf
->hash_table
)
202 * Here we generate the linear hash table
203 * First calculate the device offsets.
205 conf
->disks
[0].start_sector
= 0;
206 for (i
= 1; i
< raid_disks
; i
++)
207 conf
->disks
[i
].start_sector
=
208 conf
->disks
[i
-1].start_sector
+
209 conf
->disks
[i
-1].num_sectors
;
211 table
= conf
->hash_table
;
213 for (curr_sector
= 0;
214 curr_sector
< conf
->array_sectors
;
215 curr_sector
+= conf
->spacing
) {
217 while (i
< raid_disks
-1 &&
218 curr_sector
>= conf
->disks
[i
+1].start_sector
)
221 *table
++ = conf
->disks
+ i
;
224 if (conf
->sector_shift
) {
225 conf
->spacing
>>= conf
->sector_shift
;
226 /* round spacing up so that when we divide by it,
227 * we err on the side of "too-low", which is safest.
232 BUG_ON(table
- conf
->hash_table
> nb_zone
);
241 static int linear_run (mddev_t
*mddev
)
245 mddev
->queue
->queue_lock
= &mddev
->queue
->__queue_lock
;
246 conf
= linear_conf(mddev
, mddev
->raid_disks
);
250 mddev
->private = conf
;
251 mddev
->array_sectors
= conf
->array_sectors
;
253 blk_queue_merge_bvec(mddev
->queue
, linear_mergeable_bvec
);
254 mddev
->queue
->unplug_fn
= linear_unplug
;
255 mddev
->queue
->backing_dev_info
.congested_fn
= linear_congested
;
256 mddev
->queue
->backing_dev_info
.congested_data
= mddev
;
260 static int linear_add(mddev_t
*mddev
, mdk_rdev_t
*rdev
)
262 /* Adding a drive to a linear array allows the array to grow.
263 * It is permitted if the new drive has a matching superblock
264 * already on it, with raid_disk equal to raid_disks.
265 * It is achieved by creating a new linear_private_data structure
266 * and swapping it in in-place of the current one.
267 * The current one is never freed until the array is stopped.
270 linear_conf_t
*newconf
;
272 if (rdev
->saved_raid_disk
!= mddev
->raid_disks
)
275 rdev
->raid_disk
= rdev
->saved_raid_disk
;
277 newconf
= linear_conf(mddev
,mddev
->raid_disks
+1);
282 newconf
->prev
= mddev_to_conf(mddev
);
283 mddev
->private = newconf
;
285 mddev
->array_sectors
= newconf
->array_sectors
;
286 set_capacity(mddev
->gendisk
, mddev
->array_sectors
);
290 static int linear_stop (mddev_t
*mddev
)
292 linear_conf_t
*conf
= mddev_to_conf(mddev
);
294 blk_sync_queue(mddev
->queue
); /* the unplug fn references 'conf'*/
296 linear_conf_t
*t
= conf
->prev
;
297 kfree(conf
->hash_table
);
305 static int linear_make_request (struct request_queue
*q
, struct bio
*bio
)
307 const int rw
= bio_data_dir(bio
);
308 mddev_t
*mddev
= q
->queuedata
;
312 if (unlikely(bio_barrier(bio
))) {
313 bio_endio(bio
, -EOPNOTSUPP
);
317 cpu
= part_stat_lock();
318 part_stat_inc(cpu
, &mddev
->gendisk
->part0
, ios
[rw
]);
319 part_stat_add(cpu
, &mddev
->gendisk
->part0
, sectors
[rw
],
323 tmp_dev
= which_dev(mddev
, bio
->bi_sector
);
325 if (unlikely(bio
->bi_sector
>= (tmp_dev
->num_sectors
+
326 tmp_dev
->start_sector
)
328 tmp_dev
->start_sector
))) {
329 char b
[BDEVNAME_SIZE
];
331 printk("linear_make_request: Sector %llu out of bounds on "
332 "dev %s: %llu sectors, offset %llu\n",
333 (unsigned long long)bio
->bi_sector
,
334 bdevname(tmp_dev
->rdev
->bdev
, b
),
335 (unsigned long long)tmp_dev
->num_sectors
,
336 (unsigned long long)tmp_dev
->start_sector
);
340 if (unlikely(bio
->bi_sector
+ (bio
->bi_size
>> 9) >
341 tmp_dev
->start_sector
+ tmp_dev
->num_sectors
)) {
342 /* This bio crosses a device boundary, so we have to
348 tmp_dev
->start_sector
+ tmp_dev
->num_sectors
351 if (linear_make_request(q
, &bp
->bio1
))
352 generic_make_request(&bp
->bio1
);
353 if (linear_make_request(q
, &bp
->bio2
))
354 generic_make_request(&bp
->bio2
);
355 bio_pair_release(bp
);
359 bio
->bi_bdev
= tmp_dev
->rdev
->bdev
;
360 bio
->bi_sector
= bio
->bi_sector
- tmp_dev
->start_sector
361 + tmp_dev
->rdev
->data_offset
;
366 static void linear_status (struct seq_file
*seq
, mddev_t
*mddev
)
369 seq_printf(seq
, " %dk rounding", mddev
->chunk_size
/1024);
373 static struct mdk_personality linear_personality
=
376 .level
= LEVEL_LINEAR
,
377 .owner
= THIS_MODULE
,
378 .make_request
= linear_make_request
,
381 .status
= linear_status
,
382 .hot_add_disk
= linear_add
,
385 static int __init
linear_init (void)
387 return register_md_personality (&linear_personality
);
390 static void linear_exit (void)
392 unregister_md_personality (&linear_personality
);
396 module_init(linear_init
);
397 module_exit(linear_exit
);
398 MODULE_LICENSE("GPL");
399 MODULE_ALIAS("md-personality-1"); /* LINEAR - deprecated*/
400 MODULE_ALIAS("md-linear");
401 MODULE_ALIAS("md-level--1");