/*
 * Copyright (C) 2005-2007 Red Hat GmbH
 *
 * A target that delays reads and/or writes and can send
 * them to different devices.
 *
 * This file is released under the GPL.
 */
10 #include <linux/module.h>
11 #include <linux/init.h>
12 #include <linux/blkdev.h>
13 #include <linux/bio.h>
14 #include <linux/slab.h>
16 #include <linux/device-mapper.h>
/* Message prefix for this target; picked up by the device-mapper logging macros such as DMERR(). */
#define DM_MSG_PREFIX "delay"
/*
 * Members of the per-target context that the rest of this file reaches
 * through "struct delay_c *dc".
 *
 * NOTE(review): the "struct delay_c {" header, the closing "};" and several
 * members used elsewhere in this file (may_delay, start_read, read_delay,
 * reads, start_write, write_delay, writes) are not visible in this copy --
 * restore them from the upstream source.
 */
/* Timer armed by queue_timeout(); delay_ctr() installs handle_delayed_timer() as its callback. */
21 struct timer_list delay_timer
;
/* Held by queue_timeout() around the timer_pending()/mod_timer() pair. */
22 struct mutex timer_lock
;
/* "kdelayd" workqueue: allocated in delay_ctr(), destroyed in delay_dtr(). */
23 struct workqueue_struct
*kdelayd_wq
;
/* Work item queued by the timer callback; its handler is flush_expired_bios(). */
24 struct work_struct flush_expired_bios
;
/* List of struct dm_delay_info entries added by delay_bio(); accessed under delayed_bios_lock. */
25 struct list_head delayed_bios
;
/* Device delay_map() uses unless the bio is a write and dev_write is set. */
28 struct dm_dev
*dev_read
;
/* Separate device for writes; may be NULL (delay_map() tests it before use). */
33 struct dm_dev
*dev_write
;
39 struct dm_delay_info
{
40 struct delay_c
*context
;
41 struct list_head list
;
42 unsigned long expires
;
/*
 * File-wide mutex held while a delayed_bios list is modified or walked
 * (delay_bio(), flush_delayed_bios()); the reads/writes counters are
 * adjusted under it as well.
 */
static DEFINE_MUTEX(delayed_bios_lock);
47 static void handle_delayed_timer(unsigned long data
)
49 struct delay_c
*dc
= (struct delay_c
*)data
;
51 queue_work(dc
->kdelayd_wq
, &dc
->flush_expired_bios
);
54 static void queue_timeout(struct delay_c
*dc
, unsigned long expires
)
56 mutex_lock(&dc
->timer_lock
);
58 if (!timer_pending(&dc
->delay_timer
) || expires
< dc
->delay_timer
.expires
)
59 mod_timer(&dc
->delay_timer
, expires
);
61 mutex_unlock(&dc
->timer_lock
);
/*
 * Resubmit released bios with generic_make_request().
 *
 * @bio: bio to submit; both callers in this file pass the value returned
 *       by flush_delayed_bios().
 *
 * NOTE(review): only the signature and the generic_make_request() call are
 * visible in this copy.  The braces and whatever code walks the chain of
 * bios (flush_delayed_bios() returns bio_list_get(), presumably a linked
 * list of bios) are missing -- restore them from the upstream source.
 */
64 static void flush_bios(struct bio
*bio
)
71 generic_make_request(bio
);
/*
 * Unlink delayed bios that are due and hand them back to the caller.
 *
 * @dc:        target context whose delayed_bios list is scanned.
 * @flush_all: non-zero releases every queued bio regardless of its expiry;
 *             zero releases only entries whose expiry has been reached.
 *
 * Returns the result of bio_list_get() on the locally collected bio_list.
 * The caller is expected to submit the bios (see flush_bios()).
 *
 * NOTE(review): this copy has lost lines -- the braces, the "else" between
 * the writes--/reads-- statements, whatever skips the expiry bookkeeping
 * for released entries, and the condition that decides between the two
 * next_expires assignments and guards queue_timeout().  Restore them from
 * the upstream source before building.
 */
76 static struct bio
*flush_delayed_bios(struct delay_c
*dc
, int flush_all
)
78 struct dm_delay_info
*delayed
, *next
;
79 unsigned long next_expires
= 0;
81 struct bio_list flush_bios
= { };
/* The list walk, the unlinking and the counter updates all happen under delayed_bios_lock. */
83 mutex_lock(&delayed_bios_lock
);
/* _safe variant: entries are removed from the list while iterating. */
84 list_for_each_entry_safe(delayed
, next
, &dc
->delayed_bios
, list
) {
85 if (flush_all
|| time_after_eq(jiffies
, delayed
->expires
)) {
/* Recover the bio that owns this per-bio data area. */
86 struct bio
*bio
= dm_bio_from_per_bio_data(delayed
,
87 sizeof(struct dm_delay_info
));
88 list_del(&delayed
->list
);
89 bio_list_add(&flush_bios
, bio
);
/* Drop the per-direction counter reported by delay_status(). */
90 if ((bio_data_dir(bio
) == WRITE
))
91 delayed
->context
->writes
--;
93 delayed
->context
->reads
--;
/* Track the expiry of entries that stay queued (first assignment, then the minimum). */
99 next_expires
= delayed
->expires
;
101 next_expires
= min(next_expires
, delayed
->expires
);
104 mutex_unlock(&delayed_bios_lock
);
/* Re-arm the timer for the entries still queued; done after dropping delayed_bios_lock. */
107 queue_timeout(dc
, next_expires
);
109 return bio_list_get(&flush_bios
);
112 static void flush_expired_bios(struct work_struct
*work
)
116 dc
= container_of(work
, struct delay_c
, flush_expired_bios
);
117 flush_bios(flush_delayed_bios(dc
, 0));
/*
 * Mapping parameters:
 *    <device> <offset> <delay> [<write_device> <write_offset> <write_delay>]
 *
 * With separate write parameters, the first set is only used for reads.
 * Offsets are specified in sectors.
 * Delays are specified in milliseconds.
 */
/*
 * Constructor: parse the table line and set up the target's struct delay_c.
 *
 * @ti:   target being constructed; ti->error receives a message on failure.
 * @argc: number of arguments; anything other than 3 or 6 is rejected.
 * @argv: <device> <offset> <delay> [<write_device> <write_offset> <write_delay>]
 *
 * NOTE(review): this copy of the function has lost many lines -- the braces,
 * the declarations of dc, ret and dummy, every return/goto, the error
 * labels, the trailing arguments of both dm_get_device() calls and the
 * checks of their results are not visible.  Restore them from the upstream
 * source before building.
 */
128 static int delay_ctr(struct dm_target
*ti
, unsigned int argc
, char **argv
)
131 unsigned long long tmpll
;
135 if (argc
!= 3 && argc
!= 6) {
136 ti
->error
= "Requires exactly 3 or 6 arguments";
/* kmalloc() does not zero the context, so the fields are initialised one by one below. */
140 dc
= kmalloc(sizeof(*dc
), GFP_KERNEL
);
142 ti
->error
= "Cannot allocate context";
146 dc
->reads
= dc
->writes
= 0;
/* "%llu%c" with a required result of exactly 1 rejects trailing characters after the number. */
149 if (sscanf(argv
[1], "%llu%c", &tmpll
, &dummy
) != 1) {
150 ti
->error
= "Invalid device sector";
153 dc
->start_read
= tmpll
;
155 if (sscanf(argv
[2], "%u%c", &dc
->read_delay
, &dummy
) != 1) {
156 ti
->error
= "Invalid delay";
160 ret
= dm_get_device(ti
, argv
[0], dm_table_get_mode(ti
->table
),
163 ti
->error
= "Device lookup failed";
/* NOTE(review): presumably the 3-argument case (no separate write device); the guarding condition is not visible. */
168 dc
->dev_write
= NULL
;
/* Second argument triple: write offset, write delay, write device. */
172 if (sscanf(argv
[4], "%llu%c", &tmpll
, &dummy
) != 1) {
173 ti
->error
= "Invalid write device sector";
176 dc
->start_write
= tmpll
;
178 if (sscanf(argv
[5], "%u%c", &dc
->write_delay
, &dummy
) != 1) {
179 ti
->error
= "Invalid write delay";
183 ret
= dm_get_device(ti
, argv
[3], dm_table_get_mode(ti
->table
),
186 ti
->error
= "Write device lookup failed";
/* Workqueue on which the timer callback queues the flush work. */
192 dc
->kdelayd_wq
= alloc_workqueue("kdelayd", WQ_MEM_RECLAIM
, 0);
193 if (!dc
->kdelayd_wq
) {
194 DMERR("Couldn't start kdelayd");
/* The timer callback gets the context pointer back as its unsigned long argument. */
198 setup_timer(&dc
->delay_timer
, handle_delayed_timer
, (unsigned long)dc
);
200 INIT_WORK(&dc
->flush_expired_bios
, flush_expired_bios
);
201 INIT_LIST_HEAD(&dc
->delayed_bios
);
202 mutex_init(&dc
->timer_lock
);
203 atomic_set(&dc
->may_delay
, 1);
/* per_io_data_size reserves room for one struct dm_delay_info per bio (see delay_bio()). */
205 ti
->num_flush_bios
= 1;
206 ti
->num_discard_bios
= 1;
207 ti
->per_io_data_size
= sizeof(struct dm_delay_info
);
/* NOTE(review): presumably the error-unwind path releasing the devices taken above; its labels are not visible. */
213 dm_put_device(ti
, dc
->dev_write
);
215 dm_put_device(ti
, dc
->dev_read
);
/*
 * Destructor: tear down what delay_ctr() set up.
 *
 * @ti: target being destroyed; ti->private is its struct delay_c.
 *
 * Destroys the kdelayd workqueue and drops the device references.
 *
 * NOTE(review): lines are missing from this copy (braces, and original
 * lines between/after the visible statements).  delay_ctr() can leave
 * dev_write NULL, so the second dm_put_device() presumably sits behind a
 * NULL check, and the context allocated with kmalloc() presumably gets
 * freed here -- confirm against the upstream source.
 */
221 static void delay_dtr(struct dm_target
*ti
)
223 struct delay_c
*dc
= ti
->private;
225 destroy_workqueue(dc
->kdelayd_wq
);
227 dm_put_device(ti
, dc
->dev_read
);
230 dm_put_device(ti
, dc
->dev_write
);
/*
 * Queue @bio for delayed submission, or tell the caller to pass it on now.
 *
 * @dc:    target context.
 * @delay: delay in milliseconds (converted with msecs_to_jiffies()).
 * @bio:   bio that delay_map() has already redirected.
 *
 * Returns DM_MAPIO_REMAPPED when @delay is 0 or dc->may_delay is clear
 * (nothing is queued); otherwise DM_MAPIO_SUBMITTED after the bio's
 * dm_delay_info has been appended to dc->delayed_bios and the timer armed.
 *
 * NOTE(review): the braces and the body of the "bio_data_dir(bio) == WRITE"
 * test are not visible in this copy.  flush_delayed_bios() decrements
 * writes/reads, so the matching increments presumably belong here; as the
 * text stands, list_add_tail() would become the body of the if.  Confirm
 * against the upstream source.
 */
235 static int delay_bio(struct delay_c
*dc
, int delay
, struct bio
*bio
)
237 struct dm_delay_info
*delayed
;
238 unsigned long expires
= 0;
240 if (!delay
|| !atomic_read(&dc
->may_delay
))
241 return DM_MAPIO_REMAPPED
;
/* Per-bio area sized by ti->per_io_data_size in delay_ctr(). */
243 delayed
= dm_per_bio_data(bio
, sizeof(struct dm_delay_info
));
245 delayed
->context
= dc
;
246 delayed
->expires
= expires
= jiffies
+ msecs_to_jiffies(delay
);
248 mutex_lock(&delayed_bios_lock
);
250 if (bio_data_dir(bio
) == WRITE
)
255 list_add_tail(&delayed
->list
, &dc
->delayed_bios
);
257 mutex_unlock(&delayed_bios_lock
);
/* Arm the timer after dropping delayed_bios_lock; queue_timeout() takes its own lock. */
259 queue_timeout(dc
, expires
);
261 return DM_MAPIO_SUBMITTED
;
264 static void delay_presuspend(struct dm_target
*ti
)
266 struct delay_c
*dc
= ti
->private;
268 atomic_set(&dc
->may_delay
, 0);
269 del_timer_sync(&dc
->delay_timer
);
270 flush_bios(flush_delayed_bios(dc
, 1));
273 static void delay_resume(struct dm_target
*ti
)
275 struct delay_c
*dc
= ti
->private;
277 atomic_set(&dc
->may_delay
, 1);
280 static int delay_map(struct dm_target
*ti
, struct bio
*bio
)
282 struct delay_c
*dc
= ti
->private;
284 if ((bio_data_dir(bio
) == WRITE
) && (dc
->dev_write
)) {
285 bio_set_dev(bio
, dc
->dev_write
->bdev
);
286 if (bio_sectors(bio
))
287 bio
->bi_iter
.bi_sector
= dc
->start_write
+
288 dm_target_offset(ti
, bio
->bi_iter
.bi_sector
);
290 return delay_bio(dc
, dc
->write_delay
, bio
);
293 bio_set_dev(bio
, dc
->dev_read
->bdev
);
294 bio
->bi_iter
.bi_sector
= dc
->start_read
+
295 dm_target_offset(ti
, bio
->bi_iter
.bi_sector
);
297 return delay_bio(dc
, dc
->read_delay
, bio
);
/*
 * Status hook: report counters or the table line.
 *
 * @ti:           target to report on.
 * @type:         STATUSTYPE_INFO emits "<reads> <writes>" from the context
 *                counters; STATUSTYPE_TABLE emits the device name, start
 *                sector and a third value per device.
 * @status_flags: not referenced in the visible code.
 * @result:       output buffer -- presumably consumed by DMEMIT(); confirm.
 * @maxlen:       size of @result -- presumably consumed by DMEMIT(); confirm.
 *
 * NOTE(review): this copy has lost lines -- the braces, the switch statement
 * and its breaks, the trailing DMEMIT() arguments (presumably the read and
 * write delays matching the "%u") and the check for an optional write
 * device before dc->dev_write->name is dereferenced.  Restore them from the
 * upstream source before building.
 */
300 static void delay_status(struct dm_target
*ti
, status_type_t type
,
301 unsigned status_flags
, char *result
, unsigned maxlen
)
303 struct delay_c
*dc
= ti
->private;
307 case STATUSTYPE_INFO
:
308 DMEMIT("%u %u", dc
->reads
, dc
->writes
);
311 case STATUSTYPE_TABLE
:
312 DMEMIT("%s %llu %u", dc
->dev_read
->name
,
313 (unsigned long long) dc
->start_read
,
316 DMEMIT(" %s %llu %u", dc
->dev_write
->name
,
317 (unsigned long long) dc
->start_write
,
/*
 * Report the underlying device(s) of this target to @fn.
 *
 * @ti:   target whose devices are iterated.
 * @fn:   callout, invoked as fn(ti, dev, start, ti->len, data).
 * @data: opaque pointer passed through to @fn.
 *
 * @fn is called for dev_read/start_read and for dev_write/start_write.
 *
 * NOTE(review): the braces, the declaration of ret, any check of the first
 * result, the guard for a missing write device (dev_write may be NULL) and
 * the return statement are not visible in this copy -- restore them from
 * the upstream source.
 */
323 static int delay_iterate_devices(struct dm_target
*ti
,
324 iterate_devices_callout_fn fn
, void *data
)
326 struct delay_c
*dc
= ti
->private;
329 ret
= fn(ti
, dc
->dev_read
, dc
->start_read
, ti
->len
, data
);
334 ret
= fn(ti
, dc
->dev_write
, dc
->start_write
, ti
->len
, data
);
/*
 * Target type descriptor passed to dm_register_target() and
 * dm_unregister_target().
 *
 * NOTE(review): some initialisers are missing from this copy -- the target
 * name, the hooks for delay_ctr(), delay_dtr() and delay_map() (defined
 * above but not referenced here) and the closing "};".  Restore them from
 * the upstream source.
 */
340 static struct target_type delay_target
= {
342 .version
= {1, 2, 1},
343 .features
= DM_TARGET_PASSES_INTEGRITY
,
344 .module
= THIS_MODULE
,
348 .presuspend
= delay_presuspend
,
349 .resume
= delay_resume
,
350 .status
= delay_status
,
351 .iterate_devices
= delay_iterate_devices
,
/*
 * Module init: register the delay target with device-mapper.
 *
 * Logs "register failed <r>" through DMERR() with the value returned by
 * dm_register_target().
 *
 * NOTE(review): the braces, the declaration of r, the condition guarding
 * the DMERR() call and the return statements are not visible in this copy
 * -- restore them from the upstream source.
 */
354 static int __init
dm_delay_init(void)
358 r
= dm_register_target(&delay_target
);
360 DMERR("register failed %d", r
);
370 static void __exit
dm_delay_exit(void)
372 dm_unregister_target(&delay_target
);
376 module_init(dm_delay_init
);
377 module_exit(dm_delay_exit
);
379 MODULE_DESCRIPTION(DM_NAME
" delay target");
380 MODULE_AUTHOR("Heinz Mauelshagen <mauelshagen@redhat.com>");
381 MODULE_LICENSE("GPL");