2 * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
3 * Copyright (C) 2004-2006 Red Hat, Inc. All rights reserved.
5 * This copyrighted material is made available to anyone wishing to use,
6 * modify, copy, or redistribute it subject to the terms and conditions
7 * of the GNU General Public License version 2.
10 #include <linux/sched.h>
11 #include <linux/slab.h>
12 #include <linux/spinlock.h>
13 #include <linux/completion.h>
14 #include <linux/buffer_head.h>
15 #include <linux/gfs2_ondisk.h>
16 #include <linux/crc32.h>
17 #include <linux/lm_interface.h>
32 * gfs2_struct2blk - compute stuff
33 * @sdp: the filesystem
34 * @nstruct: the number of structures
35 * @ssize: the size of the structures
37 * Compute the number of log descriptor blocks needed to hold a certain number
38 * of structures of a certain size.
40 * Returns: the number of blocks needed (minimum is always 1)
43 unsigned int gfs2_struct2blk(struct gfs2_sbd
*sdp
, unsigned int nstruct
,
47 unsigned int first
, second
;
50 first
= (sdp
->sd_sb
.sb_bsize
- sizeof(struct gfs2_log_descriptor
)) / ssize
;
52 if (nstruct
> first
) {
53 second
= (sdp
->sd_sb
.sb_bsize
-
54 sizeof(struct gfs2_meta_header
)) / ssize
;
55 blks
+= DIV_ROUND_UP(nstruct
- first
, second
);
62 * gfs2_ail1_start_one - Start I/O on a part of the AIL
63 * @sdp: the filesystem
64 * @tr: the part of the AIL
68 static void gfs2_ail1_start_one(struct gfs2_sbd
*sdp
, struct gfs2_ail
*ai
)
70 struct gfs2_bufdata
*bd
, *s
;
71 struct buffer_head
*bh
;
74 BUG_ON(!spin_is_locked(&sdp
->sd_log_lock
));
79 list_for_each_entry_safe_reverse(bd
, s
, &ai
->ai_ail1_list
,
83 gfs2_assert(sdp
, bd
->bd_ail
== ai
);
85 if (!buffer_busy(bh
)) {
86 if (!buffer_uptodate(bh
)) {
88 gfs2_io_error_bh(sdp
, bh
);
91 list_move(&bd
->bd_ail_st_list
, &ai
->ai_ail2_list
);
95 if (!buffer_dirty(bh
))
98 list_move(&bd
->bd_ail_st_list
, &ai
->ai_ail1_list
);
100 gfs2_log_unlock(sdp
);
102 ll_rw_block(WRITE
, 1, &bh
);
112 * gfs2_ail1_empty_one - Check whether or not a trans in the AIL has been synced
113 * @sdp: the filesystem
118 static int gfs2_ail1_empty_one(struct gfs2_sbd
*sdp
, struct gfs2_ail
*ai
, int flags
)
120 struct gfs2_bufdata
*bd
, *s
;
121 struct buffer_head
*bh
;
123 list_for_each_entry_safe_reverse(bd
, s
, &ai
->ai_ail1_list
,
127 gfs2_assert(sdp
, bd
->bd_ail
== ai
);
129 if (buffer_busy(bh
)) {
136 if (!buffer_uptodate(bh
))
137 gfs2_io_error_bh(sdp
, bh
);
139 list_move(&bd
->bd_ail_st_list
, &ai
->ai_ail2_list
);
142 return list_empty(&ai
->ai_ail1_list
);
145 void gfs2_ail1_start(struct gfs2_sbd
*sdp
, int flags
)
147 struct list_head
*head
= &sdp
->sd_ail1_list
;
149 struct list_head
*first
;
150 struct gfs2_ail
*first_ai
, *ai
, *tmp
;
154 if (list_empty(head
)) {
155 gfs2_log_unlock(sdp
);
158 sync_gen
= sdp
->sd_ail_sync_gen
++;
161 first_ai
= list_entry(first
, struct gfs2_ail
, ai_list
);
162 first_ai
->ai_sync_gen
= sync_gen
;
163 gfs2_ail1_start_one(sdp
, first_ai
); /* This may drop log lock */
169 if (first
&& (head
->prev
!= first
||
170 gfs2_ail1_empty_one(sdp
, first_ai
, 0)))
174 list_for_each_entry_safe_reverse(ai
, tmp
, head
, ai_list
) {
175 if (ai
->ai_sync_gen
>= sync_gen
)
177 ai
->ai_sync_gen
= sync_gen
;
178 gfs2_ail1_start_one(sdp
, ai
); /* This may drop log lock */
184 gfs2_log_unlock(sdp
);
187 int gfs2_ail1_empty(struct gfs2_sbd
*sdp
, int flags
)
189 struct gfs2_ail
*ai
, *s
;
194 list_for_each_entry_safe_reverse(ai
, s
, &sdp
->sd_ail1_list
, ai_list
) {
195 if (gfs2_ail1_empty_one(sdp
, ai
, flags
))
196 list_move(&ai
->ai_list
, &sdp
->sd_ail2_list
);
197 else if (!(flags
& DIO_ALL
))
201 ret
= list_empty(&sdp
->sd_ail1_list
);
203 gfs2_log_unlock(sdp
);
210 * gfs2_ail2_empty_one - Check whether or not a trans in the AIL has been synced
211 * @sdp: the filesystem
216 static void gfs2_ail2_empty_one(struct gfs2_sbd
*sdp
, struct gfs2_ail
*ai
)
218 struct list_head
*head
= &ai
->ai_ail2_list
;
219 struct gfs2_bufdata
*bd
;
221 while (!list_empty(head
)) {
222 bd
= list_entry(head
->prev
, struct gfs2_bufdata
,
224 gfs2_assert(sdp
, bd
->bd_ail
== ai
);
226 list_del(&bd
->bd_ail_st_list
);
227 list_del(&bd
->bd_ail_gl_list
);
228 atomic_dec(&bd
->bd_gl
->gl_ail_count
);
233 static void ail2_empty(struct gfs2_sbd
*sdp
, unsigned int new_tail
)
235 struct gfs2_ail
*ai
, *safe
;
236 unsigned int old_tail
= sdp
->sd_log_tail
;
237 int wrap
= (new_tail
< old_tail
);
242 list_for_each_entry_safe(ai
, safe
, &sdp
->sd_ail2_list
, ai_list
) {
243 a
= (old_tail
<= ai
->ai_first
);
244 b
= (ai
->ai_first
< new_tail
);
245 rm
= (wrap
) ? (a
|| b
) : (a
&& b
);
249 gfs2_ail2_empty_one(sdp
, ai
);
250 list_del(&ai
->ai_list
);
251 gfs2_assert_warn(sdp
, list_empty(&ai
->ai_ail1_list
));
252 gfs2_assert_warn(sdp
, list_empty(&ai
->ai_ail2_list
));
256 gfs2_log_unlock(sdp
);
260 * gfs2_log_reserve - Make a log reservation
261 * @sdp: The GFS2 superblock
262 * @blks: The number of blocks to reserve
267 int gfs2_log_reserve(struct gfs2_sbd
*sdp
, unsigned int blks
)
269 unsigned int try = 0;
271 if (gfs2_assert_warn(sdp
, blks
) ||
272 gfs2_assert_warn(sdp
, blks
<= sdp
->sd_jdesc
->jd_blocks
))
275 mutex_lock(&sdp
->sd_log_reserve_mutex
);
277 while(sdp
->sd_log_blks_free
<= blks
) {
278 gfs2_log_unlock(sdp
);
279 gfs2_ail1_empty(sdp
, 0);
280 gfs2_log_flush(sdp
, NULL
);
283 gfs2_ail1_start(sdp
, 0);
286 sdp
->sd_log_blks_free
-= blks
;
287 gfs2_log_unlock(sdp
);
288 mutex_unlock(&sdp
->sd_log_reserve_mutex
);
290 down_read(&sdp
->sd_log_flush_lock
);
296 * gfs2_log_release - Release a given number of log blocks
297 * @sdp: The GFS2 superblock
298 * @blks: The number of blocks
302 void gfs2_log_release(struct gfs2_sbd
*sdp
, unsigned int blks
)
306 sdp
->sd_log_blks_free
+= blks
;
307 gfs2_assert_withdraw(sdp
,
308 sdp
->sd_log_blks_free
<= sdp
->sd_jdesc
->jd_blocks
);
309 gfs2_log_unlock(sdp
);
310 up_read(&sdp
->sd_log_flush_lock
);
313 static u64
log_bmap(struct gfs2_sbd
*sdp
, unsigned int lbn
)
315 struct inode
*inode
= sdp
->sd_jdesc
->jd_inode
;
317 struct buffer_head bh_map
= { .b_state
= 0, .b_blocknr
= 0 };
319 bh_map
.b_size
= 1 << inode
->i_blkbits
;
320 error
= gfs2_block_map(inode
, lbn
, 0, &bh_map
);
321 if (error
|| !bh_map
.b_blocknr
)
322 printk(KERN_INFO
"error=%d, dbn=%llu lbn=%u", error
, bh_map
.b_blocknr
, lbn
);
323 gfs2_assert_withdraw(sdp
, !error
&& bh_map
.b_blocknr
);
325 return bh_map
.b_blocknr
;
329 * log_distance - Compute distance between two journal blocks
330 * @sdp: The GFS2 superblock
331 * @newer: The most recent journal block of the pair
332 * @older: The older journal block of the pair
334 * Compute the distance (in the journal direction) between two
335 * blocks in the journal
337 * Returns: the distance in blocks
340 static inline unsigned int log_distance(struct gfs2_sbd
*sdp
, unsigned int newer
,
345 dist
= newer
- older
;
347 dist
+= sdp
->sd_jdesc
->jd_blocks
;
352 static unsigned int current_tail(struct gfs2_sbd
*sdp
)
359 if (list_empty(&sdp
->sd_ail1_list
)) {
360 tail
= sdp
->sd_log_head
;
362 ai
= list_entry(sdp
->sd_ail1_list
.prev
, struct gfs2_ail
, ai_list
);
366 gfs2_log_unlock(sdp
);
371 static inline void log_incr_head(struct gfs2_sbd
*sdp
)
373 if (sdp
->sd_log_flush_head
== sdp
->sd_log_tail
)
374 gfs2_assert_withdraw(sdp
, sdp
->sd_log_flush_head
== sdp
->sd_log_head
);
376 if (++sdp
->sd_log_flush_head
== sdp
->sd_jdesc
->jd_blocks
) {
377 sdp
->sd_log_flush_head
= 0;
378 sdp
->sd_log_flush_wrapped
= 1;
383 * gfs2_log_get_buf - Get and initialize a buffer to use for log control data
384 * @sdp: The GFS2 superblock
386 * Returns: the buffer_head
389 struct buffer_head
*gfs2_log_get_buf(struct gfs2_sbd
*sdp
)
391 u64 blkno
= log_bmap(sdp
, sdp
->sd_log_flush_head
);
392 struct gfs2_log_buf
*lb
;
393 struct buffer_head
*bh
;
395 lb
= kzalloc(sizeof(struct gfs2_log_buf
), GFP_NOFS
| __GFP_NOFAIL
);
396 list_add(&lb
->lb_list
, &sdp
->sd_log_flush_list
);
398 bh
= lb
->lb_bh
= sb_getblk(sdp
->sd_vfs
, blkno
);
400 memset(bh
->b_data
, 0, bh
->b_size
);
401 set_buffer_uptodate(bh
);
402 clear_buffer_dirty(bh
);
411 * gfs2_log_fake_buf - Build a fake buffer head to write metadata buffer to log
412 * @sdp: the filesystem
413 * @data: the data the buffer_head should point to
415 * Returns: the log buffer descriptor
418 struct buffer_head
*gfs2_log_fake_buf(struct gfs2_sbd
*sdp
,
419 struct buffer_head
*real
)
421 u64 blkno
= log_bmap(sdp
, sdp
->sd_log_flush_head
);
422 struct gfs2_log_buf
*lb
;
423 struct buffer_head
*bh
;
425 lb
= kzalloc(sizeof(struct gfs2_log_buf
), GFP_NOFS
| __GFP_NOFAIL
);
426 list_add(&lb
->lb_list
, &sdp
->sd_log_flush_list
);
429 bh
= lb
->lb_bh
= alloc_buffer_head(GFP_NOFS
| __GFP_NOFAIL
);
430 atomic_set(&bh
->b_count
, 1);
431 bh
->b_state
= (1 << BH_Mapped
) | (1 << BH_Uptodate
);
432 set_bh_page(bh
, real
->b_page
, bh_offset(real
));
433 bh
->b_blocknr
= blkno
;
434 bh
->b_size
= sdp
->sd_sb
.sb_bsize
;
435 bh
->b_bdev
= sdp
->sd_vfs
->s_bdev
;
442 static void log_pull_tail(struct gfs2_sbd
*sdp
, unsigned int new_tail
, int pull
)
444 unsigned int dist
= log_distance(sdp
, new_tail
, sdp
->sd_log_tail
);
446 ail2_empty(sdp
, new_tail
);
449 sdp
->sd_log_blks_free
+= dist
- (pull
? 1 : 0);
450 gfs2_assert_withdraw(sdp
, sdp
->sd_log_blks_free
<= sdp
->sd_jdesc
->jd_blocks
);
451 gfs2_log_unlock(sdp
);
453 sdp
->sd_log_tail
= new_tail
;
457 * log_write_header - Get and initialize a journal header buffer
458 * @sdp: The GFS2 superblock
460 * Returns: the initialized log buffer descriptor
463 static void log_write_header(struct gfs2_sbd
*sdp
, u32 flags
, int pull
)
465 u64 blkno
= log_bmap(sdp
, sdp
->sd_log_flush_head
);
466 struct buffer_head
*bh
;
467 struct gfs2_log_header
*lh
;
471 bh
= sb_getblk(sdp
->sd_vfs
, blkno
);
473 memset(bh
->b_data
, 0, bh
->b_size
);
474 set_buffer_uptodate(bh
);
475 clear_buffer_dirty(bh
);
478 gfs2_ail1_empty(sdp
, 0);
479 tail
= current_tail(sdp
);
481 lh
= (struct gfs2_log_header
*)bh
->b_data
;
482 memset(lh
, 0, sizeof(struct gfs2_log_header
));
483 lh
->lh_header
.mh_magic
= cpu_to_be32(GFS2_MAGIC
);
484 lh
->lh_header
.mh_type
= cpu_to_be32(GFS2_METATYPE_LH
);
485 lh
->lh_header
.mh_format
= cpu_to_be32(GFS2_FORMAT_LH
);
486 lh
->lh_sequence
= cpu_to_be64(sdp
->sd_log_sequence
++);
487 lh
->lh_flags
= cpu_to_be32(flags
);
488 lh
->lh_tail
= cpu_to_be32(tail
);
489 lh
->lh_blkno
= cpu_to_be32(sdp
->sd_log_flush_head
);
490 hash
= gfs2_disk_hash(bh
->b_data
, sizeof(struct gfs2_log_header
));
491 lh
->lh_hash
= cpu_to_be32(hash
);
493 set_buffer_dirty(bh
);
494 if (sync_dirty_buffer(bh
))
495 gfs2_io_error_bh(sdp
, bh
);
498 if (sdp
->sd_log_tail
!= tail
)
499 log_pull_tail(sdp
, tail
, pull
);
501 gfs2_assert_withdraw(sdp
, !pull
);
503 sdp
->sd_log_idle
= (tail
== sdp
->sd_log_flush_head
);
507 static void log_flush_commit(struct gfs2_sbd
*sdp
)
509 struct list_head
*head
= &sdp
->sd_log_flush_list
;
510 struct gfs2_log_buf
*lb
;
511 struct buffer_head
*bh
;
513 while (!list_empty(head
)) {
514 lb
= list_entry(head
->next
, struct gfs2_log_buf
, lb_list
);
515 list_del(&lb
->lb_list
);
519 if (!buffer_uptodate(bh
))
520 gfs2_io_error_bh(sdp
, bh
);
522 while (atomic_read(&bh
->b_count
) != 1) /* Grrrr... */
524 free_buffer_head(bh
);
530 log_write_header(sdp
, 0, 0);
534 * gfs2_log_flush - flush incore transaction(s)
535 * @sdp: the filesystem
536 * @gl: The glock structure to flush. If NULL, flush the whole incore log
540 void gfs2_log_flush(struct gfs2_sbd
*sdp
, struct gfs2_glock
*gl
)
544 down_write(&sdp
->sd_log_flush_lock
);
548 if (list_empty(&gl
->gl_le
.le_list
)) {
549 gfs2_log_unlock(sdp
);
550 up_write(&sdp
->sd_log_flush_lock
);
553 gfs2_log_unlock(sdp
);
556 ai
= kzalloc(sizeof(struct gfs2_ail
), GFP_NOFS
| __GFP_NOFAIL
);
557 INIT_LIST_HEAD(&ai
->ai_ail1_list
);
558 INIT_LIST_HEAD(&ai
->ai_ail2_list
);
560 gfs2_assert_withdraw(sdp
, sdp
->sd_log_num_buf
== sdp
->sd_log_commited_buf
);
561 gfs2_assert_withdraw(sdp
,
562 sdp
->sd_log_num_revoke
== sdp
->sd_log_commited_revoke
);
564 sdp
->sd_log_flush_head
= sdp
->sd_log_head
;
565 sdp
->sd_log_flush_wrapped
= 0;
566 ai
->ai_first
= sdp
->sd_log_flush_head
;
568 lops_before_commit(sdp
);
569 if (!list_empty(&sdp
->sd_log_flush_list
))
570 log_flush_commit(sdp
);
571 else if (sdp
->sd_log_tail
!= current_tail(sdp
) && !sdp
->sd_log_idle
)
572 log_write_header(sdp
, 0, PULL
);
573 lops_after_commit(sdp
, ai
);
576 sdp
->sd_log_head
= sdp
->sd_log_flush_head
;
577 sdp
->sd_log_blks_free
-= sdp
->sd_log_num_hdrs
;
578 sdp
->sd_log_blks_reserved
= 0;
579 sdp
->sd_log_commited_buf
= 0;
580 sdp
->sd_log_num_hdrs
= 0;
581 sdp
->sd_log_commited_revoke
= 0;
583 if (!list_empty(&ai
->ai_ail1_list
)) {
584 list_add(&ai
->ai_list
, &sdp
->sd_ail1_list
);
587 gfs2_log_unlock(sdp
);
589 sdp
->sd_vfs
->s_dirt
= 0;
590 up_write(&sdp
->sd_log_flush_lock
);
595 static void log_refund(struct gfs2_sbd
*sdp
, struct gfs2_trans
*tr
)
597 unsigned int reserved
= 0;
602 sdp
->sd_log_commited_buf
+= tr
->tr_num_buf_new
- tr
->tr_num_buf_rm
;
603 gfs2_assert_withdraw(sdp
, ((int)sdp
->sd_log_commited_buf
) >= 0);
604 sdp
->sd_log_commited_revoke
+= tr
->tr_num_revoke
- tr
->tr_num_revoke_rm
;
605 gfs2_assert_withdraw(sdp
, ((int)sdp
->sd_log_commited_revoke
) >= 0);
607 if (sdp
->sd_log_commited_buf
)
608 reserved
+= sdp
->sd_log_commited_buf
;
609 if (sdp
->sd_log_commited_revoke
)
610 reserved
+= gfs2_struct2blk(sdp
, sdp
->sd_log_commited_revoke
,
615 old
= sdp
->sd_log_blks_free
;
616 sdp
->sd_log_blks_free
+= tr
->tr_reserved
-
617 (reserved
- sdp
->sd_log_blks_reserved
);
619 gfs2_assert_withdraw(sdp
, sdp
->sd_log_blks_free
>= old
);
620 gfs2_assert_withdraw(sdp
,
621 sdp
->sd_log_blks_free
<= sdp
->sd_jdesc
->jd_blocks
+
622 sdp
->sd_log_num_hdrs
);
624 sdp
->sd_log_blks_reserved
= reserved
;
626 gfs2_log_unlock(sdp
);
630 * gfs2_log_commit - Commit a transaction to the log
631 * @sdp: the filesystem
632 * @tr: the transaction
637 void gfs2_log_commit(struct gfs2_sbd
*sdp
, struct gfs2_trans
*tr
)
640 lops_incore_commit(sdp
, tr
);
642 sdp
->sd_vfs
->s_dirt
= 1;
643 up_read(&sdp
->sd_log_flush_lock
);
646 if (sdp
->sd_log_num_buf
> gfs2_tune_get(sdp
, gt_incore_log_blocks
)) {
647 gfs2_log_unlock(sdp
);
648 gfs2_log_flush(sdp
, NULL
);
650 gfs2_log_unlock(sdp
);
655 * gfs2_log_shutdown - write a shutdown header into a journal
656 * @sdp: the filesystem
660 void gfs2_log_shutdown(struct gfs2_sbd
*sdp
)
662 down_write(&sdp
->sd_log_flush_lock
);
664 gfs2_assert_withdraw(sdp
, !sdp
->sd_log_blks_reserved
);
665 gfs2_assert_withdraw(sdp
, !sdp
->sd_log_num_gl
);
666 gfs2_assert_withdraw(sdp
, !sdp
->sd_log_num_buf
);
667 gfs2_assert_withdraw(sdp
, !sdp
->sd_log_num_jdata
);
668 gfs2_assert_withdraw(sdp
, !sdp
->sd_log_num_revoke
);
669 gfs2_assert_withdraw(sdp
, !sdp
->sd_log_num_rg
);
670 gfs2_assert_withdraw(sdp
, !sdp
->sd_log_num_databuf
);
671 gfs2_assert_withdraw(sdp
, !sdp
->sd_log_num_hdrs
);
672 gfs2_assert_withdraw(sdp
, list_empty(&sdp
->sd_ail1_list
));
674 sdp
->sd_log_flush_head
= sdp
->sd_log_head
;
675 sdp
->sd_log_flush_wrapped
= 0;
677 log_write_header(sdp
, GFS2_LOG_HEAD_UNMOUNT
, 0);
679 gfs2_assert_warn(sdp
, sdp
->sd_log_blks_free
== sdp
->sd_jdesc
->jd_blocks
);
680 gfs2_assert_warn(sdp
, sdp
->sd_log_head
== sdp
->sd_log_tail
);
681 gfs2_assert_warn(sdp
, list_empty(&sdp
->sd_ail2_list
));
683 sdp
->sd_log_head
= sdp
->sd_log_flush_head
;
684 sdp
->sd_log_tail
= sdp
->sd_log_head
;
686 up_write(&sdp
->sd_log_flush_lock
);