2 * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
3 * Copyright (C) 2004-2006 Red Hat, Inc. All rights reserved.
5 * This copyrighted material is made available to anyone wishing to use,
6 * modify, copy, or redistribute it subject to the terms and conditions
7 * of the GNU General Public License version 2.
10 #include <linux/sched.h>
11 #include <linux/slab.h>
12 #include <linux/spinlock.h>
13 #include <linux/completion.h>
14 #include <linux/buffer_head.h>
15 #include <linux/mempool.h>
16 #include <linux/gfs2_ondisk.h>
17 #include <linux/bio.h>
31 #include "trace_gfs2.h"
34 * gfs2_pin - Pin a buffer in memory
35 * @sdp: The superblock
36 * @bh: The buffer to be pinned
38 * The log lock must be held when calling this function
40 static void gfs2_pin(struct gfs2_sbd
*sdp
, struct buffer_head
*bh
)
42 struct gfs2_bufdata
*bd
;
44 BUG_ON(!current
->journal_info
);
46 clear_buffer_dirty(bh
);
47 if (test_set_buffer_pinned(bh
))
48 gfs2_assert_withdraw(sdp
, 0);
49 if (!buffer_uptodate(bh
))
50 gfs2_io_error_bh(sdp
, bh
);
52 /* If this buffer is in the AIL and it has already been written
53 * to in-place disk block, remove it from the AIL.
55 spin_lock(&sdp
->sd_ail_lock
);
57 list_move(&bd
->bd_ail_st_list
, &bd
->bd_ail
->ai_ail2_list
);
58 spin_unlock(&sdp
->sd_ail_lock
);
60 atomic_inc(&sdp
->sd_log_pinned
);
61 trace_gfs2_pin(bd
, 1);
64 static bool buffer_is_rgrp(const struct gfs2_bufdata
*bd
)
66 return bd
->bd_gl
->gl_name
.ln_type
== LM_TYPE_RGRP
;
69 static void maybe_release_space(struct gfs2_bufdata
*bd
)
71 struct gfs2_glock
*gl
= bd
->bd_gl
;
72 struct gfs2_sbd
*sdp
= gl
->gl_sbd
;
73 struct gfs2_rgrpd
*rgd
= gl
->gl_object
;
74 unsigned int index
= bd
->bd_bh
->b_blocknr
- gl
->gl_name
.ln_number
;
75 struct gfs2_bitmap
*bi
= rgd
->rd_bits
+ index
;
77 if (bi
->bi_clone
== 0)
79 if (sdp
->sd_args
.ar_discard
)
80 gfs2_rgrp_send_discards(sdp
, rgd
->rd_data0
, bd
->bd_bh
, bi
, 1, NULL
);
81 memcpy(bi
->bi_clone
+ bi
->bi_offset
,
82 bd
->bd_bh
->b_data
+ bi
->bi_offset
, bi
->bi_len
);
83 clear_bit(GBF_FULL
, &bi
->bi_flags
);
84 rgd
->rd_free_clone
= rgd
->rd_free
;
88 * gfs2_unpin - Unpin a buffer
89 * @sdp: the filesystem the buffer belongs to
90 * @bh: The buffer to unpin
92 * @ai: The AIL entry whose ai_ail1_list the buffer is added to
96 static void gfs2_unpin(struct gfs2_sbd
*sdp
, struct buffer_head
*bh
,
99 struct gfs2_bufdata
*bd
= bh
->b_private
;
101 BUG_ON(!buffer_uptodate(bh
));
102 BUG_ON(!buffer_pinned(bh
));
105 mark_buffer_dirty(bh
);
106 clear_buffer_pinned(bh
);
108 if (buffer_is_rgrp(bd
))
109 maybe_release_space(bd
);
111 spin_lock(&sdp
->sd_ail_lock
);
113 list_del(&bd
->bd_ail_st_list
);
116 struct gfs2_glock
*gl
= bd
->bd_gl
;
117 list_add(&bd
->bd_ail_gl_list
, &gl
->gl_ail_list
);
118 atomic_inc(&gl
->gl_ail_count
);
121 list_add(&bd
->bd_ail_st_list
, &ai
->ai_ail1_list
);
122 spin_unlock(&sdp
->sd_ail_lock
);
124 clear_bit(GLF_LFLUSH
, &bd
->bd_gl
->gl_flags
);
125 trace_gfs2_pin(bd
, 0);
127 atomic_dec(&sdp
->sd_log_pinned
);
130 static void gfs2_log_incr_head(struct gfs2_sbd
*sdp
)
132 BUG_ON((sdp
->sd_log_flush_head
== sdp
->sd_log_tail
) &&
133 (sdp
->sd_log_flush_head
!= sdp
->sd_log_head
));
135 if (++sdp
->sd_log_flush_head
== sdp
->sd_jdesc
->jd_blocks
) {
136 sdp
->sd_log_flush_head
= 0;
137 sdp
->sd_log_flush_wrapped
= 1;
141 static u64
gfs2_log_bmap(struct gfs2_sbd
*sdp
)
143 unsigned int lbn
= sdp
->sd_log_flush_head
;
144 struct gfs2_journal_extent
*je
;
147 list_for_each_entry(je
, &sdp
->sd_jdesc
->extent_list
, extent_list
) {
148 if (lbn
>= je
->lblock
&& lbn
< je
->lblock
+ je
->blocks
) {
149 block
= je
->dblock
+ lbn
- je
->lblock
;
150 gfs2_log_incr_head(sdp
);
159 * gfs2_end_log_write_bh - end log write of pagecache data with buffers
160 * @sdp: The superblock
162 * @error: The i/o status
164 * This finds the relevant buffers and unlocks them and sets the
165 * error flag according to the status of the i/o request. This is
166 * used when the log is writing data which has an in-place version
167 * that is pinned in the pagecache.
170 static void gfs2_end_log_write_bh(struct gfs2_sbd
*sdp
, struct bio_vec
*bvec
,
173 struct buffer_head
*bh
, *next
;
174 struct page
*page
= bvec
->bv_page
;
177 bh
= page_buffers(page
);
179 while (bh_offset(bh
) < bvec
->bv_offset
)
180 bh
= bh
->b_this_page
;
183 set_buffer_write_io_error(bh
);
185 next
= bh
->b_this_page
;
193 * gfs2_end_log_write - end of i/o to the log
195 * @error: Status of i/o request
197 * Each bio_vec contains either data from the pagecache or data
198 * relating to the log itself. Here we iterate over the bio_vec
199 * array, processing both kinds of data.
203 static void gfs2_end_log_write(struct bio
*bio
, int error
)
205 struct gfs2_sbd
*sdp
= bio
->bi_private
;
206 struct bio_vec
*bvec
;
211 sdp
->sd_log_error
= error
;
212 fs_err(sdp
, "Error %d writing to log\n", error
);
215 bio_for_each_segment(bvec
, bio
, i
) {
216 page
= bvec
->bv_page
;
217 if (page_has_buffers(page
))
218 gfs2_end_log_write_bh(sdp
, bvec
, error
);
220 mempool_free(page
, gfs2_page_pool
);
224 if (atomic_dec_and_test(&sdp
->sd_log_in_flight
))
225 wake_up(&sdp
->sd_log_flush_wait
);
229 * gfs2_log_flush_bio - Submit any pending log bio
230 * @sdp: The superblock
233 * Submit any pending part-built or full bio to the block device. If
234 * there is no pending bio, then this is a no-op.
237 void gfs2_log_flush_bio(struct gfs2_sbd
*sdp
, int rw
)
239 if (sdp
->sd_log_bio
) {
240 atomic_inc(&sdp
->sd_log_in_flight
);
241 submit_bio(rw
, sdp
->sd_log_bio
);
242 sdp
->sd_log_bio
= NULL
;
247 * gfs2_log_alloc_bio - Allocate a new bio for log writing
248 * @sdp: The superblock
249 * @blkno: The next device block number we want to write to
251 * This should never be called when there is a cached bio in the
252 * super block. When it returns, there will be a cached bio in the
253 * super block which will have as many bio_vecs as the device is
256 * Returns: Newly allocated bio
259 static struct bio
*gfs2_log_alloc_bio(struct gfs2_sbd
*sdp
, u64 blkno
)
261 struct super_block
*sb
= sdp
->sd_vfs
;
262 unsigned nrvecs
= bio_get_nr_vecs(sb
->s_bdev
);
265 BUG_ON(sdp
->sd_log_bio
);
268 bio
= bio_alloc(GFP_NOIO
, nrvecs
);
271 nrvecs
= max(nrvecs
/2, 1U);
274 bio
->bi_sector
= blkno
* (sb
->s_blocksize
>> 9);
275 bio
->bi_bdev
= sb
->s_bdev
;
276 bio
->bi_end_io
= gfs2_end_log_write
;
277 bio
->bi_private
= sdp
;
279 sdp
->sd_log_bio
= bio
;
285 * gfs2_log_get_bio - Get cached log bio, or allocate a new one
286 * @sdp: The superblock
287 * @blkno: The device block number we want to write to
289 * If there is a cached bio, then if the next block number is sequential
290 * with the previous one, return it, otherwise flush the bio to the
291 * device. If there is not a cached bio, or we just flushed it, then
292 * allocate a new one.
294 * Returns: The bio to use for log writes
297 static struct bio
*gfs2_log_get_bio(struct gfs2_sbd
*sdp
, u64 blkno
)
299 struct bio
*bio
= sdp
->sd_log_bio
;
303 nblk
= bio
->bi_sector
+ bio_sectors(bio
);
304 nblk
>>= sdp
->sd_fsb2bb_shift
;
307 gfs2_log_flush_bio(sdp
, WRITE
);
310 return gfs2_log_alloc_bio(sdp
, blkno
);
315 * gfs2_log_write - write to log
316 * @sdp: the filesystem
317 * @page: the page to write
318 * @size: the size of the data to write
319 * @offset: the offset within the page
321 * Try and add the page segment to the current bio. If that fails,
322 * submit the current bio to the device and create a new one, and
323 * then add the page segment to that.
326 static void gfs2_log_write(struct gfs2_sbd
*sdp
, struct page
*page
,
327 unsigned size
, unsigned offset
)
329 u64 blkno
= gfs2_log_bmap(sdp
);
333 bio
= gfs2_log_get_bio(sdp
, blkno
);
334 ret
= bio_add_page(bio
, page
, size
, offset
);
336 gfs2_log_flush_bio(sdp
, WRITE
);
337 bio
= gfs2_log_alloc_bio(sdp
, blkno
);
338 ret
= bio_add_page(bio
, page
, size
, offset
);
344 * gfs2_log_write_bh - write a buffer's content to the log
345 * @sdp: The super block
346 * @bh: The buffer pointing to the in-place location
348 * This writes the content of the buffer to the next available location
349 * in the log. The buffer will be unlocked once the i/o to the log has
353 static void gfs2_log_write_bh(struct gfs2_sbd
*sdp
, struct buffer_head
*bh
)
355 gfs2_log_write(sdp
, bh
->b_page
, bh
->b_size
, bh_offset(bh
));
359 * gfs2_log_write_page - write one block stored in a page, into the log
360 * @sdp: The superblock
361 * @page: The struct page
363 * This writes the first block-sized part of the page into the log. Note
364 * that the page must have been allocated from the gfs2_page_pool mempool
365 * and that after this has been called, ownership has been transferred and
366 * the page may be freed at any time.
369 void gfs2_log_write_page(struct gfs2_sbd
*sdp
, struct page
*page
)
371 struct super_block
*sb
= sdp
->sd_vfs
;
372 gfs2_log_write(sdp
, page
, sb
->s_blocksize
, 0);
375 static struct page
*gfs2_get_log_desc(struct gfs2_sbd
*sdp
, u32 ld_type
,
376 u32 ld_length
, u32 ld_data1
)
378 struct page
*page
= mempool_alloc(gfs2_page_pool
, GFP_NOIO
);
379 struct gfs2_log_descriptor
*ld
= page_address(page
);
381 ld
->ld_header
.mh_magic
= cpu_to_be32(GFS2_MAGIC
);
382 ld
->ld_header
.mh_type
= cpu_to_be32(GFS2_METATYPE_LD
);
383 ld
->ld_header
.mh_format
= cpu_to_be32(GFS2_FORMAT_LD
);
384 ld
->ld_type
= cpu_to_be32(ld_type
);
385 ld
->ld_length
= cpu_to_be32(ld_length
);
386 ld
->ld_data1
= cpu_to_be32(ld_data1
);
391 static void buf_lo_add(struct gfs2_sbd
*sdp
, struct gfs2_bufdata
*bd
)
393 struct gfs2_meta_header
*mh
;
394 struct gfs2_trans
*tr
;
396 lock_buffer(bd
->bd_bh
);
398 tr
= current
->journal_info
;
400 if (!list_empty(&bd
->bd_list
))
402 set_bit(GLF_LFLUSH
, &bd
->bd_gl
->gl_flags
);
403 set_bit(GLF_DIRTY
, &bd
->bd_gl
->gl_flags
);
404 gfs2_meta_check(sdp
, bd
->bd_bh
);
405 gfs2_pin(sdp
, bd
->bd_bh
);
406 mh
= (struct gfs2_meta_header
*)bd
->bd_bh
->b_data
;
407 mh
->__pad0
= cpu_to_be64(0);
408 mh
->mh_jid
= cpu_to_be32(sdp
->sd_jdesc
->jd_jid
);
409 sdp
->sd_log_num_buf
++;
410 list_add(&bd
->bd_list
, &sdp
->sd_log_le_buf
);
411 tr
->tr_num_buf_new
++;
413 gfs2_log_unlock(sdp
);
414 unlock_buffer(bd
->bd_bh
);
417 static void gfs2_check_magic(struct buffer_head
*bh
)
422 clear_buffer_escaped(bh
);
423 kaddr
= kmap_atomic(bh
->b_page
);
424 ptr
= kaddr
+ bh_offset(bh
);
425 if (*ptr
== cpu_to_be32(GFS2_MAGIC
))
426 set_buffer_escaped(bh
);
427 kunmap_atomic(kaddr
);
430 static void gfs2_before_commit(struct gfs2_sbd
*sdp
, unsigned int limit
,
431 unsigned int total
, struct list_head
*blist
,
434 struct gfs2_log_descriptor
*ld
;
435 struct gfs2_bufdata
*bd1
= NULL
, *bd2
;
442 bd1
= bd2
= list_prepare_entry(bd1
, blist
, bd_list
);
447 gfs2_log_unlock(sdp
);
448 page
= gfs2_get_log_desc(sdp
, GFS2_LOG_DESC_METADATA
, num
+ 1, num
);
449 ld
= page_address(page
);
451 ptr
= (__be64
*)(ld
+ 1);
454 list_for_each_entry_continue(bd1
, blist
, bd_list
) {
455 *ptr
++ = cpu_to_be64(bd1
->bd_bh
->b_blocknr
);
457 gfs2_check_magic(bd1
->bd_bh
);
458 *ptr
++ = cpu_to_be64(buffer_escaped(bd1
->bd_bh
) ? 1 : 0);
464 gfs2_log_unlock(sdp
);
465 gfs2_log_write_page(sdp
, page
);
469 list_for_each_entry_continue(bd2
, blist
, bd_list
) {
471 gfs2_log_unlock(sdp
);
472 lock_buffer(bd2
->bd_bh
);
474 if (buffer_escaped(bd2
->bd_bh
)) {
476 page
= mempool_alloc(gfs2_page_pool
, GFP_NOIO
);
477 ptr
= page_address(page
);
478 kaddr
= kmap_atomic(bd2
->bd_bh
->b_page
);
479 memcpy(ptr
, kaddr
+ bh_offset(bd2
->bd_bh
),
481 kunmap_atomic(kaddr
);
483 clear_buffer_escaped(bd2
->bd_bh
);
484 unlock_buffer(bd2
->bd_bh
);
486 gfs2_log_write_page(sdp
, page
);
488 gfs2_log_write_bh(sdp
, bd2
->bd_bh
);
498 gfs2_log_unlock(sdp
);
501 static void buf_lo_before_commit(struct gfs2_sbd
*sdp
)
503 unsigned int limit
= buf_limit(sdp
); /* 503 for 4k blocks */
505 gfs2_before_commit(sdp
, limit
, sdp
->sd_log_num_buf
,
506 &sdp
->sd_log_le_buf
, 0);
509 static void buf_lo_after_commit(struct gfs2_sbd
*sdp
, struct gfs2_ail
*ai
)
511 struct list_head
*head
= &sdp
->sd_log_le_buf
;
512 struct gfs2_bufdata
*bd
;
514 while (!list_empty(head
)) {
515 bd
= list_entry(head
->next
, struct gfs2_bufdata
, bd_list
);
516 list_del_init(&bd
->bd_list
);
517 sdp
->sd_log_num_buf
--;
519 gfs2_unpin(sdp
, bd
->bd_bh
, ai
);
521 gfs2_assert_warn(sdp
, !sdp
->sd_log_num_buf
);
524 static void buf_lo_before_scan(struct gfs2_jdesc
*jd
,
525 struct gfs2_log_header_host
*head
, int pass
)
527 struct gfs2_sbd
*sdp
= GFS2_SB(jd
->jd_inode
);
532 sdp
->sd_found_blocks
= 0;
533 sdp
->sd_replayed_blocks
= 0;
536 static int buf_lo_scan_elements(struct gfs2_jdesc
*jd
, unsigned int start
,
537 struct gfs2_log_descriptor
*ld
, __be64
*ptr
,
540 struct gfs2_inode
*ip
= GFS2_I(jd
->jd_inode
);
541 struct gfs2_sbd
*sdp
= GFS2_SB(jd
->jd_inode
);
542 struct gfs2_glock
*gl
= ip
->i_gl
;
543 unsigned int blks
= be32_to_cpu(ld
->ld_data1
);
544 struct buffer_head
*bh_log
, *bh_ip
;
548 if (pass
!= 1 || be32_to_cpu(ld
->ld_type
) != GFS2_LOG_DESC_METADATA
)
551 gfs2_replay_incr_blk(sdp
, &start
);
553 for (; blks
; gfs2_replay_incr_blk(sdp
, &start
), blks
--) {
554 blkno
= be64_to_cpu(*ptr
++);
556 sdp
->sd_found_blocks
++;
558 if (gfs2_revoke_check(sdp
, blkno
, start
))
561 error
= gfs2_replay_read_block(jd
, start
, &bh_log
);
565 bh_ip
= gfs2_meta_new(gl
, blkno
);
566 memcpy(bh_ip
->b_data
, bh_log
->b_data
, bh_log
->b_size
);
568 if (gfs2_meta_check(sdp
, bh_ip
))
571 mark_buffer_dirty(bh_ip
);
579 sdp
->sd_replayed_blocks
++;
585 static void buf_lo_after_scan(struct gfs2_jdesc
*jd
, int error
, int pass
)
587 struct gfs2_inode
*ip
= GFS2_I(jd
->jd_inode
);
588 struct gfs2_sbd
*sdp
= GFS2_SB(jd
->jd_inode
);
591 gfs2_meta_sync(ip
->i_gl
);
597 gfs2_meta_sync(ip
->i_gl
);
599 fs_info(sdp
, "jid=%u: Replayed %u of %u blocks\n",
600 jd
->jd_jid
, sdp
->sd_replayed_blocks
, sdp
->sd_found_blocks
);
603 static void revoke_lo_add(struct gfs2_sbd
*sdp
, struct gfs2_bufdata
*bd
)
605 struct gfs2_glock
*gl
= bd
->bd_gl
;
606 struct gfs2_trans
*tr
;
608 tr
= current
->journal_info
;
611 sdp
->sd_log_num_revoke
++;
612 atomic_inc(&gl
->gl_revokes
);
613 set_bit(GLF_LFLUSH
, &gl
->gl_flags
);
614 list_add(&bd
->bd_list
, &sdp
->sd_log_le_revoke
);
617 static void revoke_lo_before_commit(struct gfs2_sbd
*sdp
)
619 struct gfs2_log_descriptor
*ld
;
620 struct gfs2_meta_header
*mh
;
622 struct list_head
*head
= &sdp
->sd_log_le_revoke
;
623 struct gfs2_bufdata
*bd
;
627 if (!sdp
->sd_log_num_revoke
)
630 length
= gfs2_struct2blk(sdp
, sdp
->sd_log_num_revoke
, sizeof(u64
));
631 page
= gfs2_get_log_desc(sdp
, GFS2_LOG_DESC_REVOKE
, length
, sdp
->sd_log_num_revoke
);
632 ld
= page_address(page
);
633 offset
= sizeof(struct gfs2_log_descriptor
);
635 list_for_each_entry(bd
, head
, bd_list
) {
636 sdp
->sd_log_num_revoke
--;
638 if (offset
+ sizeof(u64
) > sdp
->sd_sb
.sb_bsize
) {
640 gfs2_log_write_page(sdp
, page
);
641 page
= mempool_alloc(gfs2_page_pool
, GFP_NOIO
);
642 mh
= page_address(page
);
644 mh
->mh_magic
= cpu_to_be32(GFS2_MAGIC
);
645 mh
->mh_type
= cpu_to_be32(GFS2_METATYPE_LB
);
646 mh
->mh_format
= cpu_to_be32(GFS2_FORMAT_LB
);
647 offset
= sizeof(struct gfs2_meta_header
);
650 *(__be64
*)(page_address(page
) + offset
) = cpu_to_be64(bd
->bd_blkno
);
651 offset
+= sizeof(u64
);
653 gfs2_assert_withdraw(sdp
, !sdp
->sd_log_num_revoke
);
655 gfs2_log_write_page(sdp
, page
);
658 static void revoke_lo_after_commit(struct gfs2_sbd
*sdp
, struct gfs2_ail
*ai
)
660 struct list_head
*head
= &sdp
->sd_log_le_revoke
;
661 struct gfs2_bufdata
*bd
;
662 struct gfs2_glock
*gl
;
664 while (!list_empty(head
)) {
665 bd
= list_entry(head
->next
, struct gfs2_bufdata
, bd_list
);
666 list_del_init(&bd
->bd_list
);
668 atomic_dec(&gl
->gl_revokes
);
669 clear_bit(GLF_LFLUSH
, &gl
->gl_flags
);
670 kmem_cache_free(gfs2_bufdata_cachep
, bd
);
674 static void revoke_lo_before_scan(struct gfs2_jdesc
*jd
,
675 struct gfs2_log_header_host
*head
, int pass
)
677 struct gfs2_sbd
*sdp
= GFS2_SB(jd
->jd_inode
);
682 sdp
->sd_found_revokes
= 0;
683 sdp
->sd_replay_tail
= head
->lh_tail
;
686 static int revoke_lo_scan_elements(struct gfs2_jdesc
*jd
, unsigned int start
,
687 struct gfs2_log_descriptor
*ld
, __be64
*ptr
,
690 struct gfs2_sbd
*sdp
= GFS2_SB(jd
->jd_inode
);
691 unsigned int blks
= be32_to_cpu(ld
->ld_length
);
692 unsigned int revokes
= be32_to_cpu(ld
->ld_data1
);
693 struct buffer_head
*bh
;
699 if (pass
!= 0 || be32_to_cpu(ld
->ld_type
) != GFS2_LOG_DESC_REVOKE
)
702 offset
= sizeof(struct gfs2_log_descriptor
);
704 for (; blks
; gfs2_replay_incr_blk(sdp
, &start
), blks
--) {
705 error
= gfs2_replay_read_block(jd
, start
, &bh
);
710 gfs2_metatype_check(sdp
, bh
, GFS2_METATYPE_LB
);
712 while (offset
+ sizeof(u64
) <= sdp
->sd_sb
.sb_bsize
) {
713 blkno
= be64_to_cpu(*(__be64
*)(bh
->b_data
+ offset
));
715 error
= gfs2_revoke_add(sdp
, blkno
, start
);
721 sdp
->sd_found_revokes
++;
725 offset
+= sizeof(u64
);
729 offset
= sizeof(struct gfs2_meta_header
);
736 static void revoke_lo_after_scan(struct gfs2_jdesc
*jd
, int error
, int pass
)
738 struct gfs2_sbd
*sdp
= GFS2_SB(jd
->jd_inode
);
741 gfs2_revoke_clean(sdp
);
747 fs_info(sdp
, "jid=%u: Found %u revoke tags\n",
748 jd
->jd_jid
, sdp
->sd_found_revokes
);
750 gfs2_revoke_clean(sdp
);
754 * databuf_lo_add - Add a databuf to the transaction.
756 * This is used in two distinct cases:
757 * i) In ordered write mode
758 * We put the data buffer on a list so that we can ensure that it is
759 * synced to disk at the right time
760 * ii) In journaled data mode
761 * We need to journal the data block in the same way as metadata in
762 * the functions above. The difference is that here we have a tag
763 * which is two __be64's being the block number (as per meta data)
764 * and a flag which says whether the data block needs escaping or
765 * not. This means we need a new log entry for each 251 or so data
766 * blocks, which isn't an enormous overhead but twice as much as
767 * for normal metadata blocks.
769 static void databuf_lo_add(struct gfs2_sbd
*sdp
, struct gfs2_bufdata
*bd
)
771 struct gfs2_trans
*tr
= current
->journal_info
;
772 struct address_space
*mapping
= bd
->bd_bh
->b_page
->mapping
;
773 struct gfs2_inode
*ip
= GFS2_I(mapping
->host
);
775 lock_buffer(bd
->bd_bh
);
779 if (!list_empty(&bd
->bd_list
))
781 set_bit(GLF_LFLUSH
, &bd
->bd_gl
->gl_flags
);
782 set_bit(GLF_DIRTY
, &bd
->bd_gl
->gl_flags
);
783 if (gfs2_is_jdata(ip
)) {
784 gfs2_pin(sdp
, bd
->bd_bh
);
785 tr
->tr_num_databuf_new
++;
786 sdp
->sd_log_num_databuf
++;
787 list_add_tail(&bd
->bd_list
, &sdp
->sd_log_le_databuf
);
789 list_add_tail(&bd
->bd_list
, &sdp
->sd_log_le_ordered
);
792 gfs2_log_unlock(sdp
);
793 unlock_buffer(bd
->bd_bh
);
797 * databuf_lo_before_commit - Scan the data buffers, writing as we go
801 static void databuf_lo_before_commit(struct gfs2_sbd
*sdp
)
803 unsigned int limit
= buf_limit(sdp
) / 2;
805 gfs2_before_commit(sdp
, limit
, sdp
->sd_log_num_databuf
,
806 &sdp
->sd_log_le_databuf
, 1);
809 static int databuf_lo_scan_elements(struct gfs2_jdesc
*jd
, unsigned int start
,
810 struct gfs2_log_descriptor
*ld
,
811 __be64
*ptr
, int pass
)
813 struct gfs2_inode
*ip
= GFS2_I(jd
->jd_inode
);
814 struct gfs2_sbd
*sdp
= GFS2_SB(jd
->jd_inode
);
815 struct gfs2_glock
*gl
= ip
->i_gl
;
816 unsigned int blks
= be32_to_cpu(ld
->ld_data1
);
817 struct buffer_head
*bh_log
, *bh_ip
;
822 if (pass
!= 1 || be32_to_cpu(ld
->ld_type
) != GFS2_LOG_DESC_JDATA
)
825 gfs2_replay_incr_blk(sdp
, &start
);
826 for (; blks
; gfs2_replay_incr_blk(sdp
, &start
), blks
--) {
827 blkno
= be64_to_cpu(*ptr
++);
828 esc
= be64_to_cpu(*ptr
++);
830 sdp
->sd_found_blocks
++;
832 if (gfs2_revoke_check(sdp
, blkno
, start
))
835 error
= gfs2_replay_read_block(jd
, start
, &bh_log
);
839 bh_ip
= gfs2_meta_new(gl
, blkno
);
840 memcpy(bh_ip
->b_data
, bh_log
->b_data
, bh_log
->b_size
);
844 __be32
*eptr
= (__be32
*)bh_ip
->b_data
;
845 *eptr
= cpu_to_be32(GFS2_MAGIC
);
847 mark_buffer_dirty(bh_ip
);
852 sdp
->sd_replayed_blocks
++;
858 /* FIXME: sort out accounting for log blocks etc. */
860 static void databuf_lo_after_scan(struct gfs2_jdesc
*jd
, int error
, int pass
)
862 struct gfs2_inode
*ip
= GFS2_I(jd
->jd_inode
);
863 struct gfs2_sbd
*sdp
= GFS2_SB(jd
->jd_inode
);
866 gfs2_meta_sync(ip
->i_gl
);
873 gfs2_meta_sync(ip
->i_gl
);
875 fs_info(sdp
, "jid=%u: Replayed %u of %u data blocks\n",
876 jd
->jd_jid
, sdp
->sd_replayed_blocks
, sdp
->sd_found_blocks
);
879 static void databuf_lo_after_commit(struct gfs2_sbd
*sdp
, struct gfs2_ail
*ai
)
881 struct list_head
*head
= &sdp
->sd_log_le_databuf
;
882 struct gfs2_bufdata
*bd
;
884 while (!list_empty(head
)) {
885 bd
= list_entry(head
->next
, struct gfs2_bufdata
, bd_list
);
886 list_del_init(&bd
->bd_list
);
887 sdp
->sd_log_num_databuf
--;
888 gfs2_unpin(sdp
, bd
->bd_bh
, ai
);
890 gfs2_assert_warn(sdp
, !sdp
->sd_log_num_databuf
);
894 const struct gfs2_log_operations gfs2_buf_lops
= {
895 .lo_add
= buf_lo_add
,
896 .lo_before_commit
= buf_lo_before_commit
,
897 .lo_after_commit
= buf_lo_after_commit
,
898 .lo_before_scan
= buf_lo_before_scan
,
899 .lo_scan_elements
= buf_lo_scan_elements
,
900 .lo_after_scan
= buf_lo_after_scan
,
904 const struct gfs2_log_operations gfs2_revoke_lops
= {
905 .lo_add
= revoke_lo_add
,
906 .lo_before_commit
= revoke_lo_before_commit
,
907 .lo_after_commit
= revoke_lo_after_commit
,
908 .lo_before_scan
= revoke_lo_before_scan
,
909 .lo_scan_elements
= revoke_lo_scan_elements
,
910 .lo_after_scan
= revoke_lo_after_scan
,
914 const struct gfs2_log_operations gfs2_rg_lops
= {
918 const struct gfs2_log_operations gfs2_databuf_lops
= {
919 .lo_add
= databuf_lo_add
,
920 .lo_before_commit
= databuf_lo_before_commit
,
921 .lo_after_commit
= databuf_lo_after_commit
,
922 .lo_scan_elements
= databuf_lo_scan_elements
,
923 .lo_after_scan
= databuf_lo_after_scan
,
924 .lo_name
= "databuf",
927 const struct gfs2_log_operations
*gfs2_log_ops
[] = {