2 * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
3 * Copyright (C) 2004-2006 Red Hat, Inc. All rights reserved.
5 * This copyrighted material is made available to anyone wishing to use,
6 * modify, copy, or redistribute it subject to the terms and conditions
7 * of the GNU General Public License version 2.
10 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
12 #include <linux/sched.h>
13 #include <linux/slab.h>
14 #include <linux/spinlock.h>
15 #include <linux/completion.h>
16 #include <linux/buffer_head.h>
17 #include <linux/kallsyms.h>
18 #include <linux/gfs2_ondisk.h>
29 #include "trace_gfs2.h"
/*
 * gfs2_trans_begin - set up a transaction and attach it to the current task.
 * @sdp: the filesystem's gfs2_sbd
 * @blocks: block count requested by the caller; stored in tr->tr_blocks
 *
 * A "revokes" count is also used below (stored in tr->tr_revokes); its
 * declaration is not visible in this listing.
 *
 * Allocates a zeroed struct gfs2_trans, grows tr_reserved from the block
 * and revoke counts, reserves that amount of log space through
 * gfs2_log_reserve() and stores the transaction in current->journal_info.
 *
 * NOTE(review): braces, return statements and the conditions guarding
 * some statements are not visible here - confirm against the full source.
 */
31 int gfs2_trans_begin(struct gfs2_sbd
*sdp
, unsigned int blocks
,
34 struct gfs2_trans
*tr
;
/*
 * The task must not already carry a transaction, and a request for
 * neither blocks nor revokes is treated as a bug.
 */
37 BUG_ON(current
->journal_info
);
38 BUG_ON(blocks
== 0 && revokes
== 0);
/* Tests the SDF_JOURNAL_LIVE flag; the action taken when it is clear is not visible here. */
40 if (!test_bit(SDF_JOURNAL_LIVE
, &sdp
->sd_flags
))
/* Zeroed allocation with GFP_NOFS. */
43 tr
= kzalloc(sizeof(struct gfs2_trans
), GFP_NOFS
);
48 tr
->tr_blocks
= blocks
;
49 tr
->tr_revokes
= revokes
;
/* Presumably the constant 6 is fixed per-transaction overhead - TODO confirm. */
53 tr
->tr_reserved
+= 6 + blocks
;
/* Adds the result of gfs2_struct2blk() for the revokes; its last argument is not visible here. */
55 tr
->tr_reserved
+= gfs2_struct2blk(sdp
, revokes
,
57 INIT_LIST_HEAD(&tr
->tr_databuf
);
58 INIT_LIST_HEAD(&tr
->tr_buf
);
/* Matching sb_end_intwrite() calls appear below and in gfs2_trans_end(). */
60 sb_start_intwrite(sdp
->sd_vfs
);
62 error
= gfs2_log_reserve(sdp
, tr
->tr_reserved
);
/* Publish the transaction on the current task. */
66 current
->journal_info
= tr
;
/* Presumably the failure path after gfs2_log_reserve() - the label or condition is not visible here. */
71 sb_end_intwrite(sdp
->sd_vfs
);
/*
 * gfs2_print_trans - log a transaction's state with pr_warn().
 * @tr: the transaction to report; only read, never modified
 *
 * Emits three warnings: the symbol for tr_ip (the "created at" address),
 * the requested/reserved/touched values, and the new/removed counters for
 * bufs, databufs and revokes.
 */
77 static void gfs2_print_trans(const struct gfs2_trans
*tr
)
79 pr_warn("Transaction created at: %pSR\n", (void *)tr
->tr_ip
);
80 pr_warn("blocks=%u revokes=%u reserved=%u touched=%u\n",
81 tr
->tr_blocks
, tr
->tr_revokes
, tr
->tr_reserved
, tr
->tr_touched
);
/* Each pair is printed as new/removed. */
82 pr_warn("Buf %u/%u Databuf %u/%u Revoke %u/%u\n",
83 tr
->tr_num_buf_new
, tr
->tr_num_buf_rm
,
84 tr
->tr_num_databuf_new
, tr
->tr_num_databuf_rm
,
85 tr
->tr_num_revoke
, tr
->tr_num_revoke_rm
);
/*
 * gfs2_trans_end - finish the transaction attached to the current task.
 * @sdp: the filesystem's gfs2_sbd
 *
 * Detaches the transaction from current->journal_info. An untouched
 * transaction has its log reservation released; otherwise the buffer and
 * revoke counts are checked against what was requested and the
 * transaction is handed to gfs2_log_commit().
 *
 * NOTE(review): braces, returns and some branch bodies are not visible in
 * this listing - confirm the exact control flow against the full source.
 */
88 void gfs2_trans_end(struct gfs2_sbd
*sdp
)
90 struct gfs2_trans
*tr
= current
->journal_info
;
/* tr_alloced is sampled up front and tested after gfs2_log_commit(). */
92 int alloced
= tr
->tr_alloced
;
/* Detach the transaction from the task. */
95 current
->journal_info
= NULL
;
/* Nothing was touched: hand back the reserved log space. */
97 if (!tr
->tr_touched
) {
98 gfs2_log_release(sdp
, tr
->tr_reserved
);
101 sb_end_intwrite(sdp
->sd_vfs
);
/* Net buffers added: new bufs plus new databufs, minus those removed again. */
106 nbuf
= tr
->tr_num_buf_new
+ tr
->tr_num_databuf_new
;
107 nbuf
-= tr
->tr_num_buf_rm
;
108 nbuf
-= tr
->tr_num_databuf_rm
;
/*
 * The transaction must stay within the requested blocks and revokes;
 * its counters are printed when gfs2_assert_withdraw() returns non-zero.
 */
110 if (gfs2_assert_withdraw(sdp
, (nbuf
<= tr
->tr_blocks
) &&
111 (tr
->tr_num_revoke
<= tr
->tr_revokes
)))
112 gfs2_print_trans(tr
);
114 gfs2_log_commit(sdp
, tr
);
/* The statement guarded by this condition is not visible here. */
115 if (alloced
&& !tr
->tr_attached
)
117 up_read(&sdp
->sd_log_flush_lock
);
/* MS_SYNCHRONOUS set on the superblock: flush the log right away. */
119 if (sdp
->sd_vfs
->s_flags
& MS_SYNCHRONOUS
)
120 gfs2_log_flush(sdp
, NULL
, NORMAL_FLUSH
);
122 sb_end_intwrite(sdp
->sd_vfs
);
/*
 * gfs2_alloc_bufdata - allocate a gfs2_bufdata.
 * @gl: glock passed by the caller
 * @bh: buffer head passed by the caller
 * @lops: log operations passed by the caller
 *
 * Takes a zeroed object from gfs2_bufdata_cachep and initialises its
 * bd_list head.
 *
 * NOTE(review): how @gl, @bh and @lops are recorded in the new object,
 * and the return statement, are not visible in this listing.
 */
125 static struct gfs2_bufdata
*gfs2_alloc_bufdata(struct gfs2_glock
*gl
,
126 struct buffer_head
*bh
,
127 const struct gfs2_log_operations
*lops
)
129 struct gfs2_bufdata
*bd
;
/* Allocation is requested with GFP_NOFS | __GFP_NOFAIL. */
131 bd
= kmem_cache_zalloc(gfs2_bufdata_cachep
, GFP_NOFS
| __GFP_NOFAIL
);
135 INIT_LIST_HEAD(&bd
->bd_list
);
141 * gfs2_trans_add_data - Add a databuf to the transaction.
142 * @gl: The inode glock associated with the buffer
143 * @bh: The buffer to add
145 * This is used in two distinct cases:
146 * i) In ordered write mode
147 * We put the data buffer on a list so that we can ensure that it is
148 * synced to disk at the right time
149 * ii) In journaled data mode
150 * We need to journal the data block in the same way as metadata in
151 * the functions above. The difference is that here we have a tag
152 * which is two __be64's being the block number (as per metadata)
153 * and a flag which says whether the data block needs escaping or
154 * not. This means we need a new log entry for each 251 or so data
155 * blocks, which isn't an enormous overhead but twice as much as
156 * for normal metadata blocks.
158 void gfs2_trans_add_data(struct gfs2_glock
*gl
, struct buffer_head
*bh
)
/*
 * NOTE(review): braces, else branches and the lock calls that match the
 * gfs2_log_unlock() calls below are not visible in this listing.
 */
160 struct gfs2_trans
*tr
= current
->journal_info
;
161 struct gfs2_sbd
*sdp
= gl
->gl_name
.ln_sbd
;
/* The owning inode is reached through the buffer's page mapping. */
162 struct address_space
*mapping
= bh
->b_page
->mapping
;
163 struct gfs2_inode
*ip
= GFS2_I(mapping
->host
);
164 struct gfs2_bufdata
*bd
;
/* Inode is not jdata: it is passed to gfs2_ordered_add_inode(); the rest of this branch is not visible here. */
166 if (!gfs2_is_jdata(ip
)) {
167 gfs2_ordered_add_inode(ip
);
175 gfs2_log_unlock(sdp
);
/* b_private is NULL: allocate a bufdata using the databuf log operations. */
177 if (bh
->b_private
== NULL
)
178 bd
= gfs2_alloc_bufdata(gl
, bh
, &gfs2_databuf_lops
);
/* The bufdata must belong to the glock the caller passed in. */
184 gfs2_assert(sdp
, bd
->bd_gl
== gl
);
/*
 * Only when bd is not on a list yet: flag the glock, pin the buffer,
 * count it and queue it at the tail of the transaction's databuf list.
 */
186 if (list_empty(&bd
->bd_list
)) {
187 set_bit(GLF_LFLUSH
, &bd
->bd_gl
->gl_flags
);
188 set_bit(GLF_DIRTY
, &bd
->bd_gl
->gl_flags
);
189 gfs2_pin(sdp
, bd
->bd_bh
);
190 tr
->tr_num_databuf_new
++;
191 list_add_tail(&bd
->bd_list
, &tr
->tr_databuf
);
193 gfs2_log_unlock(sdp
);
/*
 * meta_lo_add - add a bufdata to the tr_buf list of the current task's transaction.
 * @sdp: the filesystem's gfs2_sbd
 * @bd: the bufdata to add
 *
 * Flags the glock, checks the block's header magic and the freeze state,
 * pins the buffer, writes the __pad0 and mh_jid header fields, then
 * queues @bd and bumps tr_num_buf_new.
 *
 * NOTE(review): braces and the body of the first list_empty() check are
 * not visible in this listing.
 */
197 static void meta_lo_add(struct gfs2_sbd
*sdp
, struct gfs2_bufdata
*bd
)
199 struct gfs2_meta_header
*mh
;
200 struct gfs2_trans
*tr
;
/* Freeze state is sampled once, at entry. */
201 enum gfs2_freeze_state state
= atomic_read(&sdp
->sd_freeze_state
);
203 tr
= current
->journal_info
;
/* bd is already on a list - presumably an early exit; the action is not visible here. */
205 if (!list_empty(&bd
->bd_list
))
207 set_bit(GLF_LFLUSH
, &bd
->bd_gl
->gl_flags
);
208 set_bit(GLF_DIRTY
, &bd
->bd_gl
->gl_flags
);
/* The buffer data is viewed as a gfs2_meta_header. */
209 mh
= (struct gfs2_meta_header
*)bd
->bd_bh
->b_data
;
/* Header magic is not GFS2_MAGIC: report the block number. */
210 if (unlikely(mh
->mh_magic
!= cpu_to_be32(GFS2_MAGIC
))) {
211 pr_err("Attempting to add uninitialised block to journal (inplace block=%lld)\n",
212 (unsigned long long)bd
->bd_bh
->b_blocknr
);
/* Adding a buffer while the sampled state is SFS_FROZEN is logged and asserted against. */
215 if (unlikely(state
== SFS_FROZEN
)) {
216 printk(KERN_INFO
"GFS2:adding buf while frozen\n");
217 gfs2_assert_withdraw(sdp
, 0);
219 gfs2_pin(sdp
, bd
->bd_bh
);
/* Zero __pad0 and store the journal id (sd_jdesc->jd_jid) in the header. */
220 mh
->__pad0
= cpu_to_be64(0);
221 mh
->mh_jid
= cpu_to_be32(sdp
->sd_jdesc
->jd_jid
);
/* list_add() places bd at the head of tr_buf. */
222 list_add(&bd
->bd_list
, &tr
->tr_buf
);
223 tr
->tr_num_buf_new
++;
/*
 * gfs2_trans_add_meta - pass a buffer's bufdata to meta_lo_add().
 * @gl: the glock the buffer is expected to belong to
 * @bh: the buffer to add
 *
 * A bufdata is allocated with gfs2_buf_lops when bh->b_private is NULL.
 *
 * NOTE(review): braces, else branches and the lock calls that match the
 * gfs2_log_unlock() calls below are not visible in this listing.
 */
226 void gfs2_trans_add_meta(struct gfs2_glock
*gl
, struct buffer_head
*bh
)
229 struct gfs2_sbd
*sdp
= gl
->gl_name
.ln_sbd
;
230 struct gfs2_bufdata
*bd
;
236 gfs2_log_unlock(sdp
);
/* The page is locked around the b_private check and the allocation. */
238 lock_page(bh
->b_page
);
239 if (bh
->b_private
== NULL
)
240 bd
= gfs2_alloc_bufdata(gl
, bh
, &gfs2_buf_lops
);
243 unlock_page(bh
->b_page
);
/* The bufdata must belong to the glock the caller passed in. */
247 gfs2_assert(sdp
, bd
->bd_gl
== gl
);
248 meta_lo_add(sdp
, bd
);
249 gfs2_log_unlock(sdp
);
/*
 * gfs2_trans_add_revoke - pass a bufdata to gfs2_add_revoke().
 * @sdp: the filesystem's gfs2_sbd
 * @bd: the bufdata to revoke; it must not be on any list
 *
 * NOTE(review): the statements that use tr are not visible in this listing.
 */
253 void gfs2_trans_add_revoke(struct gfs2_sbd
*sdp
, struct gfs2_bufdata
*bd
)
255 struct gfs2_trans
*tr
= current
->journal_info
;
/* It is a bug for bd to still be linked on a list at this point. */
257 BUG_ON(!list_empty(&bd
->bd_list
));
258 gfs2_add_revoke(sdp
, bd
);
/*
 * gfs2_trans_add_unrevoke - drop queued revokes that fall in a block range.
 * @sdp: the filesystem's gfs2_sbd
 * @blkno: first block number of the range
 * @len: number of blocks in the range
 *
 * Walks sdp->sd_log_le_revoke and, for every entry whose bd_blkno lies in
 * [@blkno, @blkno + @len), unlinks and frees it, decrements
 * sd_log_num_revoke and increments the transaction's tr_num_revoke_rm.
 *
 * NOTE(review): the lock call matching gfs2_log_unlock(), the use of n
 * and the tail of the loop are not visible in this listing.
 */
263 void gfs2_trans_add_unrevoke(struct gfs2_sbd
*sdp
, u64 blkno
, unsigned int len
)
265 struct gfs2_bufdata
*bd
, *tmp
;
266 struct gfs2_trans
*tr
= current
->journal_info
;
267 unsigned int n
= len
;
/* The _safe iterator is used because matching entries are unlinked and freed inside the loop. */
270 list_for_each_entry_safe(bd
, tmp
, &sdp
->sd_log_le_revoke
, bd_list
) {
271 if ((bd
->bd_blkno
>= blkno
) && (bd
->bd_blkno
< (blkno
+ len
))) {
272 list_del_init(&bd
->bd_list
);
/* The revoke count is asserted to be non-zero before it is decremented. */
273 gfs2_assert_withdraw(sdp
, sdp
->sd_log_num_revoke
);
274 sdp
->sd_log_num_revoke
--;
275 kmem_cache_free(gfs2_bufdata_cachep
, bd
);
276 tr
->tr_num_revoke_rm
++;
281 gfs2_log_unlock(sdp
);