// SPDX-License-Identifier: GPL-2.0
/*
 * Interface between ext4 and JBD
 */
8 #include <trace/events/ext4.h>
10 int ext4_inode_journal_mode(struct inode
*inode
)
12 if (EXT4_JOURNAL(inode
) == NULL
)
13 return EXT4_INODE_WRITEBACK_DATA_MODE
; /* writeback */
14 /* We do not support data journalling with delayed allocation */
15 if (!S_ISREG(inode
->i_mode
) ||
16 ext4_test_inode_flag(inode
, EXT4_INODE_EA_INODE
) ||
17 test_opt(inode
->i_sb
, DATA_FLAGS
) == EXT4_MOUNT_JOURNAL_DATA
||
18 (ext4_test_inode_flag(inode
, EXT4_INODE_JOURNAL_DATA
) &&
19 !test_opt(inode
->i_sb
, DELALLOC
))) {
20 /* We do not support data journalling for encrypted data */
21 if (S_ISREG(inode
->i_mode
) && IS_ENCRYPTED(inode
))
22 return EXT4_INODE_ORDERED_DATA_MODE
; /* ordered */
23 return EXT4_INODE_JOURNAL_DATA_MODE
; /* journal data */
25 if (test_opt(inode
->i_sb
, DATA_FLAGS
) == EXT4_MOUNT_ORDERED_DATA
)
26 return EXT4_INODE_ORDERED_DATA_MODE
; /* ordered */
27 if (test_opt(inode
->i_sb
, DATA_FLAGS
) == EXT4_MOUNT_WRITEBACK_DATA
)
28 return EXT4_INODE_WRITEBACK_DATA_MODE
; /* writeback */
32 /* Just increment the non-pointer handle value */
33 static handle_t
*ext4_get_nojournal(void)
35 handle_t
*handle
= current
->journal_info
;
36 unsigned long ref_cnt
= (unsigned long)handle
;
38 BUG_ON(ref_cnt
>= EXT4_NOJOURNAL_MAX_REF_COUNT
);
41 handle
= (handle_t
*)ref_cnt
;
43 current
->journal_info
= handle
;
48 /* Decrement the non-pointer handle value */
49 static void ext4_put_nojournal(handle_t
*handle
)
51 unsigned long ref_cnt
= (unsigned long)handle
;
56 handle
= (handle_t
*)ref_cnt
;
58 current
->journal_info
= handle
;
62 * Wrappers for jbd2_journal_start/end.
64 static int ext4_journal_check_start(struct super_block
*sb
)
70 if (unlikely(ext4_forced_shutdown(sb
)))
73 if (WARN_ON_ONCE(sb_rdonly(sb
)))
76 WARN_ON(sb
->s_writers
.frozen
== SB_FREEZE_COMPLETE
);
77 journal
= EXT4_SB(sb
)->s_journal
;
79 * Special case here: if the journal has aborted behind our
80 * backs (eg. EIO in the commit thread), then we still need to
81 * take the FS itself readonly cleanly.
83 if (journal
&& is_journal_aborted(journal
)) {
84 ext4_abort(sb
, -journal
->j_errno
, "Detected aborted journal");
90 handle_t
*__ext4_journal_start_sb(struct inode
*inode
,
91 struct super_block
*sb
, unsigned int line
,
92 int type
, int blocks
, int rsv_blocks
,
98 trace_ext4_journal_start_inode(inode
, blocks
, rsv_blocks
,
102 trace_ext4_journal_start_sb(sb
, blocks
, rsv_blocks
,
105 err
= ext4_journal_check_start(sb
);
109 journal
= EXT4_SB(sb
)->s_journal
;
110 if (!journal
|| (EXT4_SB(sb
)->s_mount_state
& EXT4_FC_REPLAY
))
111 return ext4_get_nojournal();
112 return jbd2__journal_start(journal
, blocks
, rsv_blocks
, revoke_creds
,
113 GFP_NOFS
, type
, line
);
116 int __ext4_journal_stop(const char *where
, unsigned int line
, handle_t
*handle
)
118 struct super_block
*sb
;
122 if (!ext4_handle_valid(handle
)) {
123 ext4_put_nojournal(handle
);
128 if (!handle
->h_transaction
) {
129 rc
= jbd2_journal_stop(handle
);
130 return err
? err
: rc
;
133 sb
= handle
->h_transaction
->t_journal
->j_private
;
134 rc
= jbd2_journal_stop(handle
);
139 __ext4_std_error(sb
, where
, line
, err
);
143 handle_t
*__ext4_journal_start_reserved(handle_t
*handle
, unsigned int line
,
146 struct super_block
*sb
;
149 if (!ext4_handle_valid(handle
))
150 return ext4_get_nojournal();
152 sb
= handle
->h_journal
->j_private
;
153 trace_ext4_journal_start_reserved(sb
,
154 jbd2_handle_buffer_credits(handle
), _RET_IP_
);
155 err
= ext4_journal_check_start(sb
);
157 jbd2_journal_free_reserved(handle
);
161 err
= jbd2_journal_start_reserved(handle
, type
, line
);
167 int __ext4_journal_ensure_credits(handle_t
*handle
, int check_cred
,
168 int extend_cred
, int revoke_cred
)
170 if (!ext4_handle_valid(handle
))
172 if (is_handle_aborted(handle
))
174 if (jbd2_handle_buffer_credits(handle
) >= check_cred
&&
175 handle
->h_revoke_credits
>= revoke_cred
)
177 extend_cred
= max(0, extend_cred
- jbd2_handle_buffer_credits(handle
));
178 revoke_cred
= max(0, revoke_cred
- handle
->h_revoke_credits
);
179 return ext4_journal_extend(handle
, extend_cred
, revoke_cred
);
182 static void ext4_journal_abort_handle(const char *caller
, unsigned int line
,
184 struct buffer_head
*bh
,
185 handle_t
*handle
, int err
)
188 const char *errstr
= ext4_decode_error(NULL
, err
, nbuf
);
190 BUG_ON(!ext4_handle_valid(handle
));
193 BUFFER_TRACE(bh
, "abort");
198 if (is_handle_aborted(handle
))
201 printk(KERN_ERR
"EXT4-fs: %s:%d: aborting transaction: %s in %s\n",
202 caller
, line
, errstr
, err_fn
);
204 jbd2_journal_abort_handle(handle
);
207 static void ext4_check_bdev_write_error(struct super_block
*sb
)
209 struct address_space
*mapping
= sb
->s_bdev
->bd_mapping
;
210 struct ext4_sb_info
*sbi
= EXT4_SB(sb
);
214 * If the block device has write error flag, it may have failed to
215 * async write out metadata buffers in the background. In this case,
216 * we could read old data from disk and write it out again, which
217 * may lead to on-disk filesystem inconsistency.
219 if (errseq_check(&mapping
->wb_err
, READ_ONCE(sbi
->s_bdev_wb_err
))) {
220 spin_lock(&sbi
->s_bdev_wb_lock
);
221 err
= errseq_check_and_advance(&mapping
->wb_err
, &sbi
->s_bdev_wb_err
);
222 spin_unlock(&sbi
->s_bdev_wb_lock
);
224 ext4_error_err(sb
, -err
,
225 "Error while async write back metadata");
229 int __ext4_journal_get_write_access(const char *where
, unsigned int line
,
230 handle_t
*handle
, struct super_block
*sb
,
231 struct buffer_head
*bh
,
232 enum ext4_journal_trigger_type trigger_type
)
238 if (ext4_handle_valid(handle
)) {
239 err
= jbd2_journal_get_write_access(handle
, bh
);
241 ext4_journal_abort_handle(where
, line
, __func__
, bh
,
246 ext4_check_bdev_write_error(sb
);
247 if (trigger_type
== EXT4_JTR_NONE
|| !ext4_has_metadata_csum(sb
))
249 BUG_ON(trigger_type
>= EXT4_JOURNAL_TRIGGER_COUNT
);
250 jbd2_journal_set_triggers(bh
,
251 &EXT4_SB(sb
)->s_journal_triggers
[trigger_type
].tr_triggers
);
256 * The ext4 forget function must perform a revoke if we are freeing data
257 * which has been journaled. Metadata (eg. indirect blocks) must be
258 * revoked in all cases.
260 * "bh" may be NULL: a metadata block may have been freed from memory
261 * but there may still be a record of it in the journal, and that record
262 * still needs to be revoked.
264 int __ext4_forget(const char *where
, unsigned int line
, handle_t
*handle
,
265 int is_metadata
, struct inode
*inode
,
266 struct buffer_head
*bh
, ext4_fsblk_t blocknr
)
272 trace_ext4_forget(inode
, is_metadata
, blocknr
);
273 BUFFER_TRACE(bh
, "enter");
275 ext4_debug("forgetting bh %p: is_metadata=%d, mode %o, data mode %x\n",
276 bh
, is_metadata
, inode
->i_mode
,
277 test_opt(inode
->i_sb
, DATA_FLAGS
));
279 /* In the no journal case, we can just do a bforget and return */
280 if (!ext4_handle_valid(handle
)) {
285 /* Never use the revoke function if we are doing full data
286 * journaling: there is no need to, and a V1 superblock won't
287 * support it. Otherwise, only skip the revoke on un-journaled
290 if (test_opt(inode
->i_sb
, DATA_FLAGS
) == EXT4_MOUNT_JOURNAL_DATA
||
291 (!is_metadata
&& !ext4_should_journal_data(inode
))) {
293 BUFFER_TRACE(bh
, "call jbd2_journal_forget");
294 err
= jbd2_journal_forget(handle
, bh
);
296 ext4_journal_abort_handle(where
, line
, __func__
,
304 * data!=journal && (is_metadata || should_journal_data(inode))
306 BUFFER_TRACE(bh
, "call jbd2_journal_revoke");
307 err
= jbd2_journal_revoke(handle
, blocknr
, bh
);
309 ext4_journal_abort_handle(where
, line
, __func__
,
311 __ext4_error(inode
->i_sb
, where
, line
, true, -err
, 0,
312 "error %d when attempting revoke", err
);
314 BUFFER_TRACE(bh
, "exit");
318 int __ext4_journal_get_create_access(const char *where
, unsigned int line
,
319 handle_t
*handle
, struct super_block
*sb
,
320 struct buffer_head
*bh
,
321 enum ext4_journal_trigger_type trigger_type
)
325 if (!ext4_handle_valid(handle
))
328 err
= jbd2_journal_get_create_access(handle
, bh
);
330 ext4_journal_abort_handle(where
, line
, __func__
, bh
, handle
,
334 if (trigger_type
== EXT4_JTR_NONE
|| !ext4_has_metadata_csum(sb
))
336 BUG_ON(trigger_type
>= EXT4_JOURNAL_TRIGGER_COUNT
);
337 jbd2_journal_set_triggers(bh
,
338 &EXT4_SB(sb
)->s_journal_triggers
[trigger_type
].tr_triggers
);
342 int __ext4_handle_dirty_metadata(const char *where
, unsigned int line
,
343 handle_t
*handle
, struct inode
*inode
,
344 struct buffer_head
*bh
)
352 set_buffer_uptodate(bh
);
353 if (ext4_handle_valid(handle
)) {
354 err
= jbd2_journal_dirty_metadata(handle
, bh
);
355 /* Errors can only happen due to aborted journal or a nasty bug */
356 if (!is_handle_aborted(handle
) && WARN_ON_ONCE(err
)) {
357 ext4_journal_abort_handle(where
, line
, __func__
, bh
,
360 pr_err("EXT4: jbd2_journal_dirty_metadata "
361 "failed: handle type %u started at "
362 "line %u, credits %u/%u, errcode %d",
365 handle
->h_requested_credits
,
366 jbd2_handle_buffer_credits(handle
), err
);
369 ext4_error_inode(inode
, where
, line
,
371 "journal_dirty_metadata failed: "
372 "handle type %u started at line %u, "
373 "credits %u/%u, errcode %d",
376 handle
->h_requested_credits
,
377 jbd2_handle_buffer_credits(handle
),
382 mark_buffer_dirty_inode(bh
, inode
);
384 mark_buffer_dirty(bh
);
385 if (inode
&& inode_needs_sync(inode
)) {
386 sync_dirty_buffer(bh
);
387 if (buffer_req(bh
) && !buffer_uptodate(bh
)) {
388 ext4_error_inode_err(inode
, where
, line
,
390 "IO error syncing itable block");