1 // SPDX-License-Identifier: GPL-2.0
4 * Copyright (C) 2019-2021 Paragon Software GmbH, All rights reserved.
8 #include <linux/blkdev.h>
10 #include <linux/random.h>
11 #include <linux/slab.h>
23 #define MaxLogFileSize 0x100000000ull
24 #define DefaultLogPageSize 4096
25 #define MinLogRecordPages 0x30
28 struct NTFS_RECORD_HEADER rhdr
; // 'RSTR'
29 __le32 sys_page_size
; // 0x10: Page size of the system which initialized the log.
30 __le32 page_size
; // 0x14: Log page size used for this log file.
31 __le16 ra_off
; // 0x18:
32 __le16 minor_ver
; // 0x1A:
33 __le16 major_ver
; // 0x1C:
37 #define LFS_NO_CLIENT 0xffff
38 #define LFS_NO_CLIENT_LE cpu_to_le16(0xffff)
42 __le64 restart_lsn
; // 0x08:
43 __le16 prev_client
; // 0x10:
44 __le16 next_client
; // 0x12:
45 __le16 seq_num
; // 0x14:
47 __le32 name_bytes
; // 0x1C: In bytes.
48 __le16 name
[32]; // 0x20: Name of client.
51 static_assert(sizeof(struct CLIENT_REC
) == 0x60);
53 /* Two copies of these will exist at the beginning of the log file */
55 __le64 current_lsn
; // 0x00: Current logical end of log file.
56 __le16 log_clients
; // 0x08: Maximum number of clients.
57 __le16 client_idx
[2]; // 0x0A: Free/use index into the client record arrays.
58 __le16 flags
; // 0x0E: See RESTART_SINGLE_PAGE_IO.
59 __le32 seq_num_bits
; // 0x10: The number of bits in sequence number.
60 __le16 ra_len
; // 0x14:
61 __le16 client_off
; // 0x16:
62 __le64 l_size
; // 0x18: Usable log file size.
63 __le32 last_lsn_data_len
; // 0x20:
64 __le16 rec_hdr_len
; // 0x24: Log page data offset.
65 __le16 data_off
; // 0x26: Log page data length.
66 __le32 open_log_count
; // 0x28:
67 __le32 align
[5]; // 0x2C:
68 struct CLIENT_REC clients
[]; // 0x40:
72 __le16 redo_op
; // 0x00: NTFS_LOG_OPERATION
73 __le16 undo_op
; // 0x02: NTFS_LOG_OPERATION
74 __le16 redo_off
; // 0x04: Offset to Redo record.
75 __le16 redo_len
; // 0x06: Redo length.
76 __le16 undo_off
; // 0x08: Offset to Undo record.
77 __le16 undo_len
; // 0x0A: Undo length.
78 __le16 target_attr
; // 0x0C:
79 __le16 lcns_follow
; // 0x0E:
80 __le16 record_off
; // 0x10:
81 __le16 attr_off
; // 0x12:
82 __le16 cluster_off
; // 0x14:
83 __le16 reserved
; // 0x16:
84 __le64 target_vcn
; // 0x18:
85 __le64 page_lcns
[]; // 0x20:
88 static_assert(sizeof(struct LOG_REC_HDR
) == 0x20);
90 #define RESTART_ENTRY_ALLOCATED 0xFFFFFFFF
91 #define RESTART_ENTRY_ALLOCATED_LE cpu_to_le32(0xFFFFFFFF)
93 struct RESTART_TABLE
{
94 __le16 size
; // 0x00: In bytes
95 __le16 used
; // 0x02: Entries
96 __le16 total
; // 0x04: Entries
97 __le16 res
[3]; // 0x06:
98 __le32 free_goal
; // 0x0C:
99 __le32 first_free
; // 0x10:
100 __le32 last_free
; // 0x14:
104 static_assert(sizeof(struct RESTART_TABLE
) == 0x18);
106 struct ATTR_NAME_ENTRY
{
107 __le16 off
; // Offset in the Open attribute Table.
112 struct OPEN_ATTR_ENRTY
{
113 __le32 next
; // 0x00: RESTART_ENTRY_ALLOCATED if allocated
114 __le32 bytes_per_index
; // 0x04:
115 enum ATTR_TYPE type
; // 0x08:
116 u8 is_dirty_pages
; // 0x0C:
117 u8 is_attr_name
; // 0x0B: Faked field to manage 'ptr'
118 u8 name_len
; // 0x0C: Faked field to manage 'ptr'
120 struct MFT_REF ref
; // 0x10: File Reference of file containing attribute
121 __le64 open_record_lsn
; // 0x18:
125 /* 32 bit version of 'struct OPEN_ATTR_ENRTY' */
126 struct OPEN_ATTR_ENRTY_32
{
127 __le32 next
; // 0x00: RESTART_ENTRY_ALLOCATED if allocated
129 struct MFT_REF ref
; // 0x08:
130 __le64 open_record_lsn
; // 0x10:
131 u8 is_dirty_pages
; // 0x18:
132 u8 is_attr_name
; // 0x19:
134 enum ATTR_TYPE type
; // 0x1C:
135 u8 name_len
; // 0x20: In wchar
137 __le32 AttributeName
; // 0x24:
138 __le32 bytes_per_index
; // 0x28:
141 #define SIZEOF_OPENATTRIBUTEENTRY0 0x2c
142 // static_assert( 0x2C == sizeof(struct OPEN_ATTR_ENRTY_32) );
143 static_assert(sizeof(struct OPEN_ATTR_ENRTY
) < SIZEOF_OPENATTRIBUTEENTRY0
);
146 * One entry exists in the Dirty Pages Table for each page which is dirty at
147 * the time the Restart Area is written.
149 struct DIR_PAGE_ENTRY
{
150 __le32 next
; // 0x00: RESTART_ENTRY_ALLOCATED if allocated
151 __le32 target_attr
; // 0x04: Index into the Open attribute Table
152 __le32 transfer_len
; // 0x08:
153 __le32 lcns_follow
; // 0x0C:
154 __le64 vcn
; // 0x10: Vcn of dirty page
155 __le64 oldest_lsn
; // 0x18:
156 __le64 page_lcns
[]; // 0x20:
159 static_assert(sizeof(struct DIR_PAGE_ENTRY
) == 0x20);
161 /* 32 bit version of 'struct DIR_PAGE_ENTRY' */
162 struct DIR_PAGE_ENTRY_32
{
163 __le32 next
; // 0x00: RESTART_ENTRY_ALLOCATED if allocated
164 __le32 target_attr
; // 0x04: Index into the Open attribute Table
165 __le32 transfer_len
; // 0x08:
166 __le32 lcns_follow
; // 0x0C:
167 __le32 reserved
; // 0x10:
168 __le32 vcn_low
; // 0x14: Vcn of dirty page
169 __le32 vcn_hi
; // 0x18: Vcn of dirty page
170 __le32 oldest_lsn_low
; // 0x1C:
171 __le32 oldest_lsn_hi
; // 0x1C:
172 __le32 page_lcns_low
; // 0x24:
173 __le32 page_lcns_hi
; // 0x24:
176 static_assert(offsetof(struct DIR_PAGE_ENTRY_32
, vcn_low
) == 0x14);
177 static_assert(sizeof(struct DIR_PAGE_ENTRY_32
) == 0x2c);
179 enum transact_state
{
180 TransactionUninitialized
= 0,
186 struct TRANSACTION_ENTRY
{
187 __le32 next
; // 0x00: RESTART_ENTRY_ALLOCATED if allocated
188 u8 transact_state
; // 0x04:
189 u8 reserved
[3]; // 0x05:
190 __le64 first_lsn
; // 0x08:
191 __le64 prev_lsn
; // 0x10:
192 __le64 undo_next_lsn
; // 0x18:
193 __le32 undo_records
; // 0x20: Number of undo log records pending abort
194 __le32 undo_len
; // 0x24: Total undo size
197 static_assert(sizeof(struct TRANSACTION_ENTRY
) == 0x28);
199 struct NTFS_RESTART
{
200 __le32 major_ver
; // 0x00:
201 __le32 minor_ver
; // 0x04:
202 __le64 check_point_start
; // 0x08:
203 __le64 open_attr_table_lsn
; // 0x10:
204 __le64 attr_names_lsn
; // 0x18:
205 __le64 dirty_pages_table_lsn
; // 0x20:
206 __le64 transact_table_lsn
; // 0x28:
207 __le32 open_attr_len
; // 0x30: In bytes
208 __le32 attr_names_len
; // 0x34: In bytes
209 __le32 dirty_pages_len
; // 0x38: In bytes
210 __le32 transact_table_len
; // 0x3C: In bytes
213 static_assert(sizeof(struct NTFS_RESTART
) == 0x40);
215 struct NEW_ATTRIBUTE_SIZES
{
222 struct BITMAP_RANGE
{
232 /* The following type defines the different log record types. */
233 #define LfsClientRecord cpu_to_le32(1)
234 #define LfsClientRestart cpu_to_le32(2)
236 /* This is used to uniquely identify a client for a particular log file. */
242 /* This is the header that begins every Log Record in the log file. */
243 struct LFS_RECORD_HDR
{
244 __le64 this_lsn
; // 0x00:
245 __le64 client_prev_lsn
; // 0x08:
246 __le64 client_undo_next_lsn
; // 0x10:
247 __le32 client_data_len
; // 0x18:
248 struct CLIENT_ID client
; // 0x1C: Owner of this log record.
249 __le32 record_type
; // 0x20: LfsClientRecord or LfsClientRestart.
250 __le32 transact_id
; // 0x24:
251 __le16 flags
; // 0x28: LOG_RECORD_MULTI_PAGE
252 u8 align
[6]; // 0x2A:
255 #define LOG_RECORD_MULTI_PAGE cpu_to_le16(1)
257 static_assert(sizeof(struct LFS_RECORD_HDR
) == 0x30);
260 __le16 next_record_off
; // 0x00: Offset of the free space in the page,
261 u8 align
[6]; // 0x02:
262 __le64 last_end_lsn
; // 0x08: lsn for the last log record which ends on the page,
265 static_assert(sizeof(struct LFS_RECORD
) == 0x10);
267 struct RECORD_PAGE_HDR
{
268 struct NTFS_RECORD_HEADER rhdr
; // 'RCRD'
269 __le32 rflags
; // 0x10: See LOG_PAGE_LOG_RECORD_END
270 __le16 page_count
; // 0x14:
271 __le16 page_pos
; // 0x16:
272 struct LFS_RECORD record_hdr
; // 0x18:
273 __le16 fixups
[10]; // 0x28:
274 __le32 file_off
; // 0x3c: Used when major version >= 2
279 // Page contains the end of a log record.
280 #define LOG_PAGE_LOG_RECORD_END cpu_to_le32(0x00000001)
282 static inline bool is_log_record_end(const struct RECORD_PAGE_HDR
*hdr
)
284 return hdr
->rflags
& LOG_PAGE_LOG_RECORD_END
;
287 static_assert(offsetof(struct RECORD_PAGE_HDR
, file_off
) == 0x3c);
290 * END of NTFS LOG structures
293 /* Define some tuning parameters to keep the restart tables a reasonable size. */
294 #define INITIAL_NUMBER_TRANSACTIONS 5
296 enum NTFS_LOG_OPERATION
{
299 CompensationLogRecord
= 0x01,
300 InitializeFileRecordSegment
= 0x02,
301 DeallocateFileRecordSegment
= 0x03,
302 WriteEndOfFileRecordSegment
= 0x04,
303 CreateAttribute
= 0x05,
304 DeleteAttribute
= 0x06,
305 UpdateResidentValue
= 0x07,
306 UpdateNonresidentValue
= 0x08,
307 UpdateMappingPairs
= 0x09,
308 DeleteDirtyClusters
= 0x0A,
309 SetNewAttributeSizes
= 0x0B,
310 AddIndexEntryRoot
= 0x0C,
311 DeleteIndexEntryRoot
= 0x0D,
312 AddIndexEntryAllocation
= 0x0E,
313 DeleteIndexEntryAllocation
= 0x0F,
314 WriteEndOfIndexBuffer
= 0x10,
315 SetIndexEntryVcnRoot
= 0x11,
316 SetIndexEntryVcnAllocation
= 0x12,
317 UpdateFileNameRoot
= 0x13,
318 UpdateFileNameAllocation
= 0x14,
319 SetBitsInNonresidentBitMap
= 0x15,
320 ClearBitsInNonresidentBitMap
= 0x16,
322 EndTopLevelAction
= 0x18,
323 PrepareTransaction
= 0x19,
324 CommitTransaction
= 0x1A,
325 ForgetTransaction
= 0x1B,
326 OpenNonresidentAttribute
= 0x1C,
327 OpenAttributeTableDump
= 0x1D,
328 AttributeNamesDump
= 0x1E,
329 DirtyPageTableDump
= 0x1F,
330 TransactionTableDump
= 0x20,
331 UpdateRecordDataRoot
= 0x21,
332 UpdateRecordDataAllocation
= 0x22,
334 UpdateRelativeDataInIndex
=
335 0x23, // NtOfsRestartUpdateRelativeDataInIndex
336 UpdateRelativeDataInIndex2
= 0x24,
337 ZeroEndOfFileRecord
= 0x25,
341 * Array for log records which require a target attribute.
342 * A true indicates that the corresponding restart operation
343 * requires a target attribute.
345 static const u8 AttributeRequired
[] = {
346 0xFC, 0xFB, 0xFF, 0x10, 0x06,
349 static inline bool is_target_required(u16 op
)
351 bool ret
= op
<= UpdateRecordDataAllocation
&&
352 (AttributeRequired
[op
>> 3] >> (op
& 7) & 1);
356 static inline bool can_skip_action(enum NTFS_LOG_OPERATION op
)
360 case DeleteDirtyClusters
:
362 case EndTopLevelAction
:
363 case PrepareTransaction
:
364 case CommitTransaction
:
365 case ForgetTransaction
:
366 case CompensationLogRecord
:
367 case OpenNonresidentAttribute
:
368 case OpenAttributeTableDump
:
369 case AttributeNamesDump
:
370 case DirtyPageTableDump
:
371 case TransactionTableDump
:
378 enum { lcb_ctx_undo_next
, lcb_ctx_prev
, lcb_ctx_next
};
380 /* Bytes per restart table. */
381 static inline u32
bytes_per_rt(const struct RESTART_TABLE
*rt
)
383 return le16_to_cpu(rt
->used
) * le16_to_cpu(rt
->size
) +
384 sizeof(struct RESTART_TABLE
);
387 /* Log record length. */
388 static inline u32
lrh_length(const struct LOG_REC_HDR
*lr
)
390 u16 t16
= le16_to_cpu(lr
->lcns_follow
);
392 return struct_size(lr
, page_lcns
, max_t(u16
, 1, t16
));
396 struct LFS_RECORD_HDR
*lrh
; // Log record header of the current lsn.
397 struct LOG_REC_HDR
*log_rec
;
398 u32 ctx_mode
; // lcb_ctx_undo_next/lcb_ctx_prev/lcb_ctx_next
399 struct CLIENT_ID client
;
400 bool alloc
; // If true the we should deallocate 'log_rec'.
403 static void lcb_put(struct lcb
*lcb
)
411 /* Find the oldest lsn from active clients. */
412 static inline void oldest_client_lsn(const struct CLIENT_REC
*ca
,
413 __le16 next_client
, u64
*oldest_lsn
)
415 while (next_client
!= LFS_NO_CLIENT_LE
) {
416 const struct CLIENT_REC
*cr
= ca
+ le16_to_cpu(next_client
);
417 u64 lsn
= le64_to_cpu(cr
->oldest_lsn
);
419 /* Ignore this block if it's oldest lsn is 0. */
420 if (lsn
&& lsn
< *oldest_lsn
)
423 next_client
= cr
->next_client
;
427 static inline bool is_rst_page_hdr_valid(u32 file_off
,
428 const struct RESTART_HDR
*rhdr
)
430 u32 sys_page
= le32_to_cpu(rhdr
->sys_page_size
);
431 u32 page_size
= le32_to_cpu(rhdr
->page_size
);
435 if (sys_page
< SECTOR_SIZE
|| page_size
< SECTOR_SIZE
||
436 sys_page
& (sys_page
- 1) || page_size
& (page_size
- 1)) {
440 /* Check that if the file offset isn't 0, it is the system page size. */
441 if (file_off
&& file_off
!= sys_page
)
444 /* Check support version 1.1+. */
445 if (le16_to_cpu(rhdr
->major_ver
) <= 1 && !rhdr
->minor_ver
)
448 if (le16_to_cpu(rhdr
->major_ver
) > 2)
451 ro
= le16_to_cpu(rhdr
->ra_off
);
452 if (!IS_ALIGNED(ro
, 8) || ro
> sys_page
)
455 end_usa
= ((sys_page
>> SECTOR_SHIFT
) + 1) * sizeof(short);
456 end_usa
+= le16_to_cpu(rhdr
->rhdr
.fix_off
);
464 static inline bool is_rst_area_valid(const struct RESTART_HDR
*rhdr
)
466 const struct RESTART_AREA
*ra
;
468 u32 off
, l_size
, seq_bits
;
469 u16 ro
= le16_to_cpu(rhdr
->ra_off
);
470 u32 sys_page
= le32_to_cpu(rhdr
->sys_page_size
);
472 if (ro
+ offsetof(struct RESTART_AREA
, l_size
) >
473 SECTOR_SIZE
- sizeof(short))
476 ra
= Add2Ptr(rhdr
, ro
);
477 cl
= le16_to_cpu(ra
->log_clients
);
482 off
= le16_to_cpu(ra
->client_off
);
484 if (!IS_ALIGNED(off
, 8) || ro
+ off
> SECTOR_SIZE
- sizeof(short))
487 off
+= cl
* sizeof(struct CLIENT_REC
);
493 * Check the restart length field and whether the entire
494 * restart area is contained that length.
496 if (le16_to_cpu(rhdr
->ra_off
) + le16_to_cpu(ra
->ra_len
) > sys_page
||
497 off
> le16_to_cpu(ra
->ra_len
)) {
502 * As a final check make sure that the use list and the free list
503 * are either empty or point to a valid client.
505 fl
= le16_to_cpu(ra
->client_idx
[0]);
506 ul
= le16_to_cpu(ra
->client_idx
[1]);
507 if ((fl
!= LFS_NO_CLIENT
&& fl
>= cl
) ||
508 (ul
!= LFS_NO_CLIENT
&& ul
>= cl
))
511 /* Make sure the sequence number bits match the log file size. */
512 l_size
= le64_to_cpu(ra
->l_size
);
514 seq_bits
= sizeof(u64
) * 8 + 3;
520 if (seq_bits
!= le32_to_cpu(ra
->seq_num_bits
))
523 /* The log page data offset and record header length must be quad-aligned. */
524 if (!IS_ALIGNED(le16_to_cpu(ra
->data_off
), 8) ||
525 !IS_ALIGNED(le16_to_cpu(ra
->rec_hdr_len
), 8))
531 static inline bool is_client_area_valid(const struct RESTART_HDR
*rhdr
,
534 u16 ro
= le16_to_cpu(rhdr
->ra_off
);
535 const struct RESTART_AREA
*ra
= Add2Ptr(rhdr
, ro
);
536 u16 ra_len
= le16_to_cpu(ra
->ra_len
);
537 const struct CLIENT_REC
*ca
;
540 if (usa_error
&& ra_len
+ ro
> SECTOR_SIZE
- sizeof(short))
543 /* Find the start of the client array. */
544 ca
= Add2Ptr(ra
, le16_to_cpu(ra
->client_off
));
547 * Start with the free list.
548 * Check that all the clients are valid and that there isn't a cycle.
549 * Do the in-use list on the second pass.
551 for (i
= 0; i
< 2; i
++) {
552 u16 client_idx
= le16_to_cpu(ra
->client_idx
[i
]);
553 bool first_client
= true;
554 u16 clients
= le16_to_cpu(ra
->log_clients
);
556 while (client_idx
!= LFS_NO_CLIENT
) {
557 const struct CLIENT_REC
*cr
;
560 client_idx
>= le16_to_cpu(ra
->log_clients
))
564 cr
= ca
+ client_idx
;
566 client_idx
= le16_to_cpu(cr
->next_client
);
569 first_client
= false;
570 if (cr
->prev_client
!= LFS_NO_CLIENT_LE
)
582 * Remove a client record from a client record list an restart area.
584 static inline void remove_client(struct CLIENT_REC
*ca
,
585 const struct CLIENT_REC
*cr
, __le16
*head
)
587 if (cr
->prev_client
== LFS_NO_CLIENT_LE
)
588 *head
= cr
->next_client
;
590 ca
[le16_to_cpu(cr
->prev_client
)].next_client
= cr
->next_client
;
592 if (cr
->next_client
!= LFS_NO_CLIENT_LE
)
593 ca
[le16_to_cpu(cr
->next_client
)].prev_client
= cr
->prev_client
;
597 * add_client - Add a client record to the start of a list.
599 static inline void add_client(struct CLIENT_REC
*ca
, u16 index
, __le16
*head
)
601 struct CLIENT_REC
*cr
= ca
+ index
;
603 cr
->prev_client
= LFS_NO_CLIENT_LE
;
604 cr
->next_client
= *head
;
606 if (*head
!= LFS_NO_CLIENT_LE
)
607 ca
[le16_to_cpu(*head
)].prev_client
= cpu_to_le16(index
);
609 *head
= cpu_to_le16(index
);
613 * Enumerate restart table.
615 * @t - table to enumerate.
616 * @c - current enumerated element.
618 * enumeration starts with @c == NULL
619 * returns next element or NULL
621 static inline void *enum_rstbl(struct RESTART_TABLE
*t
, void *c
)
630 rsize
= le16_to_cpu(t
->size
);
633 /* start enumeration. */
636 e
= Add2Ptr(t
, sizeof(struct RESTART_TABLE
));
638 e
= Add2Ptr(c
, rsize
);
641 /* Loop until we hit the first one allocated, or the end of the list. */
642 for (bprt
= bytes_per_rt(t
); PtrOffset(t
, e
) < bprt
;
643 e
= Add2Ptr(e
, rsize
)) {
644 if (*e
== RESTART_ENTRY_ALLOCATED_LE
)
651 * find_dp - Search for a @vcn in Dirty Page Table.
653 static inline struct DIR_PAGE_ENTRY
*find_dp(struct RESTART_TABLE
*dptbl
,
654 u32 target_attr
, u64 vcn
)
656 __le32 ta
= cpu_to_le32(target_attr
);
657 struct DIR_PAGE_ENTRY
*dp
= NULL
;
659 while ((dp
= enum_rstbl(dptbl
, dp
))) {
660 u64 dp_vcn
= le64_to_cpu(dp
->vcn
);
662 if (dp
->target_attr
== ta
&& vcn
>= dp_vcn
&&
663 vcn
< dp_vcn
+ le32_to_cpu(dp
->lcns_follow
)) {
670 static inline u32
norm_file_page(u32 page_size
, u32
*l_size
, bool use_default
)
673 page_size
= DefaultLogPageSize
;
675 /* Round the file size down to a system page boundary. */
676 *l_size
&= ~(page_size
- 1);
678 /* File should contain at least 2 restart pages and MinLogRecordPages pages. */
679 if (*l_size
< (MinLogRecordPages
+ 2) * page_size
)
685 static bool check_log_rec(const struct LOG_REC_HDR
*lr
, u32 bytes
, u32 tr
,
686 u32 bytes_per_attr_entry
)
690 if (bytes
< sizeof(struct LOG_REC_HDR
))
695 if ((tr
- sizeof(struct RESTART_TABLE
)) %
696 sizeof(struct TRANSACTION_ENTRY
))
699 if (le16_to_cpu(lr
->redo_off
) & 7)
702 if (le16_to_cpu(lr
->undo_off
) & 7)
708 if (is_target_required(le16_to_cpu(lr
->redo_op
)))
711 if (is_target_required(le16_to_cpu(lr
->undo_op
)))
715 if (!lr
->lcns_follow
)
718 t16
= le16_to_cpu(lr
->target_attr
);
719 if ((t16
- sizeof(struct RESTART_TABLE
)) % bytes_per_attr_entry
)
723 if (bytes
< lrh_length(lr
))
729 static bool check_rstbl(const struct RESTART_TABLE
*rt
, size_t bytes
)
733 u16 rsize
= le16_to_cpu(rt
->size
);
734 u16 ne
= le16_to_cpu(rt
->used
);
735 u32 ff
= le32_to_cpu(rt
->first_free
);
736 u32 lf
= le32_to_cpu(rt
->last_free
);
738 ts
= rsize
* ne
+ sizeof(struct RESTART_TABLE
);
740 if (!rsize
|| rsize
> bytes
||
741 rsize
+ sizeof(struct RESTART_TABLE
) > bytes
|| bytes
< ts
||
742 le16_to_cpu(rt
->total
) > ne
|| ff
> ts
- sizeof(__le32
) ||
743 lf
> ts
- sizeof(__le32
) ||
744 (ff
&& ff
< sizeof(struct RESTART_TABLE
)) ||
745 (lf
&& lf
< sizeof(struct RESTART_TABLE
))) {
750 * Verify each entry is either allocated or points
751 * to a valid offset the table.
753 for (i
= 0; i
< ne
; i
++) {
754 off
= le32_to_cpu(*(__le32
*)Add2Ptr(
755 rt
, i
* rsize
+ sizeof(struct RESTART_TABLE
)));
757 if (off
!= RESTART_ENTRY_ALLOCATED
&& off
&&
758 (off
< sizeof(struct RESTART_TABLE
) ||
759 ((off
- sizeof(struct RESTART_TABLE
)) % rsize
))) {
765 * Walk through the list headed by the first entry to make
766 * sure none of the entries are currently being used.
768 for (off
= ff
; off
;) {
769 if (off
== RESTART_ENTRY_ALLOCATED
)
772 off
= le32_to_cpu(*(__le32
*)Add2Ptr(rt
, off
));
774 if (off
> ts
- sizeof(__le32
))
782 * free_rsttbl_idx - Free a previously allocated index a Restart Table.
784 static inline void free_rsttbl_idx(struct RESTART_TABLE
*rt
, u32 off
)
787 u32 lf
= le32_to_cpu(rt
->last_free
);
788 __le32 off_le
= cpu_to_le32(off
);
790 e
= Add2Ptr(rt
, off
);
792 if (off
< le32_to_cpu(rt
->free_goal
)) {
794 rt
->first_free
= off_le
;
796 rt
->last_free
= off_le
;
799 *(__le32
*)Add2Ptr(rt
, lf
) = off_le
;
801 rt
->first_free
= off_le
;
803 rt
->last_free
= off_le
;
807 le16_sub_cpu(&rt
->total
, 1);
810 static inline struct RESTART_TABLE
*init_rsttbl(u16 esize
, u16 used
)
812 __le32
*e
, *last_free
;
814 u32 bytes
= esize
* used
+ sizeof(struct RESTART_TABLE
);
815 u32 lf
= sizeof(struct RESTART_TABLE
) + (used
- 1) * esize
;
816 struct RESTART_TABLE
*t
= kzalloc(bytes
, GFP_NOFS
);
821 t
->size
= cpu_to_le16(esize
);
822 t
->used
= cpu_to_le16(used
);
823 t
->free_goal
= cpu_to_le32(~0u);
824 t
->first_free
= cpu_to_le32(sizeof(struct RESTART_TABLE
));
825 t
->last_free
= cpu_to_le32(lf
);
827 e
= (__le32
*)(t
+ 1);
828 last_free
= Add2Ptr(t
, lf
);
830 for (off
= sizeof(struct RESTART_TABLE
) + esize
; e
< last_free
;
831 e
= Add2Ptr(e
, esize
), off
+= esize
) {
832 *e
= cpu_to_le32(off
);
837 static inline struct RESTART_TABLE
*extend_rsttbl(struct RESTART_TABLE
*tbl
,
838 u32 add
, u32 free_goal
)
840 u16 esize
= le16_to_cpu(tbl
->size
);
841 __le32 osize
= cpu_to_le32(bytes_per_rt(tbl
));
842 u32 used
= le16_to_cpu(tbl
->used
);
843 struct RESTART_TABLE
*rt
;
845 rt
= init_rsttbl(esize
, used
+ add
);
849 memcpy(rt
+ 1, tbl
+ 1, esize
* used
);
851 rt
->free_goal
= free_goal
== ~0u ?
853 cpu_to_le32(sizeof(struct RESTART_TABLE
) +
856 if (tbl
->first_free
) {
857 rt
->first_free
= tbl
->first_free
;
858 *(__le32
*)Add2Ptr(rt
, le32_to_cpu(tbl
->last_free
)) = osize
;
860 rt
->first_free
= osize
;
863 rt
->total
= tbl
->total
;
872 * Allocate an index from within a previously initialized Restart Table.
874 static inline void *alloc_rsttbl_idx(struct RESTART_TABLE
**tbl
)
878 struct RESTART_TABLE
*t
= *tbl
;
880 if (!t
->first_free
) {
881 *tbl
= t
= extend_rsttbl(t
, 16, ~0u);
886 off
= le32_to_cpu(t
->first_free
);
888 /* Dequeue this entry and zero it. */
893 memset(e
, 0, le16_to_cpu(t
->size
));
895 *e
= RESTART_ENTRY_ALLOCATED_LE
;
897 /* If list is going empty, then we fix the last_free as well. */
901 le16_add_cpu(&t
->total
, 1);
903 return Add2Ptr(t
, off
);
907 * alloc_rsttbl_from_idx
909 * Allocate a specific index from within a previously initialized Restart Table.
911 static inline void *alloc_rsttbl_from_idx(struct RESTART_TABLE
**tbl
, u32 vbo
)
915 struct RESTART_TABLE
*rt
= *tbl
;
916 u32 bytes
= bytes_per_rt(rt
);
917 u16 esize
= le16_to_cpu(rt
->size
);
919 /* If the entry is not the table, we will have to extend the table. */
922 * Extend the size by computing the number of entries between
923 * the existing size and the desired index and adding 1 to that.
925 u32 bytes2idx
= vbo
- bytes
;
928 * There should always be an integral number of entries
929 * being added. Now extend the table.
931 *tbl
= rt
= extend_rsttbl(rt
, bytes2idx
/ esize
+ 1, bytes
);
936 /* See if the entry is already allocated, and just return if it is. */
937 e
= Add2Ptr(rt
, vbo
);
939 if (*e
== RESTART_ENTRY_ALLOCATED_LE
)
943 * Walk through the table, looking for the entry we're
944 * interested and the previous entry.
946 off
= le32_to_cpu(rt
->first_free
);
947 e
= Add2Ptr(rt
, off
);
950 /* this is a match */
956 * Need to walk through the list looking for the predecessor
960 /* Remember the entry just found */
964 /* Should never run of entries. */
966 /* Lookup up the next entry the list. */
967 off
= le32_to_cpu(*last_e
);
968 e
= Add2Ptr(rt
, off
);
970 /* If this is our match we are done. */
975 * If this was the last entry, we update that
978 if (le32_to_cpu(rt
->last_free
) == off
)
979 rt
->last_free
= cpu_to_le32(last_off
);
985 /* If the list is now empty, we fix the last_free as well. */
989 /* Zero this entry. */
991 *e
= RESTART_ENTRY_ALLOCATED_LE
;
993 le16_add_cpu(&rt
->total
, 1);
998 struct restart_info
{
1000 struct RESTART_HDR
*r_page
;
1002 bool chkdsk_was_run
;
1008 #define RESTART_SINGLE_PAGE_IO cpu_to_le16(0x0001)
1010 #define NTFSLOG_WRAPPED 0x00000001
1011 #define NTFSLOG_MULTIPLE_PAGE_IO 0x00000002
1012 #define NTFSLOG_NO_LAST_LSN 0x00000004
1013 #define NTFSLOG_REUSE_TAIL 0x00000010
1014 #define NTFSLOG_NO_OLDEST_LSN 0x00000020
1016 /* Helper struct to work with NTFS $LogFile. */
1018 struct ntfs_inode
*ni
;
1025 u32 page_mask
; // page_size - 1
1027 struct RECORD_PAGE_HDR
*one_page_buf
;
1029 struct RESTART_TABLE
*open_attr_tbl
;
1039 u16 record_header_len
;
1043 u32 seq_num_mask
; /* (1 << file_data_bits) - 1 */
1045 struct RESTART_AREA
*ra
; /* In-memory image of the next restart area. */
1046 u32 ra_size
; /* The usable size of the restart area. */
1049 * If true, then the in-memory restart area is to be written
1050 * to the first position on the disk.
1053 bool set_dirty
; /* True if we need to set dirty flag. */
1061 u32 total_avail_pages
;
1062 u32 total_undo_commit
;
1063 u32 max_current_avail
;
1070 u32 l_flags
; /* See NTFSLOG_XXX */
1071 u32 current_openlog_count
; /* On-disk value for open_log_count. */
1073 struct CLIENT_ID client_id
;
1074 u32 client_undo_commit
;
1076 struct restart_info rst_info
, rst_info2
;
1079 static inline u32
lsn_to_vbo(struct ntfs_log
*log
, const u64 lsn
)
1081 u32 vbo
= (lsn
<< log
->seq_num_bits
) >> (log
->seq_num_bits
- 3);
1086 /* Compute the offset in the log file of the next log page. */
1087 static inline u32
next_page_off(struct ntfs_log
*log
, u32 off
)
1089 off
= (off
& ~log
->sys_page_mask
) + log
->page_size
;
1090 return off
>= log
->l_size
? log
->first_page
: off
;
1093 static inline u32
lsn_to_page_off(struct ntfs_log
*log
, u64 lsn
)
1095 return (((u32
)lsn
) << 3) & log
->page_mask
;
1098 static inline u64
vbo_to_lsn(struct ntfs_log
*log
, u32 off
, u64 Seq
)
1100 return (off
>> 3) + (Seq
<< log
->file_data_bits
);
1103 static inline bool is_lsn_in_file(struct ntfs_log
*log
, u64 lsn
)
1105 return lsn
>= log
->oldest_lsn
&&
1106 lsn
<= le64_to_cpu(log
->ra
->current_lsn
);
1109 static inline u32
hdr_file_off(struct ntfs_log
*log
,
1110 struct RECORD_PAGE_HDR
*hdr
)
1112 if (log
->major_ver
< 2)
1113 return le64_to_cpu(hdr
->rhdr
.lsn
);
1115 return le32_to_cpu(hdr
->file_off
);
1118 static inline u64
base_lsn(struct ntfs_log
*log
,
1119 const struct RECORD_PAGE_HDR
*hdr
, u64 lsn
)
1121 u64 h_lsn
= le64_to_cpu(hdr
->rhdr
.lsn
);
1122 u64 ret
= (((h_lsn
>> log
->file_data_bits
) +
1123 (lsn
< (lsn_to_vbo(log
, h_lsn
) & ~log
->page_mask
) ? 1 : 0))
1124 << log
->file_data_bits
) +
1125 ((((is_log_record_end(hdr
) &&
1126 h_lsn
<= le64_to_cpu(hdr
->record_hdr
.last_end_lsn
)) ?
1127 le16_to_cpu(hdr
->record_hdr
.next_record_off
) :
1135 static inline bool verify_client_lsn(struct ntfs_log
*log
,
1136 const struct CLIENT_REC
*client
, u64 lsn
)
1138 return lsn
>= le64_to_cpu(client
->oldest_lsn
) &&
1139 lsn
<= le64_to_cpu(log
->ra
->current_lsn
) && lsn
;
1142 static int read_log_page(struct ntfs_log
*log
, u32 vbo
,
1143 struct RECORD_PAGE_HDR
**buffer
, bool *usa_error
)
1146 u32 page_idx
= vbo
>> log
->page_bits
;
1147 u32 page_off
= vbo
& log
->page_mask
;
1148 u32 bytes
= log
->page_size
- page_off
;
1149 void *to_free
= NULL
;
1150 u32 page_vbo
= page_idx
<< log
->page_bits
;
1151 struct RECORD_PAGE_HDR
*page_buf
;
1152 struct ntfs_inode
*ni
= log
->ni
;
1155 if (vbo
>= log
->l_size
)
1159 to_free
= kmalloc(log
->page_size
, GFP_NOFS
);
1165 page_buf
= page_off
? log
->one_page_buf
: *buffer
;
1167 err
= ntfs_read_run_nb(ni
->mi
.sbi
, &ni
->file
.run
, page_vbo
, page_buf
,
1168 log
->page_size
, NULL
);
1172 if (page_buf
->rhdr
.sign
!= NTFS_FFFF_SIGNATURE
)
1173 ntfs_fix_post_read(&page_buf
->rhdr
, PAGE_SIZE
, false);
1175 if (page_buf
!= *buffer
)
1176 memcpy(*buffer
, Add2Ptr(page_buf
, page_off
), bytes
);
1178 bBAAD
= page_buf
->rhdr
.sign
== NTFS_BAAD_SIGNATURE
;
1182 /* Check that the update sequence array for this page is valid */
1183 /* If we don't allow errors, raise an error status */
1188 if (err
&& to_free
) {
1199 * It walks through 512 blocks of the file looking for a valid
1200 * restart page header. It will stop the first time we find a
1201 * valid page header.
1203 static int log_read_rst(struct ntfs_log
*log
, bool first
,
1204 struct restart_info
*info
)
1208 struct RESTART_HDR
*r_page
= NULL
;
1210 /* Determine which restart area we are looking for. */
1219 /* Loop continuously until we succeed. */
1220 for (; vbo
< log
->l_size
; vbo
= 2 * vbo
+ skip
, skip
= 0) {
1223 struct RESTART_AREA
*ra
;
1225 /* Read a page header at the current offset. */
1226 if (read_log_page(log
, vbo
, (struct RECORD_PAGE_HDR
**)&r_page
,
1228 /* Ignore any errors. */
1232 /* Exit if the signature is a log record page. */
1233 if (r_page
->rhdr
.sign
== NTFS_RCRD_SIGNATURE
) {
1234 info
->initialized
= true;
1238 brst
= r_page
->rhdr
.sign
== NTFS_RSTR_SIGNATURE
;
1239 bchk
= r_page
->rhdr
.sign
== NTFS_CHKD_SIGNATURE
;
1241 if (!bchk
&& !brst
) {
1242 if (r_page
->rhdr
.sign
!= NTFS_FFFF_SIGNATURE
) {
1244 * Remember if the signature does not
1245 * indicate uninitialized file.
1247 info
->initialized
= true;
1253 info
->valid_page
= false;
1254 info
->initialized
= true;
1257 /* Let's check the restart area if this is a valid page. */
1258 if (!is_rst_page_hdr_valid(vbo
, r_page
))
1260 ra
= Add2Ptr(r_page
, le16_to_cpu(r_page
->ra_off
));
1262 if (!is_rst_area_valid(r_page
))
1266 * We have a valid restart page header and restart area.
1267 * If chkdsk was run or we have no clients then we have
1268 * no more checking to do.
1270 if (bchk
|| ra
->client_idx
[1] == LFS_NO_CLIENT_LE
) {
1271 info
->valid_page
= true;
1275 if (is_client_area_valid(r_page
, usa_error
)) {
1276 info
->valid_page
= true;
1277 ra
= Add2Ptr(r_page
, le16_to_cpu(r_page
->ra_off
));
1282 * If chkdsk was run then update the caller's
1283 * values and return.
1285 if (r_page
->rhdr
.sign
== NTFS_CHKD_SIGNATURE
) {
1286 info
->chkdsk_was_run
= true;
1287 info
->last_lsn
= le64_to_cpu(r_page
->rhdr
.lsn
);
1288 info
->restart
= true;
1289 info
->r_page
= r_page
;
1294 * If we have a valid page then copy the values
1297 if (info
->valid_page
) {
1298 info
->last_lsn
= le64_to_cpu(ra
->current_lsn
);
1299 info
->restart
= true;
1300 info
->r_page
= r_page
;
1311 * Ilog_init_pg_hdr - Init @log from restart page header.
1313 static void log_init_pg_hdr(struct ntfs_log
*log
, u16 major_ver
, u16 minor_ver
)
1315 log
->sys_page_size
= log
->page_size
;
1316 log
->sys_page_mask
= log
->page_mask
;
1318 log
->clst_per_page
= log
->page_size
>> log
->ni
->mi
.sbi
->cluster_bits
;
1319 if (!log
->clst_per_page
)
1320 log
->clst_per_page
= 1;
1322 log
->first_page
= major_ver
>= 2 ? 0x22 * log
->page_size
:
1324 log
->major_ver
= major_ver
;
1325 log
->minor_ver
= minor_ver
;
1329 * log_create - Init @log in cases when we don't have a restart area to use.
1331 static void log_create(struct ntfs_log
*log
, const u64 last_lsn
,
1332 u32 open_log_count
, bool wrapped
, bool use_multi_page
)
1334 /* All file offsets must be quadword aligned. */
1335 log
->file_data_bits
= blksize_bits(log
->l_size
) - 3;
1336 log
->seq_num_mask
= (8 << log
->file_data_bits
) - 1;
1337 log
->seq_num_bits
= sizeof(u64
) * 8 - log
->file_data_bits
;
1338 log
->seq_num
= (last_lsn
>> log
->file_data_bits
) + 2;
1339 log
->next_page
= log
->first_page
;
1340 log
->oldest_lsn
= log
->seq_num
<< log
->file_data_bits
;
1341 log
->oldest_lsn_off
= 0;
1342 log
->last_lsn
= log
->oldest_lsn
;
1344 log
->l_flags
|= NTFSLOG_NO_LAST_LSN
| NTFSLOG_NO_OLDEST_LSN
;
1346 /* Set the correct flags for the I/O and indicate if we have wrapped. */
1348 log
->l_flags
|= NTFSLOG_WRAPPED
;
1351 log
->l_flags
|= NTFSLOG_MULTIPLE_PAGE_IO
;
1353 /* Compute the log page values. */
1354 log
->data_off
= ALIGN(
1355 offsetof(struct RECORD_PAGE_HDR
, fixups
) +
1356 sizeof(short) * ((log
->page_size
>> SECTOR_SHIFT
) + 1),
1358 log
->data_size
= log
->page_size
- log
->data_off
;
1359 log
->record_header_len
= sizeof(struct LFS_RECORD_HDR
);
1361 /* Remember the different page sizes for reservation. */
1362 log
->reserved
= log
->data_size
- log
->record_header_len
;
1364 /* Compute the restart page values. */
1365 log
->ra_off
= ALIGN(
1366 offsetof(struct RESTART_HDR
, fixups
) +
1368 ((log
->sys_page_size
>> SECTOR_SHIFT
) + 1),
1370 log
->restart_size
= log
->sys_page_size
- log
->ra_off
;
1371 log
->ra_size
= struct_size(log
->ra
, clients
, 1);
1372 log
->current_openlog_count
= open_log_count
;
1375 * The total available log file space is the number of
1376 * log file pages times the space available on each page.
1378 log
->total_avail_pages
= log
->l_size
- log
->first_page
;
1379 log
->total_avail
= log
->total_avail_pages
>> log
->page_bits
;
1382 * We assume that we can't use the end of the page less than
1383 * the file record size.
1384 * Then we won't need to reserve more than the caller asks for.
1386 log
->max_current_avail
= log
->total_avail
* log
->reserved
;
1387 log
->total_avail
= log
->total_avail
* log
->data_size
;
1388 log
->current_avail
= log
->max_current_avail
;
1392 * log_create_ra - Fill a restart area from the values stored in @log.
1394 static struct RESTART_AREA
*log_create_ra(struct ntfs_log
*log
)
1396 struct CLIENT_REC
*cr
;
1397 struct RESTART_AREA
*ra
= kzalloc(log
->restart_size
, GFP_NOFS
);
1402 ra
->current_lsn
= cpu_to_le64(log
->last_lsn
);
1403 ra
->log_clients
= cpu_to_le16(1);
1404 ra
->client_idx
[1] = LFS_NO_CLIENT_LE
;
1405 if (log
->l_flags
& NTFSLOG_MULTIPLE_PAGE_IO
)
1406 ra
->flags
= RESTART_SINGLE_PAGE_IO
;
1407 ra
->seq_num_bits
= cpu_to_le32(log
->seq_num_bits
);
1408 ra
->ra_len
= cpu_to_le16(log
->ra_size
);
1409 ra
->client_off
= cpu_to_le16(offsetof(struct RESTART_AREA
, clients
));
1410 ra
->l_size
= cpu_to_le64(log
->l_size
);
1411 ra
->rec_hdr_len
= cpu_to_le16(log
->record_header_len
);
1412 ra
->data_off
= cpu_to_le16(log
->data_off
);
1413 ra
->open_log_count
= cpu_to_le32(log
->current_openlog_count
+ 1);
1417 cr
->prev_client
= LFS_NO_CLIENT_LE
;
1418 cr
->next_client
= LFS_NO_CLIENT_LE
;
1423 static u32
final_log_off(struct ntfs_log
*log
, u64 lsn
, u32 data_len
)
1425 u32 base_vbo
= lsn
<< 3;
1426 u32 final_log_off
= (base_vbo
& log
->seq_num_mask
) & ~log
->page_mask
;
1427 u32 page_off
= base_vbo
& log
->page_mask
;
1428 u32 tail
= log
->page_size
- page_off
;
1432 /* Add the length of the header. */
1433 data_len
+= log
->record_header_len
;
1436 * If this lsn is contained this log page we are done.
1437 * Otherwise we need to walk through several log pages.
1439 if (data_len
> tail
) {
1441 tail
= log
->data_size
;
1442 page_off
= log
->data_off
- 1;
1445 final_log_off
= next_page_off(log
, final_log_off
);
1448 * We are done if the remaining bytes
1451 if (data_len
<= tail
)
1458 * We add the remaining bytes to our starting position on this page
1459 * and then add that value to the file offset of this log page.
1461 return final_log_off
+ data_len
+ page_off
;
1464 static int next_log_lsn(struct ntfs_log
*log
, const struct LFS_RECORD_HDR
*rh
,
1468 u64 this_lsn
= le64_to_cpu(rh
->this_lsn
);
1469 u32 vbo
= lsn_to_vbo(log
, this_lsn
);
1471 final_log_off(log
, this_lsn
, le32_to_cpu(rh
->client_data_len
));
1472 u32 hdr_off
= end
& ~log
->sys_page_mask
;
1473 u64 seq
= this_lsn
>> log
->file_data_bits
;
1474 struct RECORD_PAGE_HDR
*page
= NULL
;
1476 /* Remember if we wrapped. */
1480 /* Log page header for this page. */
1481 err
= read_log_page(log
, hdr_off
, &page
, NULL
);
1486 * If the lsn we were given was not the last lsn on this page,
1487 * then the starting offset for the next lsn is on a quad word
1488 * boundary following the last file offset for the current lsn.
1489 * Otherwise the file offset is the start of the data on the next page.
1491 if (this_lsn
== le64_to_cpu(page
->rhdr
.lsn
)) {
1492 /* If we wrapped, we need to increment the sequence number. */
1493 hdr_off
= next_page_off(log
, hdr_off
);
1494 if (hdr_off
== log
->first_page
)
1497 vbo
= hdr_off
+ log
->data_off
;
1499 vbo
= ALIGN(end
, 8);
1502 /* Compute the lsn based on the file offset and the sequence count. */
1503 *lsn
= vbo_to_lsn(log
, vbo
, seq
);
1506 * If this lsn is within the legal range for the file, we return true.
1507 * Otherwise false indicates that there are no more lsn's.
1509 if (!is_lsn_in_file(log
, *lsn
))
1518 * current_log_avail - Calculate the number of bytes available for log records.
1520 static u32
current_log_avail(struct ntfs_log
*log
)
1522 u32 oldest_off
, next_free_off
, free_bytes
;
1524 if (log
->l_flags
& NTFSLOG_NO_LAST_LSN
) {
1525 /* The entire file is available. */
1526 return log
->max_current_avail
;
1530 * If there is a last lsn the restart area then we know that we will
1531 * have to compute the free range.
1532 * If there is no oldest lsn then start at the first page of the file.
1534 oldest_off
= (log
->l_flags
& NTFSLOG_NO_OLDEST_LSN
) ?
1536 (log
->oldest_lsn_off
& ~log
->sys_page_mask
);
1539 * We will use the next log page offset to compute the next free page.
1540 * If we are going to reuse this page go to the next page.
1541 * If we are at the first page then use the end of the file.
1543 next_free_off
= (log
->l_flags
& NTFSLOG_REUSE_TAIL
) ?
1544 log
->next_page
+ log
->page_size
:
1545 log
->next_page
== log
->first_page
? log
->l_size
:
1548 /* If the two offsets are the same then there is no available space. */
1549 if (oldest_off
== next_free_off
)
1552 * If the free offset follows the oldest offset then subtract
1553 * this range from the total available pages.
1556 oldest_off
< next_free_off
?
1557 log
->total_avail_pages
- (next_free_off
- oldest_off
) :
1558 oldest_off
- next_free_off
;
1560 free_bytes
>>= log
->page_bits
;
1561 return free_bytes
* log
->reserved
;
1564 static bool check_subseq_log_page(struct ntfs_log
*log
,
1565 const struct RECORD_PAGE_HDR
*rp
, u32 vbo
,
1569 const struct NTFS_RECORD_HEADER
*rhdr
= &rp
->rhdr
;
1570 u64 lsn
= le64_to_cpu(rhdr
->lsn
);
1572 if (rhdr
->sign
== NTFS_FFFF_SIGNATURE
|| !rhdr
->sign
)
1576 * If the last lsn on the page occurs was written after the page
1577 * that caused the original error then we have a fatal error.
1579 lsn_seq
= lsn
>> log
->file_data_bits
;
1582 * If the sequence number for the lsn the page is equal or greater
1583 * than lsn we expect, then this is a subsequent write.
1585 return lsn_seq
>= seq
||
1586 (lsn_seq
== seq
- 1 && log
->first_page
== vbo
&&
1587 vbo
!= (lsn_to_vbo(log
, lsn
) & ~log
->page_mask
));
1593 * Walks through the log pages for a file, searching for the
1594 * last log page written to the file.
1596 static int last_log_lsn(struct ntfs_log
*log
)
1599 bool usa_error
= false;
1600 bool replace_page
= false;
1601 bool reuse_page
= log
->l_flags
& NTFSLOG_REUSE_TAIL
;
1602 bool wrapped_file
, wrapped
;
1604 u32 page_cnt
= 1, page_pos
= 1;
1605 u32 page_off
= 0, page_off1
= 0, saved_off
= 0;
1606 u32 final_off
, second_off
, final_off_prev
= 0, second_off_prev
= 0;
1607 u32 first_file_off
= 0, second_file_off
= 0;
1608 u32 part_io_count
= 0;
1610 u32 this_off
, curpage_off
, nextpage_off
, remain_pages
;
1612 u64 expected_seq
, seq_base
= 0, lsn_base
= 0;
1613 u64 best_lsn
, best_lsn1
, best_lsn2
;
1614 u64 lsn_cur
, lsn1
, lsn2
;
1615 u64 last_ok_lsn
= reuse_page
? log
->last_lsn
: 0;
1617 u16 cur_pos
, best_page_pos
;
1619 struct RECORD_PAGE_HDR
*page
= NULL
;
1620 struct RECORD_PAGE_HDR
*tst_page
= NULL
;
1621 struct RECORD_PAGE_HDR
*first_tail
= NULL
;
1622 struct RECORD_PAGE_HDR
*second_tail
= NULL
;
1623 struct RECORD_PAGE_HDR
*tail_page
= NULL
;
1624 struct RECORD_PAGE_HDR
*second_tail_prev
= NULL
;
1625 struct RECORD_PAGE_HDR
*first_tail_prev
= NULL
;
1626 struct RECORD_PAGE_HDR
*page_bufs
= NULL
;
1627 struct RECORD_PAGE_HDR
*best_page
;
1629 if (log
->major_ver
>= 2) {
1630 final_off
= 0x02 * log
->page_size
;
1631 second_off
= 0x12 * log
->page_size
;
1633 // 0x10 == 0x12 - 0x2
1634 page_bufs
= kmalloc(log
->page_size
* 0x10, GFP_NOFS
);
1638 second_off
= log
->first_page
- log
->page_size
;
1639 final_off
= second_off
- log
->page_size
;
1643 /* Read second tail page (at pos 3/0x12000). */
1644 if (read_log_page(log
, second_off
, &second_tail
, &usa_error
) ||
1645 usa_error
|| second_tail
->rhdr
.sign
!= NTFS_RCRD_SIGNATURE
) {
1648 second_file_off
= 0;
1651 second_file_off
= hdr_file_off(log
, second_tail
);
1652 lsn2
= le64_to_cpu(second_tail
->record_hdr
.last_end_lsn
);
1655 /* Read first tail page (at pos 2/0x2000). */
1656 if (read_log_page(log
, final_off
, &first_tail
, &usa_error
) ||
1657 usa_error
|| first_tail
->rhdr
.sign
!= NTFS_RCRD_SIGNATURE
) {
1663 first_file_off
= hdr_file_off(log
, first_tail
);
1664 lsn1
= le64_to_cpu(first_tail
->record_hdr
.last_end_lsn
);
1667 if (log
->major_ver
< 2) {
1670 first_tail_prev
= first_tail
;
1671 final_off_prev
= first_file_off
;
1672 second_tail_prev
= second_tail
;
1673 second_off_prev
= second_file_off
;
1676 if (!first_tail
&& !second_tail
)
1679 if (first_tail
&& second_tail
)
1680 best_page
= lsn1
< lsn2
? 1 : 0;
1681 else if (first_tail
)
1686 page_off
= best_page
? second_file_off
: first_file_off
;
1687 seq_base
= (best_page
? lsn2
: lsn1
) >> log
->file_data_bits
;
1691 best_lsn1
= first_tail
? base_lsn(log
, first_tail
, first_file_off
) : 0;
1692 best_lsn2
= second_tail
? base_lsn(log
, second_tail
, second_file_off
) :
1695 if (first_tail
&& second_tail
) {
1696 if (best_lsn1
> best_lsn2
) {
1697 best_lsn
= best_lsn1
;
1698 best_page
= first_tail
;
1699 this_off
= first_file_off
;
1701 best_lsn
= best_lsn2
;
1702 best_page
= second_tail
;
1703 this_off
= second_file_off
;
1705 } else if (first_tail
) {
1706 best_lsn
= best_lsn1
;
1707 best_page
= first_tail
;
1708 this_off
= first_file_off
;
1709 } else if (second_tail
) {
1710 best_lsn
= best_lsn2
;
1711 best_page
= second_tail
;
1712 this_off
= second_file_off
;
1717 best_page_pos
= le16_to_cpu(best_page
->page_pos
);
1720 if (best_page_pos
== page_pos
) {
1721 seq_base
= best_lsn
>> log
->file_data_bits
;
1722 saved_off
= page_off
= le32_to_cpu(best_page
->file_off
);
1723 lsn_base
= best_lsn
;
1725 memmove(page_bufs
, best_page
, log
->page_size
);
1727 page_cnt
= le16_to_cpu(best_page
->page_count
);
1733 } else if (seq_base
== (best_lsn
>> log
->file_data_bits
) &&
1734 saved_off
+ log
->page_size
== this_off
&&
1735 lsn_base
< best_lsn
&&
1736 (page_pos
!= page_cnt
|| best_page_pos
== page_pos
||
1737 best_page_pos
== 1) &&
1738 (page_pos
>= page_cnt
|| best_page_pos
== page_pos
)) {
1739 u16 bppc
= le16_to_cpu(best_page
->page_count
);
1741 saved_off
+= log
->page_size
;
1742 lsn_base
= best_lsn
;
1744 memmove(Add2Ptr(page_bufs
, tails
* log
->page_size
), best_page
,
1749 if (best_page_pos
!= bppc
) {
1751 page_pos
= best_page_pos
;
1756 page_pos
= page_cnt
= 1;
1764 kfree(first_tail_prev
);
1765 first_tail_prev
= first_tail
;
1766 final_off_prev
= first_file_off
;
1769 kfree(second_tail_prev
);
1770 second_tail_prev
= second_tail
;
1771 second_off_prev
= second_file_off
;
1774 final_off
+= log
->page_size
;
1775 second_off
+= log
->page_size
;
1780 first_tail
= first_tail_prev
;
1781 final_off
= final_off_prev
;
1783 second_tail
= second_tail_prev
;
1784 second_off
= second_off_prev
;
1786 page_cnt
= page_pos
= 1;
1788 curpage_off
= seq_base
== log
->seq_num
? min(log
->next_page
, page_off
) :
1792 curpage_off
== log
->first_page
&&
1793 !(log
->l_flags
& (NTFSLOG_NO_LAST_LSN
| NTFSLOG_REUSE_TAIL
));
1795 expected_seq
= wrapped_file
? (log
->seq_num
+ 1) : log
->seq_num
;
1797 nextpage_off
= curpage_off
;
1801 /* Read the next log page. */
1802 err
= read_log_page(log
, curpage_off
, &page
, &usa_error
);
1804 /* Compute the next log page offset the file. */
1805 nextpage_off
= next_page_off(log
, curpage_off
);
1806 wrapped
= nextpage_off
== log
->first_page
;
1809 struct RECORD_PAGE_HDR
*cur_page
=
1810 Add2Ptr(page_bufs
, curpage_off
- page_off
);
1812 if (curpage_off
== saved_off
) {
1813 tail_page
= cur_page
;
1817 if (page_off
> curpage_off
|| curpage_off
>= saved_off
)
1823 if (!err
&& !usa_error
&&
1824 page
->rhdr
.sign
== NTFS_RCRD_SIGNATURE
&&
1825 cur_page
->rhdr
.lsn
== page
->rhdr
.lsn
&&
1826 cur_page
->record_hdr
.next_record_off
==
1827 page
->record_hdr
.next_record_off
&&
1828 ((page_pos
== page_cnt
&&
1829 le16_to_cpu(page
->page_pos
) == 1) ||
1830 (page_pos
!= page_cnt
&&
1831 le16_to_cpu(page
->page_pos
) == page_pos
+ 1 &&
1832 le16_to_cpu(page
->page_count
) == page_cnt
))) {
1837 page_off1
= page_off
;
1841 lsn_cur
= le64_to_cpu(cur_page
->rhdr
.lsn
);
1844 le64_to_cpu(cur_page
->record_hdr
.last_end_lsn
) &&
1845 ((lsn_cur
>> log
->file_data_bits
) +
1847 (lsn_to_vbo(log
, lsn_cur
) & ~log
->page_mask
)) ?
1849 0)) != expected_seq
) {
1853 if (!is_log_record_end(cur_page
)) {
1855 last_ok_lsn
= lsn_cur
;
1859 log
->seq_num
= expected_seq
;
1860 log
->l_flags
&= ~NTFSLOG_NO_LAST_LSN
;
1861 log
->last_lsn
= le64_to_cpu(cur_page
->record_hdr
.last_end_lsn
);
1862 log
->ra
->current_lsn
= cur_page
->record_hdr
.last_end_lsn
;
1864 if (log
->record_header_len
<=
1866 le16_to_cpu(cur_page
->record_hdr
.next_record_off
)) {
1867 log
->l_flags
|= NTFSLOG_REUSE_TAIL
;
1868 log
->next_page
= curpage_off
;
1870 log
->l_flags
&= ~NTFSLOG_REUSE_TAIL
;
1871 log
->next_page
= nextpage_off
;
1875 log
->l_flags
|= NTFSLOG_WRAPPED
;
1877 last_ok_lsn
= le64_to_cpu(cur_page
->record_hdr
.last_end_lsn
);
1882 * If we are at the expected first page of a transfer check to see
1883 * if either tail copy is at this offset.
1884 * If this page is the last page of a transfer, check if we wrote
1885 * a subsequent tail copy.
1887 if (page_cnt
== page_pos
|| page_cnt
== page_pos
+ 1) {
1889 * Check if the offset matches either the first or second
1890 * tail copy. It is possible it will match both.
1892 if (curpage_off
== final_off
)
1893 tail_page
= first_tail
;
1896 * If we already matched on the first page then
1897 * check the ending lsn's.
1899 if (curpage_off
== second_off
) {
1902 le64_to_cpu(second_tail
->record_hdr
.last_end_lsn
) >
1903 le64_to_cpu(first_tail
->record_hdr
1905 tail_page
= second_tail
;
1912 /* We have a candidate for a tail copy. */
1913 lsn_cur
= le64_to_cpu(tail_page
->record_hdr
.last_end_lsn
);
1915 if (last_ok_lsn
< lsn_cur
) {
1917 * If the sequence number is not expected,
1918 * then don't use the tail copy.
1920 if (expected_seq
!= (lsn_cur
>> log
->file_data_bits
))
1922 } else if (last_ok_lsn
> lsn_cur
) {
1924 * If the last lsn is greater than the one on
1925 * this page then forget this tail.
1932 *If we have an error on the current page,
1933 * we will break of this loop.
1935 if (err
|| usa_error
)
1939 * Done if the last lsn on this page doesn't match the previous known
1940 * last lsn or the sequence number is not expected.
1942 lsn_cur
= le64_to_cpu(page
->rhdr
.lsn
);
1943 if (last_ok_lsn
!= lsn_cur
&&
1944 expected_seq
!= (lsn_cur
>> log
->file_data_bits
)) {
1949 * Check that the page position and page count values are correct.
1950 * If this is the first page of a transfer the position must be 1
1951 * and the count will be unknown.
1953 if (page_cnt
== page_pos
) {
1954 if (page
->page_pos
!= cpu_to_le16(1) &&
1955 (!reuse_page
|| page
->page_pos
!= page
->page_count
)) {
1957 * If the current page is the first page we are
1958 * looking at and we are reusing this page then
1959 * it can be either the first or last page of a
1960 * transfer. Otherwise it can only be the first.
1964 } else if (le16_to_cpu(page
->page_count
) != page_cnt
||
1965 le16_to_cpu(page
->page_pos
) != page_pos
+ 1) {
1967 * The page position better be 1 more than the last page
1968 * position and the page count better match.
1974 * We have a valid page the file and may have a valid page
1975 * the tail copy area.
1976 * If the tail page was written after the page the file then
1977 * break of the loop.
1980 le64_to_cpu(tail_page
->record_hdr
.last_end_lsn
) > lsn_cur
) {
1981 /* Remember if we will replace the page. */
1982 replace_page
= true;
1988 if (is_log_record_end(page
)) {
1990 * Since we have read this page we know the sequence number
1991 * is the same as our expected value.
1993 log
->seq_num
= expected_seq
;
1994 log
->last_lsn
= le64_to_cpu(page
->record_hdr
.last_end_lsn
);
1995 log
->ra
->current_lsn
= page
->record_hdr
.last_end_lsn
;
1996 log
->l_flags
&= ~NTFSLOG_NO_LAST_LSN
;
1999 * If there is room on this page for another header then
2000 * remember we want to reuse the page.
2002 if (log
->record_header_len
<=
2004 le16_to_cpu(page
->record_hdr
.next_record_off
)) {
2005 log
->l_flags
|= NTFSLOG_REUSE_TAIL
;
2006 log
->next_page
= curpage_off
;
2008 log
->l_flags
&= ~NTFSLOG_REUSE_TAIL
;
2009 log
->next_page
= nextpage_off
;
2012 /* Remember if we wrapped the log file. */
2014 log
->l_flags
|= NTFSLOG_WRAPPED
;
2018 * Remember the last page count and position.
2019 * Also remember the last known lsn.
2021 page_cnt
= le16_to_cpu(page
->page_count
);
2022 page_pos
= le16_to_cpu(page
->page_pos
);
2023 last_ok_lsn
= le64_to_cpu(page
->rhdr
.lsn
);
2032 curpage_off
= nextpage_off
;
2040 log
->seq_num
= expected_seq
;
2041 log
->last_lsn
= le64_to_cpu(tail_page
->record_hdr
.last_end_lsn
);
2042 log
->ra
->current_lsn
= tail_page
->record_hdr
.last_end_lsn
;
2043 log
->l_flags
&= ~NTFSLOG_NO_LAST_LSN
;
2045 if (log
->page_size
-
2047 tail_page
->record_hdr
.next_record_off
) >=
2048 log
->record_header_len
) {
2049 log
->l_flags
|= NTFSLOG_REUSE_TAIL
;
2050 log
->next_page
= curpage_off
;
2052 log
->l_flags
&= ~NTFSLOG_REUSE_TAIL
;
2053 log
->next_page
= nextpage_off
;
2057 log
->l_flags
|= NTFSLOG_WRAPPED
;
2060 /* Remember that the partial IO will start at the next page. */
2061 second_off
= nextpage_off
;
2064 * If the next page is the first page of the file then update
2065 * the sequence number for log records which begon the next page.
2071 * If we have a tail copy or are performing single page I/O we can
2072 * immediately look at the next page.
2074 if (replace_page
|| (log
->ra
->flags
& RESTART_SINGLE_PAGE_IO
)) {
2080 if (page_pos
!= page_cnt
)
2083 * If the next page causes us to wrap to the beginning of the log
2084 * file then we know which page to check next.
2098 /* Walk through the file, reading log pages. */
2099 err
= read_log_page(log
, nextpage_off
, &tst_page
, &usa_error
);
2102 * If we get a USA error then assume that we correctly found
2103 * the end of the original transfer.
2109 * If we were able to read the page, we examine it to see if it
2110 * is the same or different Io block.
2113 goto next_test_page_1
;
2115 if (le16_to_cpu(tst_page
->page_pos
) == cur_pos
&&
2116 check_subseq_log_page(log
, tst_page
, nextpage_off
, expected_seq
)) {
2117 page_cnt
= le16_to_cpu(tst_page
->page_count
) + 1;
2118 page_pos
= le16_to_cpu(tst_page
->page_pos
);
2126 nextpage_off
= next_page_off(log
, curpage_off
);
2127 wrapped
= nextpage_off
== log
->first_page
;
2138 goto next_test_page
;
2141 /* Skip over the remaining pages this transfer. */
2142 remain_pages
= page_cnt
- page_pos
- 1;
2143 part_io_count
+= remain_pages
;
2145 while (remain_pages
--) {
2146 nextpage_off
= next_page_off(log
, curpage_off
);
2147 wrapped
= nextpage_off
== log
->first_page
;
2153 /* Call our routine to check this log page. */
2157 err
= read_log_page(log
, nextpage_off
, &tst_page
, &usa_error
);
2158 if (!err
&& !usa_error
&&
2159 check_subseq_log_page(log
, tst_page
, nextpage_off
, expected_seq
)) {
2166 /* We have a valid file. */
2167 if (page_off1
|| tail_page
) {
2168 struct RECORD_PAGE_HDR
*tmp_page
;
2170 if (sb_rdonly(log
->ni
->mi
.sbi
->sb
)) {
2176 tmp_page
= Add2Ptr(page_bufs
, page_off1
- page_off
);
2177 tails
-= (page_off1
- page_off
) / log
->page_size
;
2181 tmp_page
= tail_page
;
2186 u64 off
= hdr_file_off(log
, tmp_page
);
2189 page
= kmalloc(log
->page_size
, GFP_NOFS
);
2197 * Correct page and copy the data from this page
2198 * into it and flush it to disk.
2200 memcpy(page
, tmp_page
, log
->page_size
);
2202 /* Fill last flushed lsn value flush the page. */
2203 if (log
->major_ver
< 2)
2204 page
->rhdr
.lsn
= page
->record_hdr
.last_end_lsn
;
2208 page
->page_pos
= page
->page_count
= cpu_to_le16(1);
2210 ntfs_fix_pre_write(&page
->rhdr
, log
->page_size
);
2212 err
= ntfs_sb_write_run(log
->ni
->mi
.sbi
,
2213 &log
->ni
->file
.run
, off
, page
,
2219 if (part_io_count
&& second_off
== off
) {
2220 second_off
+= log
->page_size
;
2224 tmp_page
= Add2Ptr(tmp_page
, log
->page_size
);
2228 if (part_io_count
) {
2229 if (sb_rdonly(log
->ni
->mi
.sbi
->sb
)) {
2246 * read_log_rec_buf - Copy a log record from the file to a buffer.
2248 * The log record may span several log pages and may even wrap the file.
2250 static int read_log_rec_buf(struct ntfs_log
*log
,
2251 const struct LFS_RECORD_HDR
*rh
, void *buffer
)
2254 struct RECORD_PAGE_HDR
*ph
= NULL
;
2255 u64 lsn
= le64_to_cpu(rh
->this_lsn
);
2256 u32 vbo
= lsn_to_vbo(log
, lsn
) & ~log
->page_mask
;
2257 u32 off
= lsn_to_page_off(log
, lsn
) + log
->record_header_len
;
2258 u32 data_len
= le32_to_cpu(rh
->client_data_len
);
2261 * While there are more bytes to transfer,
2262 * we continue to attempt to perform the read.
2266 u32 tail
= log
->page_size
- off
;
2268 if (tail
>= data_len
)
2273 err
= read_log_page(log
, vbo
, &ph
, &usa_error
);
2278 * The last lsn on this page better be greater or equal
2279 * to the lsn we are copying.
2281 if (lsn
> le64_to_cpu(ph
->rhdr
.lsn
)) {
2286 memcpy(buffer
, Add2Ptr(ph
, off
), tail
);
2288 /* If there are no more bytes to transfer, we exit the loop. */
2290 if (!is_log_record_end(ph
) ||
2291 lsn
> le64_to_cpu(ph
->record_hdr
.last_end_lsn
)) {
2298 if (ph
->rhdr
.lsn
== ph
->record_hdr
.last_end_lsn
||
2299 lsn
> le64_to_cpu(ph
->rhdr
.lsn
)) {
2304 vbo
= next_page_off(log
, vbo
);
2305 off
= log
->data_off
;
2308 * Adjust our pointer the user's buffer to transfer
2309 * the next block to.
2311 buffer
= Add2Ptr(buffer
, tail
);
2319 static int read_rst_area(struct ntfs_log
*log
, struct NTFS_RESTART
**rst_
,
2323 struct LFS_RECORD_HDR
*rh
= NULL
;
2324 const struct CLIENT_REC
*cr
=
2325 Add2Ptr(log
->ra
, le16_to_cpu(log
->ra
->client_off
));
2326 u64 lsnr
, lsnc
= le64_to_cpu(cr
->restart_lsn
);
2328 struct NTFS_RESTART
*rst
;
2333 /* If the client doesn't have a restart area, go ahead and exit now. */
2337 err
= read_log_page(log
, lsn_to_vbo(log
, lsnc
),
2338 (struct RECORD_PAGE_HDR
**)&rh
, NULL
);
2343 lsnr
= le64_to_cpu(rh
->this_lsn
);
2346 /* If the lsn values don't match, then the disk is corrupt. */
2352 len
= le32_to_cpu(rh
->client_data_len
);
2359 if (len
< sizeof(struct NTFS_RESTART
)) {
2364 rst
= kmalloc(len
, GFP_NOFS
);
2370 /* Copy the data into the 'rst' buffer. */
2371 err
= read_log_rec_buf(log
, rh
, rst
);
2385 static int find_log_rec(struct ntfs_log
*log
, u64 lsn
, struct lcb
*lcb
)
2388 struct LFS_RECORD_HDR
*rh
= lcb
->lrh
;
2391 /* Read the record header for this lsn. */
2393 err
= read_log_page(log
, lsn_to_vbo(log
, lsn
),
2394 (struct RECORD_PAGE_HDR
**)&rh
, NULL
);
2402 * If the lsn the log record doesn't match the desired
2403 * lsn then the disk is corrupt.
2405 if (lsn
!= le64_to_cpu(rh
->this_lsn
))
2408 len
= le32_to_cpu(rh
->client_data_len
);
2411 * Check that the length field isn't greater than the total
2412 * available space the log file.
2414 rec_len
= len
+ log
->record_header_len
;
2415 if (rec_len
>= log
->total_avail
)
2419 * If the entire log record is on this log page,
2420 * put a pointer to the log record the context block.
2422 if (rh
->flags
& LOG_RECORD_MULTI_PAGE
) {
2423 void *lr
= kmalloc(len
, GFP_NOFS
);
2431 /* Copy the data into the buffer returned. */
2432 err
= read_log_rec_buf(log
, rh
, lr
);
2436 /* If beyond the end of the current page -> an error. */
2437 u32 page_off
= lsn_to_page_off(log
, lsn
);
2439 if (page_off
+ len
+ log
->record_header_len
> log
->page_size
)
2442 lcb
->log_rec
= Add2Ptr(rh
, sizeof(struct LFS_RECORD_HDR
));
2450 * read_log_rec_lcb - Init the query operation.
2452 static int read_log_rec_lcb(struct ntfs_log
*log
, u64 lsn
, u32 ctx_mode
,
2456 const struct CLIENT_REC
*cr
;
2460 case lcb_ctx_undo_next
:
2468 /* Check that the given lsn is the legal range for this client. */
2469 cr
= Add2Ptr(log
->ra
, le16_to_cpu(log
->ra
->client_off
));
2471 if (!verify_client_lsn(log
, cr
, lsn
))
2474 lcb
= kzalloc(sizeof(struct lcb
), GFP_NOFS
);
2477 lcb
->client
= log
->client_id
;
2478 lcb
->ctx_mode
= ctx_mode
;
2480 /* Find the log record indicated by the given lsn. */
2481 err
= find_log_rec(log
, lsn
, lcb
);
2495 * find_client_next_lsn
2497 * Attempt to find the next lsn to return to a client based on the context mode.
2499 static int find_client_next_lsn(struct ntfs_log
*log
, struct lcb
*lcb
, u64
*lsn
)
2503 struct LFS_RECORD_HDR
*hdr
;
2508 if (lcb_ctx_next
!= lcb
->ctx_mode
)
2509 goto check_undo_next
;
2511 /* Loop as long as another lsn can be found. */
2515 err
= next_log_lsn(log
, hdr
, ¤t_lsn
);
2522 if (hdr
!= lcb
->lrh
)
2526 err
= read_log_page(log
, lsn_to_vbo(log
, current_lsn
),
2527 (struct RECORD_PAGE_HDR
**)&hdr
, NULL
);
2531 if (memcmp(&hdr
->client
, &lcb
->client
,
2532 sizeof(struct CLIENT_ID
))) {
2534 } else if (LfsClientRecord
== hdr
->record_type
) {
2543 if (hdr
!= lcb
->lrh
)
2548 if (lcb_ctx_undo_next
== lcb
->ctx_mode
)
2549 next_lsn
= le64_to_cpu(hdr
->client_undo_next_lsn
);
2550 else if (lcb_ctx_prev
== lcb
->ctx_mode
)
2551 next_lsn
= le64_to_cpu(hdr
->client_prev_lsn
);
2558 if (!verify_client_lsn(
2559 log
, Add2Ptr(log
->ra
, le16_to_cpu(log
->ra
->client_off
)),
2564 err
= read_log_page(log
, lsn_to_vbo(log
, next_lsn
),
2565 (struct RECORD_PAGE_HDR
**)&hdr
, NULL
);
2576 static int read_next_log_rec(struct ntfs_log
*log
, struct lcb
*lcb
, u64
*lsn
)
2580 err
= find_client_next_lsn(log
, lcb
, lsn
);
2588 kfree(lcb
->log_rec
);
2590 lcb
->log_rec
= NULL
;
2595 return find_log_rec(log
, *lsn
, lcb
);
bool check_index_header(const struct INDEX_HDR *hdr, size_t bytes)

	u32 min_de, de_off, used, total;
	const struct NTFS_DE *e;

	if (hdr_has_subnode(hdr)) {
		min_de = sizeof(struct NTFS_DE) + sizeof(u64);
		mask = NTFS_IE_HAS_SUBNODES;
	} else {
		min_de = sizeof(struct NTFS_DE);

	de_off = le32_to_cpu(hdr->de_off);
	used = le32_to_cpu(hdr->used);
	total = le32_to_cpu(hdr->total);

	if (de_off > bytes - min_de || used > bytes || total > bytes ||
	    de_off + min_de > used || used > total) {

	e = Add2Ptr(hdr, de_off);

		u16 esize = le16_to_cpu(e->size);
		struct NTFS_DE *next = Add2Ptr(e, esize);

		if (esize < min_de || PtrOffset(hdr, next) > used ||
		    (e->flags & NTFS_IE_HAS_SUBNODES) != mask) {
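
/*
 * Note (added): the header is accepted only if its offsets nest properly in
 * the buffer, i.e. de_off + min_de <= used <= total <= bytes, and every
 * entry's NTFS_IE_HAS_SUBNODES flag matches the header's sub-node state.
 */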
static inline bool check_index_buffer(const struct INDEX_BUFFER *ib, u32 bytes)

	const struct NTFS_RECORD_HEADER *r = &ib->rhdr;

	if (r->sign != NTFS_INDX_SIGNATURE)

	fo = (SECTOR_SIZE - ((bytes >> SECTOR_SHIFT) + 1) * sizeof(short));

	if (le16_to_cpu(r->fix_off) > fo)

	if ((le16_to_cpu(r->fix_num) - 1) * SECTOR_SIZE != bytes)

	return check_index_header(&ib->ihdr,
				  bytes - offsetof(struct INDEX_BUFFER, ihdr));
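
/*
 * Illustrative sketch (not part of the original driver): an INDX buffer of
 * 'bytes' bytes carries one update-sequence fixup word per 512-byte sector
 * plus the sequence number itself, which is why check_index_buffer() above
 * requires (fix_num - 1) * SECTOR_SIZE == bytes.
 */
static inline u16 example_expected_fix_num(u32 bytes)
{
	/* One word per sector covered, plus the leading sequence number. */
	return (u16)((bytes >> SECTOR_SHIFT) + 1);
}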
static inline bool check_index_root(const struct ATTRIB *attr,
				    struct ntfs_sb_info *sbi)

	const struct INDEX_ROOT *root = resident_data(attr);
	u8 index_bits = le32_to_cpu(root->index_block_size) >=

	u8 block_clst = root->index_block_clst;

	if (le32_to_cpu(attr->res.data_size) < sizeof(struct INDEX_ROOT) ||
	    (root->type != ATTR_NAME && root->type != ATTR_ZERO) ||
	    (root->type == ATTR_NAME &&
	     root->rule != NTFS_COLLATION_TYPE_FILENAME) ||
	    (le32_to_cpu(root->index_block_size) !=
	     (block_clst << index_bits)) ||
	    (block_clst != 1 && block_clst != 2 && block_clst != 4 &&
	     block_clst != 8 && block_clst != 0x10 && block_clst != 0x20 &&
	     block_clst != 0x40 && block_clst != 0x80)) {

	ret = check_index_header(&root->ihdr,
				 le32_to_cpu(attr->res.data_size) -
					 offsetof(struct INDEX_ROOT, ihdr));
static inline bool check_attr(const struct MFT_REC *rec,
			      const struct ATTRIB *attr,
			      struct ntfs_sb_info *sbi)

	u32 asize = le32_to_cpu(attr->size);

	u64 dsize, svcn, evcn;

	/* Check the fixed part of the attribute record header. */
	if (asize >= sbi->record_size ||
	    asize + PtrOffset(rec, attr) >= sbi->record_size ||
	    le16_to_cpu(attr->name_off) + attr->name_len * sizeof(short) >

	/* Check the attribute fields. */
	switch (attr->non_res) {
		rsize = le32_to_cpu(attr->res.data_size);
		if (rsize >= asize ||
		    le16_to_cpu(attr->res.data_off) + rsize > asize) {

		dsize = le64_to_cpu(attr->nres.data_size);
		svcn = le64_to_cpu(attr->nres.svcn);
		evcn = le64_to_cpu(attr->nres.evcn);
		run_off = le16_to_cpu(attr->nres.run_off);

		if (svcn > evcn + 1 || run_off >= asize ||
		    le64_to_cpu(attr->nres.valid_size) > dsize ||
		    dsize > le64_to_cpu(attr->nres.alloc_size)) {

		if (run_off > asize)

		if (run_unpack(NULL, sbi, 0, svcn, evcn, svcn,
			       Add2Ptr(attr, run_off), asize - run_off) < 0) {

	switch (attr->type) {
		if (fname_full_size(Add2Ptr(
			    attr, le16_to_cpu(attr->res.data_off))) > asize) {

		return check_index_root(attr, sbi);

		if (rsize < sizeof(struct ATTR_STD_INFO5) &&
		    rsize != sizeof(struct ATTR_STD_INFO)) {

	case ATTR_PROPERTYSET:
	case ATTR_LOGGED_UTILITY_STREAM:
static inline bool check_file_record(const struct MFT_REC *rec,
				     const struct MFT_REC *rec2,
				     struct ntfs_sb_info *sbi)

	const struct ATTRIB *attr;
	u16 fo = le16_to_cpu(rec->rhdr.fix_off);
	u16 fn = le16_to_cpu(rec->rhdr.fix_num);
	u16 ao = le16_to_cpu(rec->attr_off);
	u32 rs = sbi->record_size;

	/* Check the file record header for consistency. */
	if (rec->rhdr.sign != NTFS_FILE_SIGNATURE ||
	    fo > (SECTOR_SIZE - ((rs >> SECTOR_SHIFT) + 1) * sizeof(short)) ||
	    (fn - 1) * SECTOR_SIZE != rs || ao < MFTRECORD_FIXUP_OFFSET_1 ||
	    ao > sbi->record_size - SIZEOF_RESIDENT || !is_rec_inuse(rec) ||
	    le32_to_cpu(rec->total) != rs) {

	/* Loop to check all of the attributes. */
	for (attr = Add2Ptr(rec, ao); attr->type != ATTR_END;
	     attr = Add2Ptr(attr, le32_to_cpu(attr->size))) {
		if (check_attr(rec, attr, sbi))
static inline int check_lsn(const struct NTFS_RECORD_HEADER *hdr,

	lsn = le64_to_cpu(hdr->lsn);

	if (hdr->sign == NTFS_HOLE_SIGNATURE)
static inline bool check_if_attr(const struct MFT_REC *rec,
				 const struct LOG_REC_HDR *lrh)

	u16 ro = le16_to_cpu(lrh->record_off);
	u16 o = le16_to_cpu(rec->attr_off);
	const struct ATTRIB *attr = Add2Ptr(rec, o);

		if (attr->type == ATTR_END)

		asize = le32_to_cpu(attr->size);

		attr = Add2Ptr(attr, asize);
static inline bool check_if_index_root(const struct MFT_REC *rec,
				       const struct LOG_REC_HDR *lrh)

	u16 ro = le16_to_cpu(lrh->record_off);
	u16 o = le16_to_cpu(rec->attr_off);
	const struct ATTRIB *attr = Add2Ptr(rec, o);

		if (attr->type == ATTR_END)

		asize = le32_to_cpu(attr->size);

		attr = Add2Ptr(attr, asize);

	return o == ro && attr->type == ATTR_ROOT;
static inline bool check_if_root_index(const struct ATTRIB *attr,
				       const struct INDEX_HDR *hdr,
				       const struct LOG_REC_HDR *lrh)

	u16 ao = le16_to_cpu(lrh->attr_off);
	u32 de_off = le32_to_cpu(hdr->de_off);
	u32 o = PtrOffset(attr, hdr) + de_off;
	const struct NTFS_DE *e = Add2Ptr(hdr, de_off);
	u32 asize = le32_to_cpu(attr->size);

		esize = le16_to_cpu(e->size);

		e = Add2Ptr(e, esize);
static inline bool check_if_alloc_index(const struct INDEX_HDR *hdr,

	u32 de_off = le32_to_cpu(hdr->de_off);
	u32 o = offsetof(struct INDEX_BUFFER, ihdr) + de_off;
	const struct NTFS_DE *e = Add2Ptr(hdr, de_off);
	u32 used = le32_to_cpu(hdr->used);

	while (o < attr_off) {

		esize = le16_to_cpu(e->size);

		e = Add2Ptr(e, esize);

	return o == attr_off;
static inline void change_attr_size(struct MFT_REC *rec, struct ATTRIB *attr,

	u32 asize = le32_to_cpu(attr->size);
	int dsize = nsize - asize;
	u8 *next = Add2Ptr(attr, asize);
	u32 used = le32_to_cpu(rec->used);

	memmove(Add2Ptr(attr, nsize), next, used - PtrOffset(rec, next));

	rec->used = cpu_to_le32(used + dsize);
	attr->size = cpu_to_le32(nsize);
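
/*
 * Note (added): change_attr_size() resizes 'attr' in place by sliding the
 * tail of the MFT record (everything after the attribute) to the new end and
 * then fixing up rec->used and attr->size; callers are expected to have
 * checked that the record has room for the new size.
 */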
	struct ATTRIB *attr;
	struct runs_tree *run1;
	struct runs_tree run0;
	struct ntfs_inode *ni;
/*
 * Return: 0 if 'attr' has the same type and name.
 */
static inline int cmp_type_and_name(const struct ATTRIB *a1,
				    const struct ATTRIB *a2)

	return a1->type != a2->type || a1->name_len != a2->name_len ||
	       (a1->name_len && memcmp(attr_name(a1), attr_name(a2),
				       a1->name_len * sizeof(short)));
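
/*
 * Note (added): like memcmp(), cmp_type_and_name() returns 0 on a match
 * (same type, same name length and same name) and non-zero otherwise, so
 * callers such as find_loaded_attr() test it with '!'.
 */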
static struct OpenAttr *find_loaded_attr(struct ntfs_log *log,
					 const struct ATTRIB *attr, CLST rno)

	struct OPEN_ATTR_ENRTY *oe = NULL;

	while ((oe = enum_rstbl(log->open_attr_tbl, oe))) {
		struct OpenAttr *op_attr;

		if (ino_get(&oe->ref) != rno)

		op_attr = (struct OpenAttr *)oe->ptr;
		if (!cmp_type_and_name(op_attr->attr, attr))
static struct ATTRIB *attr_create_nonres_log(struct ntfs_sb_info *sbi,
					     enum ATTR_TYPE type, u64 size,
					     const u16 *name, size_t name_len,

	struct ATTRIB *attr;
	u32 name_size = ALIGN(name_len * sizeof(short), 8);
	bool is_ext = flags & (ATTR_FLAG_COMPRESSED | ATTR_FLAG_SPARSED);
	u32 asize = name_size +
		    (is_ext ? SIZEOF_NONRESIDENT_EX : SIZEOF_NONRESIDENT);

	attr = kzalloc(asize, GFP_NOFS);

	attr->size = cpu_to_le32(asize);
	attr->flags = flags;

	attr->name_len = name_len;

	attr->nres.evcn = cpu_to_le64((u64)bytes_to_cluster(sbi, size) - 1);
	attr->nres.alloc_size = cpu_to_le64(ntfs_up_cluster(sbi, size));
	attr->nres.data_size = cpu_to_le64(size);
	attr->nres.valid_size = attr->nres.data_size;

		attr->name_off = SIZEOF_NONRESIDENT_EX_LE;
		if (is_attr_compressed(attr))
			attr->nres.c_unit = NTFS_LZNT_CUNIT;

		attr->nres.run_off =
			cpu_to_le16(SIZEOF_NONRESIDENT_EX + name_size);
		memcpy(Add2Ptr(attr, SIZEOF_NONRESIDENT_EX), name,
		       name_len * sizeof(short));

		attr->name_off = SIZEOF_NONRESIDENT_LE;
		attr->nres.run_off =
			cpu_to_le16(SIZEOF_NONRESIDENT + name_size);
		memcpy(Add2Ptr(attr, SIZEOF_NONRESIDENT), name,
		       name_len * sizeof(short));
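
/*
 * Note (added): the attribute built here is laid out as a non-resident
 * header (SIZEOF_NONRESIDENT, or SIZEOF_NONRESIDENT_EX for compressed/sparse
 * attributes), followed by the 8-byte aligned name, with nres.run_off
 * pointing just past the name where the mapping pairs would start.
 */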
/*
 * do_action - Common routine for the Redo and Undo Passes.
 * @rlsn: If it is NULL then undo.
 */
static int do_action(struct ntfs_log *log, struct OPEN_ATTR_ENRTY *oe,
		     const struct LOG_REC_HDR *lrh, u32 op, void *data,
		     u32 dlen, u32 rec_len, const u64 *rlsn)

	struct ntfs_sb_info *sbi = log->ni->mi.sbi;
	struct inode *inode = NULL, *inode_parent;
	struct mft_inode *mi = NULL, *mi2_child = NULL;
	CLST rno = 0, rno_base = 0;
	struct INDEX_BUFFER *ib = NULL;
	struct MFT_REC *rec = NULL;
	struct ATTRIB *attr = NULL, *attr2;
	struct INDEX_HDR *hdr;
	struct INDEX_ROOT *root;
	struct NTFS_DE *e, *e1, *e2;
	struct NEW_ATTRIBUTE_SIZES *new_sz;
	struct ATTR_FILE_NAME *fname;
	struct OpenAttr *oa, *oa2;
	u32 nsize, t32, asize, used, esize, off, bits;
	u32 record_size = sbi->record_size;
	u16 roff = le16_to_cpu(lrh->record_off);
	u16 aoff = le16_to_cpu(lrh->attr_off);
	u64 cbo = (u64)le16_to_cpu(lrh->cluster_off) << SECTOR_SHIFT;
	u64 tvo = le64_to_cpu(lrh->target_vcn) << sbi->cluster_bits;
	u64 vbo = cbo + tvo;
	void *buffer_le = NULL;
	bool a_dirty = false;

	/* Big switch to prepare. */
	/* ============================================================
	 * Process MFT records, as described by the current log record.
	 * ============================================================
	 */
	case InitializeFileRecordSegment:
	case DeallocateFileRecordSegment:
	case WriteEndOfFileRecordSegment:
	case CreateAttribute:
	case DeleteAttribute:
	case UpdateResidentValue:
	case UpdateMappingPairs:
	case SetNewAttributeSizes:
	case AddIndexEntryRoot:
	case DeleteIndexEntryRoot:
	case SetIndexEntryVcnRoot:
	case UpdateFileNameRoot:
	case UpdateRecordDataRoot:
	case ZeroEndOfFileRecord:
		rno = vbo >> sbi->record_bits;
		inode = ilookup(sbi->sb, rno);
			mi = &ntfs_i(inode)->mi;
		} else if (op == InitializeFileRecordSegment) {
			mi = kzalloc(sizeof(struct mft_inode), GFP_NOFS);
			err = mi_format_new(mi, sbi, rno, 0, false);
			/* Read from disk. */
			err = mi_get(sbi, rno, &mi);

		if (op == DeallocateFileRecordSegment)
			goto skip_load_parent;

		if (InitializeFileRecordSegment != op) {
			if (rec->rhdr.sign == NTFS_BAAD_SIGNATURE)
			if (!check_lsn(&rec->rhdr, rlsn))
			if (!check_file_record(rec, NULL, sbi))
			attr = Add2Ptr(rec, roff);

		if (is_rec_base(rec) || InitializeFileRecordSegment == op) {
			goto skip_load_parent;

		rno_base = ino_get(&rec->parent_ref);
		inode_parent = ntfs_iget5(sbi->sb, &rec->parent_ref, NULL);
		if (IS_ERR(inode_parent))
			goto skip_load_parent;

		if (is_bad_inode(inode_parent)) {
			goto skip_load_parent;

		if (ni_load_mi_ex(ntfs_i(inode_parent), rno, &mi2_child)) {

		if (mi2_child->mrec != mi->mrec)
			memcpy(mi2_child->mrec, mi->mrec,

		inode = inode_parent;
		rec = mi2_child->mrec;
		attr = Add2Ptr(rec, roff);

		inode_parent = NULL;
	/*
	 * Process attributes, as described by the current log record.
	 */
	case UpdateNonresidentValue:
	case AddIndexEntryAllocation:
	case DeleteIndexEntryAllocation:
	case WriteEndOfIndexBuffer:
	case SetIndexEntryVcnAllocation:
	case UpdateFileNameAllocation:
	case SetBitsInNonresidentBitMap:
	case ClearBitsInNonresidentBitMap:
	case UpdateRecordDataAllocation:

		bytes = UpdateNonresidentValue == op ? dlen : 0;
		lco = (u64)le16_to_cpu(lrh->lcns_follow) << sbi->cluster_bits;

		if (attr->type == ATTR_ALLOC) {
			t32 = le32_to_cpu(oe->bytes_per_index);

		if (attr->type == ATTR_ALLOC)
			bytes = (bytes + 511) & ~511; // align

		buffer_le = kmalloc(bytes, GFP_NOFS);

		err = ntfs_read_run_nb(sbi, oa->run1, vbo, buffer_le, bytes,

		if (attr->type == ATTR_ALLOC && *(int *)buffer_le)
			ntfs_fix_post_read(buffer_le, bytes, false);
	/* Big switch to do operation. */
	case InitializeFileRecordSegment:
		if (roff + dlen > record_size)

		memcpy(Add2Ptr(rec, roff), data, dlen);

	case DeallocateFileRecordSegment:
		clear_rec_inuse(rec);
		le16_add_cpu(&rec->seq, 1);

	case WriteEndOfFileRecordSegment:
		attr2 = (struct ATTRIB *)data;
		if (!check_if_attr(rec, lrh) || roff + dlen > record_size)

		memmove(attr, attr2, dlen);
		rec->used = cpu_to_le32(ALIGN(roff + dlen, 8));

	case CreateAttribute:
		attr2 = (struct ATTRIB *)data;
		asize = le32_to_cpu(attr2->size);
		used = le32_to_cpu(rec->used);

		if (!check_if_attr(rec, lrh) || dlen < SIZEOF_RESIDENT ||
		    !IS_ALIGNED(asize, 8) ||
		    Add2Ptr(attr2, asize) > Add2Ptr(lrh, rec_len) ||
		    dlen > record_size - used) {

		memmove(Add2Ptr(attr, asize), attr, used - roff);
		memcpy(attr, attr2, asize);

		rec->used = cpu_to_le32(used + asize);
		id = le16_to_cpu(rec->next_attr_id);
		id2 = le16_to_cpu(attr2->id);
			rec->next_attr_id = cpu_to_le16(id2 + 1);
		if (is_attr_indexed(attr))
			le16_add_cpu(&rec->hard_links, 1);

		oa2 = find_loaded_attr(log, attr, rno_base);
			void *p2 = kmemdup(attr, le32_to_cpu(attr->size),
				// run_close(oa2->run1);

	case DeleteAttribute:
		asize = le32_to_cpu(attr->size);
		used = le32_to_cpu(rec->used);

		if (!check_if_attr(rec, lrh))

		rec->used = cpu_to_le32(used - asize);
		if (is_attr_indexed(attr))
			le16_add_cpu(&rec->hard_links, -1);

		memmove(attr, Add2Ptr(attr, asize), used - asize - roff);
	case UpdateResidentValue:
		nsize = aoff + dlen;

		if (!check_if_attr(rec, lrh))

		asize = le32_to_cpu(attr->size);
		used = le32_to_cpu(rec->used);

		if (lrh->redo_len == lrh->undo_len) {

		if (nsize > asize && nsize - asize > record_size - used)

		nsize = ALIGN(nsize, 8);
		data_off = le16_to_cpu(attr->res.data_off);

		if (nsize < asize) {
			memmove(Add2Ptr(attr, aoff), data, dlen);
			data = NULL; // To skip below memmove().

		memmove(Add2Ptr(attr, nsize), Add2Ptr(attr, asize),
			used - le16_to_cpu(lrh->record_off) - asize);

		rec->used = cpu_to_le32(used + nsize - asize);
		attr->size = cpu_to_le32(nsize);
		attr->res.data_size = cpu_to_le32(aoff + dlen - data_off);

			memmove(Add2Ptr(attr, aoff), data, dlen);

		oa2 = find_loaded_attr(log, attr, rno_base);
			void *p2 = kmemdup(attr, le32_to_cpu(attr->size),
			// run_close(&oa2->run0);
			oa2->run1 = &oa2->run0;

	case UpdateMappingPairs:
		nsize = aoff + dlen;
		asize = le32_to_cpu(attr->size);
		used = le32_to_cpu(rec->used);

		if (!check_if_attr(rec, lrh) || !attr->non_res ||
		    aoff < le16_to_cpu(attr->nres.run_off) || aoff > asize ||
		    (nsize > asize && nsize - asize > record_size - used)) {

		nsize = ALIGN(nsize, 8);

		memmove(Add2Ptr(attr, nsize), Add2Ptr(attr, asize),
			used - le16_to_cpu(lrh->record_off) - asize);
		rec->used = cpu_to_le32(used + nsize - asize);
		attr->size = cpu_to_le32(nsize);
		memmove(Add2Ptr(attr, aoff), data, dlen);

		if (run_get_highest_vcn(le64_to_cpu(attr->nres.svcn),
					attr_run(attr), &t64)) {

		attr->nres.evcn = cpu_to_le64(t64);
		oa2 = find_loaded_attr(log, attr, rno_base);
		if (oa2 && oa2->attr->non_res)
			oa2->attr->nres.evcn = attr->nres.evcn;
	case SetNewAttributeSizes:

		if (!check_if_attr(rec, lrh) || !attr->non_res)

		attr->nres.alloc_size = new_sz->alloc_size;
		attr->nres.data_size = new_sz->data_size;
		attr->nres.valid_size = new_sz->valid_size;

		if (dlen >= sizeof(struct NEW_ATTRIBUTE_SIZES))
			attr->nres.total_size = new_sz->total_size;

		oa2 = find_loaded_attr(log, attr, rno_base);
			void *p2 = kmemdup(attr, le32_to_cpu(attr->size),

	case AddIndexEntryRoot:
		e = (struct NTFS_DE *)data;
		esize = le16_to_cpu(e->size);
		root = resident_data(attr);
		used = le32_to_cpu(hdr->used);

		if (!check_if_index_root(rec, lrh) ||
		    !check_if_root_index(attr, hdr, lrh) ||
		    Add2Ptr(data, esize) > Add2Ptr(lrh, rec_len) ||
		    esize > le32_to_cpu(rec->total) - le32_to_cpu(rec->used)) {

		e1 = Add2Ptr(attr, le16_to_cpu(lrh->attr_off));

		change_attr_size(rec, attr, le32_to_cpu(attr->size) + esize);

		memmove(Add2Ptr(e1, esize), e1,
			PtrOffset(e1, Add2Ptr(hdr, used)));
		memmove(e1, e, esize);

		le32_add_cpu(&attr->res.data_size, esize);
		hdr->used = cpu_to_le32(used + esize);
		le32_add_cpu(&hdr->total, esize);
	case DeleteIndexEntryRoot:
		root = resident_data(attr);
		used = le32_to_cpu(hdr->used);

		if (!check_if_index_root(rec, lrh) ||
		    !check_if_root_index(attr, hdr, lrh)) {

		e1 = Add2Ptr(attr, le16_to_cpu(lrh->attr_off));
		esize = le16_to_cpu(e1->size);
		e2 = Add2Ptr(e1, esize);

		memmove(e1, e2, PtrOffset(e2, Add2Ptr(hdr, used)));

		le32_sub_cpu(&attr->res.data_size, esize);
		hdr->used = cpu_to_le32(used - esize);
		le32_sub_cpu(&hdr->total, esize);

		change_attr_size(rec, attr, le32_to_cpu(attr->size) - esize);

	case SetIndexEntryVcnRoot:
		root = resident_data(attr);

		if (!check_if_index_root(rec, lrh) ||
		    !check_if_root_index(attr, hdr, lrh)) {

		e = Add2Ptr(attr, le16_to_cpu(lrh->attr_off));

		de_set_vbn_le(e, *(__le64 *)data);

	case UpdateFileNameRoot:
		root = resident_data(attr);

		if (!check_if_index_root(rec, lrh) ||
		    !check_if_root_index(attr, hdr, lrh)) {

		e = Add2Ptr(attr, le16_to_cpu(lrh->attr_off));
		fname = (struct ATTR_FILE_NAME *)(e + 1);
		memmove(&fname->dup, data, sizeof(fname->dup));

	case UpdateRecordDataRoot:
		root = resident_data(attr);

		if (!check_if_index_root(rec, lrh) ||
		    !check_if_root_index(attr, hdr, lrh)) {

		e = Add2Ptr(attr, le16_to_cpu(lrh->attr_off));

		memmove(Add2Ptr(e, le16_to_cpu(e->view.data_off)), data, dlen);

	case ZeroEndOfFileRecord:
		if (roff + dlen > record_size)

		memset(attr, 0, dlen);
	case UpdateNonresidentValue:
		if (lco < cbo + roff + dlen)

		memcpy(Add2Ptr(buffer_le, roff), data, dlen);

		if (attr->type == ATTR_ALLOC)
			ntfs_fix_pre_write(buffer_le, bytes);

	case AddIndexEntryAllocation:
		ib = Add2Ptr(buffer_le, roff);
		esize = le16_to_cpu(e->size);
		e1 = Add2Ptr(ib, aoff);

		if (is_baad(&ib->rhdr))
		if (!check_lsn(&ib->rhdr, rlsn))

		used = le32_to_cpu(hdr->used);

		if (!check_index_buffer(ib, bytes) ||
		    !check_if_alloc_index(hdr, aoff) ||
		    Add2Ptr(e, esize) > Add2Ptr(lrh, rec_len) ||
		    used + esize > le32_to_cpu(hdr->total)) {

		memmove(Add2Ptr(e1, esize), e1,
			PtrOffset(e1, Add2Ptr(hdr, used)));
		memcpy(e1, e, esize);

		hdr->used = cpu_to_le32(used + esize);

		ntfs_fix_pre_write(&ib->rhdr, bytes);

	case DeleteIndexEntryAllocation:
		ib = Add2Ptr(buffer_le, roff);
		e = Add2Ptr(ib, aoff);
		esize = le16_to_cpu(e->size);

		if (is_baad(&ib->rhdr))
		if (!check_lsn(&ib->rhdr, rlsn))

		if (!check_index_buffer(ib, bytes) ||
		    !check_if_alloc_index(hdr, aoff)) {

		e1 = Add2Ptr(e, esize);
		used = le32_to_cpu(hdr->used);

		memmove(e, e1, PtrOffset(e1, Add2Ptr(hdr, used)));

		hdr->used = cpu_to_le32(used - nsize);

		ntfs_fix_pre_write(&ib->rhdr, bytes);
	case WriteEndOfIndexBuffer:
		ib = Add2Ptr(buffer_le, roff);
		e = Add2Ptr(ib, aoff);

		if (is_baad(&ib->rhdr))
		if (!check_lsn(&ib->rhdr, rlsn))

		if (!check_index_buffer(ib, bytes) ||
		    !check_if_alloc_index(hdr, aoff) ||
		    aoff + dlen > offsetof(struct INDEX_BUFFER, ihdr) +
					  le32_to_cpu(hdr->total)) {

		hdr->used = cpu_to_le32(dlen + PtrOffset(hdr, e));
		memmove(e, data, dlen);

		ntfs_fix_pre_write(&ib->rhdr, bytes);

	case SetIndexEntryVcnAllocation:
		ib = Add2Ptr(buffer_le, roff);
		e = Add2Ptr(ib, aoff);

		if (is_baad(&ib->rhdr))

		if (!check_lsn(&ib->rhdr, rlsn))

		if (!check_index_buffer(ib, bytes) ||
		    !check_if_alloc_index(hdr, aoff)) {

		de_set_vbn_le(e, *(__le64 *)data);

		ntfs_fix_pre_write(&ib->rhdr, bytes);

	case UpdateFileNameAllocation:
		ib = Add2Ptr(buffer_le, roff);
		e = Add2Ptr(ib, aoff);

		if (is_baad(&ib->rhdr))

		if (!check_lsn(&ib->rhdr, rlsn))

		if (!check_index_buffer(ib, bytes) ||
		    !check_if_alloc_index(hdr, aoff)) {

		fname = (struct ATTR_FILE_NAME *)(e + 1);
		memmove(&fname->dup, data, sizeof(fname->dup));

		ntfs_fix_pre_write(&ib->rhdr, bytes);
	case SetBitsInNonresidentBitMap:
		off = le32_to_cpu(((struct BITMAP_RANGE *)data)->bitmap_off);
		bits = le32_to_cpu(((struct BITMAP_RANGE *)data)->bits);

		if (cbo + (off + 7) / 8 > lco ||
		    cbo + ((off + bits + 7) / 8) > lco) {

		ntfs_bitmap_set_le(Add2Ptr(buffer_le, roff), off, bits);

	case ClearBitsInNonresidentBitMap:
		off = le32_to_cpu(((struct BITMAP_RANGE *)data)->bitmap_off);
		bits = le32_to_cpu(((struct BITMAP_RANGE *)data)->bits);

		if (cbo + (off + 7) / 8 > lco ||
		    cbo + ((off + bits + 7) / 8) > lco) {

		ntfs_bitmap_clear_le(Add2Ptr(buffer_le, roff), off, bits);

	case UpdateRecordDataAllocation:
		ib = Add2Ptr(buffer_le, roff);
		e = Add2Ptr(ib, aoff);

		if (is_baad(&ib->rhdr))

		if (!check_lsn(&ib->rhdr, rlsn))

		if (!check_index_buffer(ib, bytes) ||
		    !check_if_alloc_index(hdr, aoff)) {

		memmove(Add2Ptr(e, le16_to_cpu(e->view.data_off)), data, dlen);

		ntfs_fix_pre_write(&ib->rhdr, bytes);
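
	/*
	 * Note (added): for the bitmap cases above, 'off' and 'bits' describe
	 * a bit range inside the non-resident bitmap, so the range check
	 * rounds both ends up to whole bytes ((off + 7) / 8 and
	 * (off + bits + 7) / 8) and makes sure they still land inside the
	 * clusters covered by this log record.
	 */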
		__le64 t64 = cpu_to_le64(*rlsn);

			rec->rhdr.lsn = t64;

	if (mi && mi->dirty) {
		err = mi_write(mi, 0);

		err = ntfs_sb_write_run(sbi, oa->run1, vbo, buffer_le, bytes,

	else if (mi != mi2_child)

	log->set_dirty = true;
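
/*
 * Note (added): do_action() is structured as two switches on the operation
 * code: the first ("Big switch to prepare") loads the MFT record or the
 * non-resident buffer the log record refers to, the second ("Big switch to
 * do operation") applies the redo or undo data to it; afterwards the dirty
 * MFT record or buffer is written back, and the log is marked dirty if
 * anything failed.
 */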
/*
 * log_replay - Replays log and empties it.
 *
 * This function is called during mount operation.
 * It replays log and empties it.
 * Initialized is set false if logfile contains '-1'.
 */
int log_replay(struct ntfs_inode *ni, bool *initialized)
	struct ntfs_sb_info *sbi = ni->mi.sbi;
	struct ntfs_log *log;

	u64 rec_lsn, checkpt_lsn = 0, rlsn = 0;
	struct ATTR_NAME_ENTRY *attr_names = NULL;
	u32 attr_names_bytes = 0;
	u32 oatbl_bytes = 0;
	struct RESTART_TABLE *dptbl = NULL;
	struct RESTART_TABLE *trtbl = NULL;
	const struct RESTART_TABLE *rt;
	struct RESTART_TABLE *oatbl = NULL;
	struct inode *inode;
	struct OpenAttr *oa;
	struct ntfs_inode *ni_oe;
	struct ATTRIB *attr = NULL;
	u64 size, vcn, undo_next_lsn;
	CLST rno, lcn, lcn0, len0, clen;
	struct NTFS_RESTART *rst = NULL;
	struct lcb *lcb = NULL;
	struct OPEN_ATTR_ENRTY *oe;
	struct ATTR_NAME_ENTRY *ane;
	struct TRANSACTION_ENTRY *tr;
	struct DIR_PAGE_ENTRY *dp;
	u32 i, bytes_per_attr_entry;
	u32 vbo, tail, off, dlen;
	u32 saved_len, rec_len, transact_id;
	bool use_second_page;
	struct RESTART_AREA *ra2, *ra = NULL;
	struct CLIENT_REC *ca, *cr;
	struct RESTART_HDR *rh;
	const struct LFS_RECORD_HDR *frh;
	const struct LOG_REC_HDR *lrh;
	bool is_ro = sb_rdonly(sbi->sb);
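
	/*
	 * Note (added): replay below proceeds in the classical three passes:
	 * an analysis pass from the checkpoint lsn rebuilds the transaction,
	 * dirty page and open attribute tables, a redo pass reapplies the
	 * updates recorded for dirty pages, and an undo pass rolls back
	 * transactions that never committed, before the restart areas are
	 * rewritten.
	 */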
3779 log
= kzalloc(sizeof(struct ntfs_log
), GFP_NOFS
);
3784 log
->l_size
= log
->orig_file_size
= ni
->vfs_inode
.i_size
;
3786 /* Get the size of page. NOTE: To replay we can use default page. */
3787 #if PAGE_SIZE >= DefaultLogPageSize && PAGE_SIZE <= DefaultLogPageSize * 2
3788 log
->page_size
= norm_file_page(PAGE_SIZE
, &log
->l_size
, true);
3790 log
->page_size
= norm_file_page(PAGE_SIZE
, &log
->l_size
, false);
3792 if (!log
->page_size
) {
3797 log
->one_page_buf
= kmalloc(log
->page_size
, GFP_NOFS
);
3798 if (!log
->one_page_buf
) {
3803 log
->page_mask
= log
->page_size
- 1;
3804 log
->page_bits
= blksize_bits(log
->page_size
);
3806 /* Look for a restart area on the disk. */
3807 err
= log_read_rst(log
, true, &log
->rst_info
);
3811 /* remember 'initialized' */
3812 *initialized
= log
->rst_info
.initialized
;
3814 if (!log
->rst_info
.restart
) {
3815 if (log
->rst_info
.initialized
) {
3816 /* No restart area but the file is not initialized. */
3821 log_init_pg_hdr(log
, 1, 1);
3822 log_create(log
, 0, get_random_u32(), false, false);
3824 ra
= log_create_ra(log
);
3830 log
->init_ra
= true;
3836 * If the restart offset above wasn't zero then we won't
3837 * look for a second restart.
3839 if (log
->rst_info
.vbo
)
3840 goto check_restart_area
;
3842 err
= log_read_rst(log
, false, &log
->rst_info2
);
3846 /* Determine which restart area to use. */
3847 if (!log
->rst_info2
.restart
||
3848 log
->rst_info2
.last_lsn
<= log
->rst_info
.last_lsn
)
3849 goto use_first_page
;
3851 use_second_page
= true;
3853 if (log
->rst_info
.chkdsk_was_run
&&
3854 log
->page_size
!= log
->rst_info
.vbo
) {
3855 struct RECORD_PAGE_HDR
*sp
= NULL
;
3858 if (!read_log_page(log
, log
->page_size
, &sp
, &usa_error
) &&
3859 sp
->rhdr
.sign
== NTFS_CHKD_SIGNATURE
) {
3860 use_second_page
= false;
3865 if (use_second_page
) {
3866 kfree(log
->rst_info
.r_page
);
3867 memcpy(&log
->rst_info
, &log
->rst_info2
,
3868 sizeof(struct restart_info
));
3869 log
->rst_info2
.r_page
= NULL
;
3873 kfree(log
->rst_info2
.r_page
);
3877 * If the restart area is at offset 0, we want
3878 * to write the second restart area first.
3880 log
->init_ra
= !!log
->rst_info
.vbo
;
3882 /* If we have a valid page then grab a pointer to the restart area. */
3883 ra2
= log
->rst_info
.valid_page
?
3884 Add2Ptr(log
->rst_info
.r_page
,
3885 le16_to_cpu(log
->rst_info
.r_page
->ra_off
)) :
3888 if (log
->rst_info
.chkdsk_was_run
||
3889 (ra2
&& ra2
->client_idx
[1] == LFS_NO_CLIENT_LE
)) {
3890 bool wrapped
= false;
3891 bool use_multi_page
= false;
3894 /* Do some checks based on whether we have a valid log page. */
3895 open_log_count
= log
->rst_info
.valid_page
?
3896 le32_to_cpu(ra2
->open_log_count
) :
3899 log_init_pg_hdr(log
, 1, 1);
3901 log_create(log
, log
->rst_info
.last_lsn
, open_log_count
, wrapped
,
3904 ra
= log_create_ra(log
);
3911 /* Put the restart areas and initialize
3912 * the log file as required.
3923 * If the log page or the system page sizes have changed, we can't
3924 * use the log file. We must use the system page size instead of the
3925 * default size if there is not a clean shutdown.
3927 t32
= le32_to_cpu(log
->rst_info
.r_page
->sys_page_size
);
3928 if (log
->page_size
!= t32
) {
3929 log
->l_size
= log
->orig_file_size
;
3930 log
->page_size
= norm_file_page(t32
, &log
->l_size
,
3931 t32
== DefaultLogPageSize
);
3934 if (log
->page_size
!= t32
||
3935 log
->page_size
!= le32_to_cpu(log
->rst_info
.r_page
->page_size
)) {
3940 log
->page_mask
= log
->page_size
- 1;
3941 log
->page_bits
= blksize_bits(log
->page_size
);
3943 /* If the file size has shrunk then we won't mount it. */
3944 if (log
->l_size
< le64_to_cpu(ra2
->l_size
)) {
3949 log_init_pg_hdr(log
, le16_to_cpu(log
->rst_info
.r_page
->major_ver
),
3950 le16_to_cpu(log
->rst_info
.r_page
->minor_ver
));
3952 log
->l_size
= le64_to_cpu(ra2
->l_size
);
3953 log
->seq_num_bits
= le32_to_cpu(ra2
->seq_num_bits
);
3954 log
->file_data_bits
= sizeof(u64
) * 8 - log
->seq_num_bits
;
3955 log
->seq_num_mask
= (8 << log
->file_data_bits
) - 1;
3956 log
->last_lsn
= le64_to_cpu(ra2
->current_lsn
);
3957 log
->seq_num
= log
->last_lsn
>> log
->file_data_bits
;
3958 log
->ra_off
= le16_to_cpu(log
->rst_info
.r_page
->ra_off
);
3959 log
->restart_size
= log
->sys_page_size
- log
->ra_off
;
3960 log
->record_header_len
= le16_to_cpu(ra2
->rec_hdr_len
);
3961 log
->ra_size
= le16_to_cpu(ra2
->ra_len
);
3962 log
->data_off
= le16_to_cpu(ra2
->data_off
);
3963 log
->data_size
= log
->page_size
- log
->data_off
;
3964 log
->reserved
= log
->data_size
- log
->record_header_len
;
3966 vbo
= lsn_to_vbo(log
, log
->last_lsn
);
3968 if (vbo
< log
->first_page
) {
3969 /* This is a pseudo lsn. */
3970 log
->l_flags
|= NTFSLOG_NO_LAST_LSN
;
3971 log
->next_page
= log
->first_page
;
3975 /* Find the end of this log record. */
3976 off
= final_log_off(log
, log
->last_lsn
,
3977 le32_to_cpu(ra2
->last_lsn_data_len
));
3979 /* If we wrapped the file then increment the sequence number. */
3982 log
->l_flags
|= NTFSLOG_WRAPPED
;
3985 /* Now compute the next log page to use. */
3986 vbo
&= ~log
->sys_page_mask
;
3987 tail
= log
->page_size
- (off
& log
->page_mask
) - 1;
3990 *If we can fit another log record on the page,
3991 * move back a page the log file.
3993 if (tail
>= log
->record_header_len
) {
3994 log
->l_flags
|= NTFSLOG_REUSE_TAIL
;
3995 log
->next_page
= vbo
;
3997 log
->next_page
= next_page_off(log
, vbo
);
4002 * Find the oldest client lsn. Use the last
4003 * flushed lsn as a starting point.
4005 log
->oldest_lsn
= log
->last_lsn
;
4006 oldest_client_lsn(Add2Ptr(ra2
, le16_to_cpu(ra2
->client_off
)),
4007 ra2
->client_idx
[1], &log
->oldest_lsn
);
4008 log
->oldest_lsn_off
= lsn_to_vbo(log
, log
->oldest_lsn
);
4010 if (log
->oldest_lsn_off
< log
->first_page
)
4011 log
->l_flags
|= NTFSLOG_NO_OLDEST_LSN
;
4013 if (!(ra2
->flags
& RESTART_SINGLE_PAGE_IO
))
4014 log
->l_flags
|= NTFSLOG_WRAPPED
| NTFSLOG_MULTIPLE_PAGE_IO
;
4016 log
->current_openlog_count
= le32_to_cpu(ra2
->open_log_count
);
4017 log
->total_avail_pages
= log
->l_size
- log
->first_page
;
4018 log
->total_avail
= log
->total_avail_pages
>> log
->page_bits
;
4019 log
->max_current_avail
= log
->total_avail
* log
->reserved
;
4020 log
->total_avail
= log
->total_avail
* log
->data_size
;
4022 log
->current_avail
= current_log_avail(log
);
4024 ra
= kzalloc(log
->restart_size
, GFP_NOFS
);
4031 t16
= le16_to_cpu(ra2
->client_off
);
4032 if (t16
== offsetof(struct RESTART_AREA
, clients
)) {
4033 memcpy(ra
, ra2
, log
->ra_size
);
4035 memcpy(ra
, ra2
, offsetof(struct RESTART_AREA
, clients
));
4036 memcpy(ra
->clients
, Add2Ptr(ra2
, t16
),
4037 le16_to_cpu(ra2
->ra_len
) - t16
);
4039 log
->current_openlog_count
= get_random_u32();
4040 ra
->open_log_count
= cpu_to_le32(log
->current_openlog_count
);
4041 log
->ra_size
= offsetof(struct RESTART_AREA
, clients
) +
4042 sizeof(struct CLIENT_REC
);
4044 cpu_to_le16(offsetof(struct RESTART_AREA
, clients
));
4045 ra
->ra_len
= cpu_to_le16(log
->ra_size
);
4048 le32_add_cpu(&ra
->open_log_count
, 1);
4050 /* Now we need to walk through looking for the last lsn. */
4051 err
= last_log_lsn(log
);
4055 log
->current_avail
= current_log_avail(log
);
4057 /* Remember which restart area to write first. */
4058 log
->init_ra
= log
->rst_info
.vbo
;
4061 /* 1.0, 1.1, 2.0 log->major_ver/minor_ver - short values. */
4062 switch ((log
->major_ver
<< 16) + log
->minor_ver
) {
4068 ntfs_warn(sbi
->sb
, "\x24LogFile version %d.%d is not supported",
4069 log
->major_ver
, log
->minor_ver
);
4071 log
->set_dirty
= true;
4075 /* One client "NTFS" per logfile. */
4076 ca
= Add2Ptr(ra
, le16_to_cpu(ra
->client_off
));
4078 for (client
= ra
->client_idx
[1];; client
= cr
->next_client
) {
4079 if (client
== LFS_NO_CLIENT_LE
) {
4080 /* Insert "NTFS" client LogFile. */
4081 client
= ra
->client_idx
[0];
4082 if (client
== LFS_NO_CLIENT_LE
) {
4087 t16
= le16_to_cpu(client
);
4090 remove_client(ca
, cr
, &ra
->client_idx
[0]);
4092 cr
->restart_lsn
= 0;
4093 cr
->oldest_lsn
= cpu_to_le64(log
->oldest_lsn
);
4094 cr
->name_bytes
= cpu_to_le32(8);
4095 cr
->name
[0] = cpu_to_le16('N');
4096 cr
->name
[1] = cpu_to_le16('T');
4097 cr
->name
[2] = cpu_to_le16('F');
4098 cr
->name
[3] = cpu_to_le16('S');
4100 add_client(ca
, t16
, &ra
->client_idx
[1]);
4104 cr
= ca
+ le16_to_cpu(client
);
4106 if (cpu_to_le32(8) == cr
->name_bytes
&&
4107 cpu_to_le16('N') == cr
->name
[0] &&
4108 cpu_to_le16('T') == cr
->name
[1] &&
4109 cpu_to_le16('F') == cr
->name
[2] &&
4110 cpu_to_le16('S') == cr
->name
[3])
4114 /* Update the client handle with the client block information. */
4115 log
->client_id
.seq_num
= cr
->seq_num
;
4116 log
->client_id
.client_idx
= client
;
4118 err
= read_rst_area(log
, &rst
, &checkpt_lsn
);
4125 bytes_per_attr_entry
= !rst
->major_ver
? 0x2C : 0x28;
4127 if (rst
->check_point_start
)
4128 checkpt_lsn
= le64_to_cpu(rst
->check_point_start
);
4130 /* Allocate and Read the Transaction Table. */
4131 if (!rst
->transact_table_len
)
4132 goto check_dirty_page_table
; /* reduce tab pressure. */
4134 t64
= le64_to_cpu(rst
->transact_table_lsn
);
4135 err
= read_log_rec_lcb(log
, t64
, lcb_ctx_prev
, &lcb
);
4141 rec_len
= le32_to_cpu(frh
->client_data_len
);
4143 if (!check_log_rec(lrh
, rec_len
, le32_to_cpu(frh
->transact_id
),
4144 bytes_per_attr_entry
)) {
4149 t16
= le16_to_cpu(lrh
->redo_off
);
4151 rt
= Add2Ptr(lrh
, t16
);
4152 t32
= rec_len
- t16
;
4154 /* Now check that this is a valid restart table. */
4155 if (!check_rstbl(rt
, t32
)) {
4160 trtbl
= kmemdup(rt
, t32
, GFP_NOFS
);
4169 check_dirty_page_table
:
4170 /* The next record back should be the Dirty Pages Table. */
4171 if (!rst
->dirty_pages_len
)
4172 goto check_attribute_names
; /* reduce tab pressure. */
4174 t64
= le64_to_cpu(rst
->dirty_pages_table_lsn
);
4175 err
= read_log_rec_lcb(log
, t64
, lcb_ctx_prev
, &lcb
);
4181 rec_len
= le32_to_cpu(frh
->client_data_len
);
4183 if (!check_log_rec(lrh
, rec_len
, le32_to_cpu(frh
->transact_id
),
4184 bytes_per_attr_entry
)) {
4189 t16
= le16_to_cpu(lrh
->redo_off
);
4191 rt
= Add2Ptr(lrh
, t16
);
4192 t32
= rec_len
- t16
;
4194 /* Now check that this is a valid restart table. */
4195 if (!check_rstbl(rt
, t32
)) {
4200 dptbl
= kmemdup(rt
, t32
, GFP_NOFS
);
4206 /* Convert Ra version '0' into version '1'. */
4208 goto end_conv_1
; /* reduce tab pressure. */
4211 while ((dp
= enum_rstbl(dptbl
, dp
))) {
4212 struct DIR_PAGE_ENTRY_32
*dp0
= (struct DIR_PAGE_ENTRY_32
*)dp
;
4213 // NOTE: Danger. Check for of boundary.
4214 memmove(&dp
->vcn
, &dp0
->vcn_low
,
4216 le32_to_cpu(dp
->lcns_follow
) * sizeof(u64
));
4224 * Go through the table and remove the duplicates,
4225 * remembering the oldest lsn values.
4227 if (sbi
->cluster_size
<= log
->page_size
)
4228 goto trace_dp_table
; /* reduce tab pressure. */
4230 while ((dp
= enum_rstbl(dptbl
, dp
))) {
4231 struct DIR_PAGE_ENTRY
*next
= dp
;
4233 while ((next
= enum_rstbl(dptbl
, next
))) {
4234 if (next
->target_attr
== dp
->target_attr
&&
4235 next
->vcn
== dp
->vcn
) {
4236 if (le64_to_cpu(next
->oldest_lsn
) <
4237 le64_to_cpu(dp
->oldest_lsn
)) {
4238 dp
->oldest_lsn
= next
->oldest_lsn
;
4241 free_rsttbl_idx(dptbl
, PtrOffset(dptbl
, next
));
4246 check_attribute_names
:
4247 /* The next record should be the Attribute Names. */
4248 if (!rst
->attr_names_len
)
4249 goto check_attr_table
; /* reduce tab pressure. */
4251 t64
= le64_to_cpu(rst
->attr_names_lsn
);
4252 err
= read_log_rec_lcb(log
, t64
, lcb_ctx_prev
, &lcb
);
4258 rec_len
= le32_to_cpu(frh
->client_data_len
);
4260 if (!check_log_rec(lrh
, rec_len
, le32_to_cpu(frh
->transact_id
),
4261 bytes_per_attr_entry
)) {
4266 t32
= lrh_length(lrh
);
4267 attr_names_bytes
= rec_len
- t32
;
4269 attr_names
= kmemdup(Add2Ptr(lrh
, t32
), attr_names_bytes
, GFP_NOFS
);
4279 /* The next record should be the attribute Table. */
4280 if (!rst
->open_attr_len
)
4281 goto check_attribute_names2
; /* reduce tab pressure. */
4283 t64
= le64_to_cpu(rst
->open_attr_table_lsn
);
4284 err
= read_log_rec_lcb(log
, t64
, lcb_ctx_prev
, &lcb
);
4290 rec_len
= le32_to_cpu(frh
->client_data_len
);
4292 if (!check_log_rec(lrh
, rec_len
, le32_to_cpu(frh
->transact_id
),
4293 bytes_per_attr_entry
)) {
4298 t16
= le16_to_cpu(lrh
->redo_off
);
4300 rt
= Add2Ptr(lrh
, t16
);
4301 oatbl_bytes
= rec_len
- t16
;
4303 if (!check_rstbl(rt
, oatbl_bytes
)) {
4308 oatbl
= kmemdup(rt
, oatbl_bytes
, GFP_NOFS
);
4314 log
->open_attr_tbl
= oatbl
;
4316 /* Clear all of the Attr pointers. */
4318 while ((oe
= enum_rstbl(oatbl
, oe
))) {
4319 if (!rst
->major_ver
) {
4320 struct OPEN_ATTR_ENRTY_32 oe0
;
4322 /* Really 'oe' points to OPEN_ATTR_ENRTY_32. */
4323 memcpy(&oe0
, oe
, SIZEOF_OPENATTRIBUTEENTRY0
);
4325 oe
->bytes_per_index
= oe0
.bytes_per_index
;
4326 oe
->type
= oe0
.type
;
4327 oe
->is_dirty_pages
= oe0
.is_dirty_pages
;
4330 oe
->open_record_lsn
= oe0
.open_record_lsn
;
4333 oe
->is_attr_name
= 0;
4340 check_attribute_names2
:
4341 if (attr_names
&& oatbl
) {
4344 /* Check we can use attribute name entry 'ane'. */
4345 static_assert(sizeof(*ane
) == 4);
4346 if (off
+ sizeof(*ane
) > attr_names_bytes
) {
4347 /* just ignore the rest. */
4351 ane
= Add2Ptr(attr_names
, off
);
4352 t16
= le16_to_cpu(ane
->off
);
4354 /* this is the only valid exit. */
4358 /* Check we can use open attribute entry 'oe'. */
4359 if (t16
+ sizeof(*oe
) > oatbl_bytes
) {
4360 /* just ignore the rest. */
4364 /* TODO: Clear table on exit! */
4365 oe
= Add2Ptr(oatbl
, t16
);
4366 t16
= le16_to_cpu(ane
->name_bytes
);
4367 off
+= t16
+ sizeof(*ane
);
4368 if (off
> attr_names_bytes
) {
4369 /* just ignore the rest. */
4372 oe
->name_len
= t16
/ sizeof(short);
4373 oe
->ptr
= ane
->name
;
4374 oe
->is_attr_name
= 2;
4379 * If the checkpt_lsn is zero, then this is a freshly
4380 * formatted disk and we have no work to do.
4388 oatbl
= init_rsttbl(bytes_per_attr_entry
, 8);
4395 log
->open_attr_tbl
= oatbl
;
4397 /* Start the analysis pass from the Checkpoint lsn. */
4398 rec_lsn
= checkpt_lsn
;
4400 /* Read the first lsn. */
4401 err
= read_log_rec_lcb(log
, checkpt_lsn
, lcb_ctx_next
, &lcb
);
4405 /* Loop to read all subsequent records to the end of the log file. */
4406 next_log_record_analyze
:
4407 err
= read_next_log_rec(log
, lcb
, &rec_lsn
);
4412 goto end_log_records_enumerate
;
4415 transact_id
= le32_to_cpu(frh
->transact_id
);
4416 rec_len
= le32_to_cpu(frh
->client_data_len
);
4419 if (!check_log_rec(lrh
, rec_len
, transact_id
, bytes_per_attr_entry
)) {
4425 * The first lsn after the previous lsn remembered
4426 * the checkpoint is the first candidate for the rlsn.
4431 if (LfsClientRecord
!= frh
->record_type
)
4432 goto next_log_record_analyze
;
4435 * Now update the Transaction Table for this transaction. If there
4436 * is no entry present or it is unallocated we allocate the entry.
4439 trtbl
= init_rsttbl(sizeof(struct TRANSACTION_ENTRY
),
4440 INITIAL_NUMBER_TRANSACTIONS
);
4447 tr
= Add2Ptr(trtbl
, transact_id
);
4449 if (transact_id
>= bytes_per_rt(trtbl
) ||
4450 tr
->next
!= RESTART_ENTRY_ALLOCATED_LE
) {
4451 tr
= alloc_rsttbl_from_idx(&trtbl
, transact_id
);
4456 tr
->transact_state
= TransactionActive
;
4457 tr
->first_lsn
= cpu_to_le64(rec_lsn
);
4460 tr
->prev_lsn
= tr
->undo_next_lsn
= cpu_to_le64(rec_lsn
);
4463 * If this is a compensation log record, then change
4464 * the undo_next_lsn to be the undo_next_lsn of this record.
4466 if (lrh
->undo_op
== cpu_to_le16(CompensationLogRecord
))
4467 tr
->undo_next_lsn
= frh
->client_undo_next_lsn
;
4469 /* Dispatch to handle log record depending on type. */
4470 switch (le16_to_cpu(lrh
->redo_op
)) {
4471 case InitializeFileRecordSegment
:
4472 case DeallocateFileRecordSegment
:
4473 case WriteEndOfFileRecordSegment
:
4474 case CreateAttribute
:
4475 case DeleteAttribute
:
4476 case UpdateResidentValue
:
4477 case UpdateNonresidentValue
:
4478 case UpdateMappingPairs
:
4479 case SetNewAttributeSizes
:
4480 case AddIndexEntryRoot
:
4481 case DeleteIndexEntryRoot
:
4482 case AddIndexEntryAllocation
:
4483 case DeleteIndexEntryAllocation
:
4484 case WriteEndOfIndexBuffer
:
4485 case SetIndexEntryVcnRoot
:
4486 case SetIndexEntryVcnAllocation
:
4487 case UpdateFileNameRoot
:
4488 case UpdateFileNameAllocation
:
4489 case SetBitsInNonresidentBitMap
:
4490 case ClearBitsInNonresidentBitMap
:
4491 case UpdateRecordDataRoot
:
4492 case UpdateRecordDataAllocation
:
4493 case ZeroEndOfFileRecord
:
4494 t16
= le16_to_cpu(lrh
->target_attr
);
4495 t64
= le64_to_cpu(lrh
->target_vcn
);
4496 dp
= find_dp(dptbl
, t16
, t64
);
4502 * Calculate the number of clusters per page the system
4503 * which wrote the checkpoint, possibly creating the table.
4506 t32
= (le16_to_cpu(dptbl
->size
) -
4507 sizeof(struct DIR_PAGE_ENTRY
)) /
4510 t32
= log
->clst_per_page
;
4512 dptbl
= init_rsttbl(struct_size(dp
, page_lcns
, t32
),
4520 dp
= alloc_rsttbl_idx(&dptbl
);
4525 dp
->target_attr
= cpu_to_le32(t16
);
4526 dp
->transfer_len
= cpu_to_le32(t32
<< sbi
->cluster_bits
);
4527 dp
->lcns_follow
= cpu_to_le32(t32
);
4528 dp
->vcn
= cpu_to_le64(t64
& ~((u64
)t32
- 1));
4529 dp
->oldest_lsn
= cpu_to_le64(rec_lsn
);
4533 * Copy the Lcns from the log record into the Dirty Page Entry.
4534 * TODO: For different page size support, must somehow make
4535 * whole routine a loop, case Lcns do not fit below.
4537 t16
= le16_to_cpu(lrh
->lcns_follow
);
4538 for (i
= 0; i
< t16
; i
++) {
4539 size_t j
= (size_t)(le64_to_cpu(lrh
->target_vcn
) -
4540 le64_to_cpu(dp
->vcn
));
4541 dp
->page_lcns
[j
+ i
] = lrh
->page_lcns
[i
];
4544 goto next_log_record_analyze
;
4546 case DeleteDirtyClusters
: {
4548 le16_to_cpu(lrh
->redo_len
) / sizeof(struct LCN_RANGE
);
4549 const struct LCN_RANGE
*r
=
4550 Add2Ptr(lrh
, le16_to_cpu(lrh
->redo_off
));
4552 /* Loop through all of the Lcn ranges this log record. */
4553 for (i
= 0; i
< range_count
; i
++, r
++) {
4554 u64 lcn0
= le64_to_cpu(r
->lcn
);
4555 u64 lcn_e
= lcn0
+ le64_to_cpu(r
->len
) - 1;
4558 while ((dp
= enum_rstbl(dptbl
, dp
))) {
4561 t32
= le32_to_cpu(dp
->lcns_follow
);
4562 for (j
= 0; j
< t32
; j
++) {
4563 t64
= le64_to_cpu(dp
->page_lcns
[j
]);
4564 if (t64
>= lcn0
&& t64
<= lcn_e
)
4565 dp
->page_lcns
[j
] = 0;
4569 goto next_log_record_analyze
;
4572 case OpenNonresidentAttribute
:
4573 t16
= le16_to_cpu(lrh
->target_attr
);
4574 if (t16
>= bytes_per_rt(oatbl
)) {
4576 * Compute how big the table needs to be.
4577 * Add 10 extra entries for some cushion.
4579 u32 new_e
= t16
/ le16_to_cpu(oatbl
->size
);
4581 new_e
+= 10 - le16_to_cpu(oatbl
->used
);
4583 oatbl
= extend_rsttbl(oatbl
, new_e
, ~0u);
4584 log
->open_attr_tbl
= oatbl
;
4591 /* Point to the entry being opened. */
4592 oe
= alloc_rsttbl_from_idx(&oatbl
, t16
);
4593 log
->open_attr_tbl
= oatbl
;
4599 /* Initialize this entry from the log record. */
4600 t16
= le16_to_cpu(lrh
->redo_off
);
4601 if (!rst
->major_ver
) {
4602 /* Convert version '0' into version '1'. */
4603 struct OPEN_ATTR_ENRTY_32
*oe0
= Add2Ptr(lrh
, t16
);
4605 oe
->bytes_per_index
= oe0
->bytes_per_index
;
4606 oe
->type
= oe0
->type
;
4607 oe
->is_dirty_pages
= oe0
->is_dirty_pages
;
4608 oe
->name_len
= 0; //oe0.name_len;
4610 oe
->open_record_lsn
= oe0
->open_record_lsn
;
4612 memcpy(oe
, Add2Ptr(lrh
, t16
), bytes_per_attr_entry
);
4615 t16
= le16_to_cpu(lrh
->undo_len
);
4617 oe
->ptr
= kmalloc(t16
, GFP_NOFS
);
4622 oe
->name_len
= t16
/ sizeof(short);
4624 Add2Ptr(lrh
, le16_to_cpu(lrh
->undo_off
)), t16
);
4625 oe
->is_attr_name
= 1;
4628 oe
->is_attr_name
= 0;
4631 goto next_log_record_analyze
;
4634 t16
= le16_to_cpu(lrh
->target_attr
);
4635 t64
= le64_to_cpu(lrh
->target_vcn
);
4636 dp
= find_dp(dptbl
, t16
, t64
);
4638 size_t j
= le64_to_cpu(lrh
->target_vcn
) -
4639 le64_to_cpu(dp
->vcn
);
4640 if (dp
->page_lcns
[j
])
4641 dp
->page_lcns
[j
] = lrh
->page_lcns
[0];
4643 goto next_log_record_analyze
;
4645 case EndTopLevelAction
:
4646 tr
= Add2Ptr(trtbl
, transact_id
);
4647 tr
->prev_lsn
= cpu_to_le64(rec_lsn
);
4648 tr
->undo_next_lsn
= frh
->client_undo_next_lsn
;
4649 goto next_log_record_analyze
;
4651 case PrepareTransaction
:
4652 tr
= Add2Ptr(trtbl
, transact_id
);
4653 tr
->transact_state
= TransactionPrepared
;
4654 goto next_log_record_analyze
;
4656 case CommitTransaction
:
4657 tr
= Add2Ptr(trtbl
, transact_id
);
4658 tr
->transact_state
= TransactionCommitted
;
4659 goto next_log_record_analyze
;
4661 case ForgetTransaction
:
4662 free_rsttbl_idx(trtbl
, transact_id
);
4663 goto next_log_record_analyze
;
4666 case OpenAttributeTableDump
:
4667 case AttributeNamesDump
:
4668 case DirtyPageTableDump
:
4669 case TransactionTableDump
:
4670 /* The following cases require no action the Analysis Pass. */
4671 goto next_log_record_analyze
;
4675 * All codes will be explicitly handled.
4676 * If we see a code we do not expect, then we are trouble.
4678 goto next_log_record_analyze
;
4681 end_log_records_enumerate
:
4686 * Scan the Dirty Page Table and Transaction Table for
4687 * the lowest lsn, and return it as the Redo lsn.
4690 while ((dp
= enum_rstbl(dptbl
, dp
))) {
4691 t64
= le64_to_cpu(dp
->oldest_lsn
);
4692 if (t64
&& t64
< rlsn
)
4697 while ((tr
= enum_rstbl(trtbl
, tr
))) {
4698 t64
= le64_to_cpu(tr
->first_lsn
);
4699 if (t64
&& t64
< rlsn
)
4704 * Only proceed if the Dirty Page Table or Transaction
4705 * table are not empty.
4707 if ((!dptbl
|| !dptbl
->total
) && (!trtbl
|| !trtbl
->total
))
4710 sbi
->flags
|= NTFS_FLAGS_NEED_REPLAY
;
4714 /* Reopen all of the attributes with dirty pages. */
4716 next_open_attribute
:
4718 oe
= enum_rstbl(oatbl
, oe
);
4722 goto next_dirty_page
;
4725 oa
= kzalloc(sizeof(struct OpenAttr
), GFP_NOFS
);
4731 inode
= ntfs_iget5(sbi
->sb
, &oe
->ref
, NULL
);
4735 if (is_bad_inode(inode
)) {
4739 iput(&oa
->ni
->vfs_inode
);
4743 attr
= attr_create_nonres_log(sbi
, oe
->type
, 0, oe
->ptr
,
4751 oa
->run1
= &oa
->run0
;
4755 ni_oe
= ntfs_i(inode
);
4758 attr
= ni_find_attr(ni_oe
, NULL
, NULL
, oe
->type
, oe
->ptr
, oe
->name_len
,
4764 t32
= le32_to_cpu(attr
->size
);
4765 oa
->attr
= kmemdup(attr
, t32
, GFP_NOFS
);
4769 if (!S_ISDIR(inode
->i_mode
)) {
4770 if (attr
->type
== ATTR_DATA
&& !attr
->name_len
) {
4771 oa
->run1
= &ni_oe
->file
.run
;
4775 if (attr
->type
== ATTR_ALLOC
&&
4776 attr
->name_len
== ARRAY_SIZE(I30_NAME
) &&
4777 !memcmp(attr_name(attr
), I30_NAME
, sizeof(I30_NAME
))) {
4778 oa
->run1
= &ni_oe
->dir
.alloc_run
;
4783 if (attr
->non_res
) {
4784 u16 roff
= le16_to_cpu(attr
->nres
.run_off
);
4785 CLST svcn
= le64_to_cpu(attr
->nres
.svcn
);
4793 err
= run_unpack(&oa
->run0
, sbi
, inode
->i_ino
, svcn
,
4794 le64_to_cpu(attr
->nres
.evcn
), svcn
,
4795 Add2Ptr(attr
, roff
), t32
- roff
);
4803 oa
->run1
= &oa
->run0
;
4807 if (oe
->is_attr_name
== 1)
4809 oe
->is_attr_name
= 0;
4811 oe
->name_len
= attr
->name_len
;
4813 goto next_open_attribute
;
4816 * Now loop through the dirty page table to extract all of the Vcn/Lcn.
4817 * Mapping that we have, and insert it into the appropriate run.
4820 dp
= enum_rstbl(dptbl
, dp
);
4824 oe
= Add2Ptr(oatbl
, le32_to_cpu(dp
->target_attr
));
4826 if (oe
->next
!= RESTART_ENTRY_ALLOCATED_LE
)
4827 goto next_dirty_page
;
4831 goto next_dirty_page
;
4834 next_dirty_page_vcn
:
4836 if (i
>= le32_to_cpu(dp
->lcns_follow
))
4837 goto next_dirty_page
;
4839 vcn
= le64_to_cpu(dp
->vcn
) + i
;
4840 size
= (vcn
+ 1) << sbi
->cluster_bits
;
4842 if (!dp
->page_lcns
[i
])
4843 goto next_dirty_page_vcn
;
4845 rno
= ino_get(&oe
->ref
);
4846 if (rno
<= MFT_REC_MIRR
&&
4847 size
< (MFT_REC_VOL
+ 1) * sbi
->record_size
&&
4848 oe
->type
== ATTR_DATA
) {
4849 goto next_dirty_page_vcn
;
4852 lcn
= le64_to_cpu(dp
->page_lcns
[i
]);
4854 if ((!run_lookup_entry(oa
->run1
, vcn
, &lcn0
, &len0
, NULL
) ||
4856 !run_add_entry(oa
->run1
, vcn
, lcn
, 1, false)) {
4861 if (size
> le64_to_cpu(attr
->nres
.alloc_size
)) {
4862 attr
->nres
.valid_size
= attr
->nres
.data_size
=
4863 attr
->nres
.alloc_size
= cpu_to_le64(size
);
4865 goto next_dirty_page_vcn
;
4869 * Perform the Redo Pass, to restore all of the dirty pages to the same
4870 * contents that they had immediately before the crash. If the dirty
4871 * page table is empty, then we can skip the entire Redo Pass.
4873 if (!dptbl
|| !dptbl
->total
)
4874 goto do_undo_action
;
4879 * Read the record at the Redo lsn, before falling
4880 * into common code to handle each record.
4882 err
= read_log_rec_lcb(log
, rlsn
, lcb_ctx_next
, &lcb
);
4887 * Now loop to read all of our log records forwards, until
4888 * we hit the end of the file, cleaning up at the end.
4893 if (LfsClientRecord
!= frh
->record_type
)
4894 goto read_next_log_do_action
;
4896 transact_id
= le32_to_cpu(frh
->transact_id
);
4897 rec_len
= le32_to_cpu(frh
->client_data_len
);
4900 if (!check_log_rec(lrh
, rec_len
, transact_id
, bytes_per_attr_entry
)) {
4905 /* Ignore log records that do not update pages. */
4906 if (lrh
->lcns_follow
)
4907 goto find_dirty_page
;
4909 goto read_next_log_do_action
;
4912 t16
= le16_to_cpu(lrh
->target_attr
);
4913 t64
= le64_to_cpu(lrh
->target_vcn
);
4914 dp
= find_dp(dptbl
, t16
, t64
);
4917 goto read_next_log_do_action
;
4919 if (rec_lsn
< le64_to_cpu(dp
->oldest_lsn
))
4920 goto read_next_log_do_action
;
4922 t16
= le16_to_cpu(lrh
->target_attr
);
4923 if (t16
>= bytes_per_rt(oatbl
)) {
4928 oe
= Add2Ptr(oatbl
, t16
);
4930 if (oe
->next
!= RESTART_ENTRY_ALLOCATED_LE
) {
4943 vcn
= le64_to_cpu(lrh
->target_vcn
);
4945 if (!run_lookup_entry(oa
->run1
, vcn
, &lcn
, NULL
, NULL
) ||
4946 lcn
== SPARSE_LCN
) {
4947 goto read_next_log_do_action
;
4950 /* Point to the Redo data and get its length. */
4951 data
= Add2Ptr(lrh
, le16_to_cpu(lrh
->redo_off
));
4952 dlen
= le16_to_cpu(lrh
->redo_len
);
4954 /* Shorten length by any Lcns which were deleted. */
4957 for (i
= le16_to_cpu(lrh
->lcns_follow
); i
; i
--) {
4961 voff
= le16_to_cpu(lrh
->record_off
) +
4962 le16_to_cpu(lrh
->attr_off
);
4963 voff
+= le16_to_cpu(lrh
->cluster_off
) << SECTOR_SHIFT
;
4965 /* If the Vcn question is allocated, we can just get out. */
4966 j
= le64_to_cpu(lrh
->target_vcn
) - le64_to_cpu(dp
->vcn
);
4967 if (dp
->page_lcns
[j
+ i
- 1])
4974 * Calculate the allocated space left relative to the
4975 * log record Vcn, after removing this unallocated Vcn.
4977 alen
= (i
- 1) << sbi
->cluster_bits
;
4980 * If the update described this log record goes beyond
4981 * the allocated space, then we will have to reduce the length.
4985 else if (voff
+ dlen
> alen
)
4990 * If the resulting dlen from above is now zero,
4991 * we can skip this log record.
4993 if (!dlen
&& saved_len
)
4994 goto read_next_log_do_action
;
4996 t16
= le16_to_cpu(lrh
->redo_op
);
4997 if (can_skip_action(t16
))
4998 goto read_next_log_do_action
;
5000 /* Apply the Redo operation a common routine. */
5001 err
= do_action(log
, oe
, lrh
, t16
, data
, dlen
, rec_len
, &rec_lsn
);
5005 /* Keep reading and looping back until end of file. */
5006 read_next_log_do_action
:
5007 err
= read_next_log_rec(log
, lcb
, &rec_lsn
);
5008 if (!err
&& rec_lsn
)
5009 goto do_action_next
;
5015 /* Scan Transaction Table. */
5017 transaction_table_next
:
5018 tr
= enum_rstbl(trtbl
, tr
);
5020 goto undo_action_done
;
5022 if (TransactionActive
!= tr
->transact_state
|| !tr
->undo_next_lsn
) {
5023 free_rsttbl_idx(trtbl
, PtrOffset(trtbl
, tr
));
5024 goto transaction_table_next
;
5027 log
->transaction_id
= PtrOffset(trtbl
, tr
);
5028 undo_next_lsn
= le64_to_cpu(tr
->undo_next_lsn
);
5031 * We only have to do anything if the transaction has
5032 * something its undo_next_lsn field.
5037 /* Read the first record to be undone by this transaction. */
5038 err
= read_log_rec_lcb(log
, undo_next_lsn
, lcb_ctx_undo_next
, &lcb
);
5043 * Now loop to read all of our log records forwards,
5044 * until we hit the end of the file, cleaning up at the end.
5050 transact_id
= le32_to_cpu(frh
->transact_id
);
5051 rec_len
= le32_to_cpu(frh
->client_data_len
);
5053 if (!check_log_rec(lrh
, rec_len
, transact_id
, bytes_per_attr_entry
)) {
5058 if (lrh
->undo_op
== cpu_to_le16(Noop
))
5059 goto read_next_log_undo_action
;
5061 oe
= Add2Ptr(oatbl
, le16_to_cpu(lrh
->target_attr
));
5064 t16
= le16_to_cpu(lrh
->lcns_follow
);
5066 goto add_allocated_vcns
;
5068 is_mapped
= run_lookup_entry(oa
->run1
, le64_to_cpu(lrh
->target_vcn
),
5072 * If the mapping isn't already the table or the mapping
5073 * corresponds to a hole the mapping, we need to make sure
5074 * there is no partial page already memory.
5076 if (is_mapped
&& lcn
!= SPARSE_LCN
&& clen
>= t16
)
5077 goto add_allocated_vcns
;
5079 vcn
= le64_to_cpu(lrh
->target_vcn
);
5080 vcn
&= ~(u64
)(log
->clst_per_page
- 1);
5083 for (i
= 0, vcn
= le64_to_cpu(lrh
->target_vcn
),
5084 size
= (vcn
+ 1) << sbi
->cluster_bits
;
5085 i
< t16
; i
++, vcn
+= 1, size
+= sbi
->cluster_size
) {
5087 if (!attr
->non_res
) {
5088 if (size
> le32_to_cpu(attr
->res
.data_size
))
5089 attr
->res
.data_size
= cpu_to_le32(size
);
5091 if (size
> le64_to_cpu(attr
->nres
.data_size
))
5092 attr
->nres
.valid_size
= attr
->nres
.data_size
=
5093 attr
->nres
.alloc_size
=
5098 t16
= le16_to_cpu(lrh
->undo_op
);
5099 if (can_skip_action(t16
))
5100 goto read_next_log_undo_action
;
5102 /* Point to the Redo data and get its length. */
5103 data
= Add2Ptr(lrh
, le16_to_cpu(lrh
->undo_off
));
5104 dlen
= le16_to_cpu(lrh
->undo_len
);
5106 /* It is time to apply the undo action. */
5107 err
= do_action(log
, oe
, lrh
, t16
, data
, dlen
, rec_len
, NULL
);
5109 read_next_log_undo_action
:
5111 * Keep reading and looping back until we have read the
5112 * last record for this transaction.
5114 err
= read_next_log_rec(log
, lcb
, &rec_lsn
);
5119 goto undo_action_next
;
5125 free_rsttbl_idx(trtbl
, log
->transaction_id
);
5127 log
->transaction_id
= 0;
5129 goto transaction_table_next
;
5133 ntfs_update_mftmirr(sbi
, 0);
5135 sbi
->flags
&= ~NTFS_FLAGS_NEED_REPLAY
;
5143 rh
= kzalloc(log
->page_size
, GFP_NOFS
);
5149 rh
->rhdr
.sign
= NTFS_RSTR_SIGNATURE
;
5150 rh
->rhdr
.fix_off
= cpu_to_le16(offsetof(struct RESTART_HDR
, fixups
));
5151 t16
= (log
->page_size
>> SECTOR_SHIFT
) + 1;
5152 rh
->rhdr
.fix_num
= cpu_to_le16(t16
);
5153 rh
->sys_page_size
= cpu_to_le32(log
->page_size
);
5154 rh
->page_size
= cpu_to_le32(log
->page_size
);
5156 t16
= ALIGN(offsetof(struct RESTART_HDR
, fixups
) + sizeof(short) * t16
,
5158 rh
->ra_off
= cpu_to_le16(t16
);
5159 rh
->minor_ver
= cpu_to_le16(1); // 0x1A:
5160 rh
->major_ver
= cpu_to_le16(1); // 0x1C:
5162 ra2
= Add2Ptr(rh
, t16
);
5163 memcpy(ra2
, ra
, sizeof(struct RESTART_AREA
));
5165 ra2
->client_idx
[0] = 0;
5166 ra2
->client_idx
[1] = LFS_NO_CLIENT_LE
;
5167 ra2
->flags
= cpu_to_le16(2);
5169 le32_add_cpu(&ra2
->open_log_count
, 1);
5171 ntfs_fix_pre_write(&rh
->rhdr
, log
->page_size
);
5173 err
= ntfs_sb_write_run(sbi
, &ni
->file
.run
, 0, rh
, log
->page_size
, 0);
5175 err
= ntfs_sb_write_run(sbi
, &log
->ni
->file
.run
, log
->page_size
,
5176 rh
, log
->page_size
, 0);
5188 * Scan the Open Attribute Table to close all of
5189 * the open attributes.
5192 while ((oe
= enum_rstbl(oatbl
, oe
))) {
5193 rno
= ino_get(&oe
->ref
);
5195 if (oe
->is_attr_name
== 1) {
5201 if (oe
->is_attr_name
)
5208 run_close(&oa
->run0
);
5211 iput(&oa
->ni
->vfs_inode
);
5219 kfree(log
->rst_info
.r_page
);
5222 kfree(log
->one_page_buf
);
5225 sbi
->flags
|= NTFS_FLAGS_NEED_REPLAY
;
5229 else if (log
->set_dirty
)
5230 ntfs_set_state(sbi
, NTFS_DIRTY_ERROR
);