1 /* Copyright 2001, 2002, 2003 by Hans Reiser, licensing governed by reiser4/README */
4 #include "../../inode.h"
5 #include "../../page_cache.h"
6 #include "../../carry.h"
7 #include "../../vfs_ops.h"
9 #include <linux/quotaops.h>
10 #include <asm/uaccess.h>
11 #include <linux/swap.h>
12 #include <linux/writeback.h>
14 /* plugin->u.item.b.max_key_inside */
15 reiser4_key
*max_key_inside_tail(const coord_t
*coord
, reiser4_key
*key
)
17 item_key_by_coord(coord
, key
);
18 set_key_offset(key
, get_key_offset(reiser4_max_key()));
22 /* plugin->u.item.b.can_contain_key */
23 int can_contain_key_tail(const coord_t
*coord
, const reiser4_key
*key
,
24 const reiser4_item_data
*data
)
28 if (item_plugin_by_coord(coord
) != data
->iplug
)
31 item_key_by_coord(coord
, &item_key
);
32 if (get_key_locality(key
) != get_key_locality(&item_key
) ||
33 get_key_objectid(key
) != get_key_objectid(&item_key
))
39 /* plugin->u.item.b.mergeable
40 first item is of tail type */
41 /* Audited by: green(2002.06.14) */
42 int mergeable_tail(const coord_t
*p1
, const coord_t
*p2
)
44 reiser4_key key1
, key2
;
46 assert("vs-535", plugin_of_group(item_plugin_by_coord(p1
),
47 UNIX_FILE_METADATA_ITEM_TYPE
));
48 assert("vs-365", item_id_by_coord(p1
) == FORMATTING_ID
);
50 if (item_id_by_coord(p2
) != FORMATTING_ID
) {
51 /* second item is of another type */
55 item_key_by_coord(p1
, &key1
);
56 item_key_by_coord(p2
, &key2
);
57 if (get_key_locality(&key1
) != get_key_locality(&key2
) ||
58 get_key_objectid(&key1
) != get_key_objectid(&key2
)
59 || get_key_type(&key1
) != get_key_type(&key2
)) {
60 /* items of different objects */
63 if (get_key_offset(&key1
) + nr_units_tail(p1
) != get_key_offset(&key2
)) {
64 /* not adjacent items */
70 /* plugin->u.item.b.print
71 plugin->u.item.b.check */
73 /* plugin->u.item.b.nr_units */
74 pos_in_node_t
nr_units_tail(const coord_t
* coord
)
76 return item_length_by_coord(coord
);
79 /* plugin->u.item.b.lookup */
81 lookup_tail(const reiser4_key
* key
, lookup_bias bias
, coord_t
* coord
)
84 __u64 lookuped
, offset
;
87 item_key_by_coord(coord
, &item_key
);
88 offset
= get_key_offset(item_key_by_coord(coord
, &item_key
));
89 nr_units
= nr_units_tail(coord
);
91 /* key we are looking for must be greater than key of item @coord */
92 assert("vs-416", keygt(key
, &item_key
));
94 /* offset we are looking for */
95 lookuped
= get_key_offset(key
);
97 if (lookuped
>= offset
&& lookuped
< offset
+ nr_units
) {
98 /* byte we are looking for is in this item */
99 coord
->unit_pos
= lookuped
- offset
;
100 coord
->between
= AT_UNIT
;
101 return CBK_COORD_FOUND
;
104 /* set coord after last unit */
105 coord
->unit_pos
= nr_units
- 1;
106 coord
->between
= AFTER_UNIT
;
108 FIND_MAX_NOT_MORE_THAN
? CBK_COORD_FOUND
: CBK_COORD_NOTFOUND
;
111 /* plugin->u.item.b.paste */
113 paste_tail(coord_t
*coord
, reiser4_item_data
*data
,
114 carry_plugin_info
*info UNUSED_ARG
)
116 unsigned old_item_length
;
119 /* length the item had before resizing has been performed */
120 old_item_length
= item_length_by_coord(coord
) - data
->length
;
122 /* tail items never get pasted in the middle */
124 (coord
->unit_pos
== 0 && coord
->between
== BEFORE_UNIT
) ||
125 (coord
->unit_pos
== old_item_length
- 1 &&
126 coord
->between
== AFTER_UNIT
) ||
127 (coord
->unit_pos
== 0 && old_item_length
== 0
128 && coord
->between
== AT_UNIT
));
130 item
= item_body_by_coord(coord
);
131 if (coord
->unit_pos
== 0)
132 /* make space for pasted data when pasting at the beginning of
134 memmove(item
+ data
->length
, item
, old_item_length
);
136 if (coord
->between
== AFTER_UNIT
)
140 assert("vs-554", data
->user
== 0 || data
->user
== 1);
142 assert("nikita-3035", reiser4_schedulable());
143 /* copy from user space */
144 if (__copy_from_user(item
+ coord
->unit_pos
,
145 (const char __user
*)data
->data
,
146 (unsigned)data
->length
))
147 return RETERR(-EFAULT
);
149 /* copy from kernel space */
150 memcpy(item
+ coord
->unit_pos
, data
->data
,
151 (unsigned)data
->length
);
153 memset(item
+ coord
->unit_pos
, 0, (unsigned)data
->length
);
158 /* plugin->u.item.b.fast_paste */
160 /* plugin->u.item.b.can_shift
161 number of units is returned via return value, number of bytes via @size. For
162 tail items they coincide */
164 can_shift_tail(unsigned free_space
, coord_t
* source UNUSED_ARG
,
165 znode
* target UNUSED_ARG
, shift_direction direction UNUSED_ARG
,
166 unsigned *size
, unsigned want
)
168 /* make sure that that we do not want to shift more than we have */
169 assert("vs-364", want
> 0
170 && want
<= (unsigned)item_length_by_coord(source
));
172 *size
= min(want
, free_space
);
176 /* plugin->u.item.b.copy_units */
178 copy_units_tail(coord_t
* target
, coord_t
* source
,
179 unsigned from
, unsigned count
,
180 shift_direction where_is_free_space
,
181 unsigned free_space UNUSED_ARG
)
183 /* make sure that item @target is expanded already */
184 assert("vs-366", (unsigned)item_length_by_coord(target
) >= count
);
185 assert("vs-370", free_space
>= count
);
187 if (where_is_free_space
== SHIFT_LEFT
) {
188 /* append item @target with @count first bytes of @source */
189 assert("vs-365", from
== 0);
191 memcpy((char *)item_body_by_coord(target
) +
192 item_length_by_coord(target
) - count
,
193 (char *)item_body_by_coord(source
), count
);
195 /* target item is moved to right already */
199 (unsigned)item_length_by_coord(source
) == from
+ count
);
201 memcpy((char *)item_body_by_coord(target
),
202 (char *)item_body_by_coord(source
) + from
, count
);
204 /* new units are inserted before first unit in an item,
205 therefore, we have to update item key */
206 item_key_by_coord(source
, &key
);
207 set_key_offset(&key
, get_key_offset(&key
) + from
);
209 node_plugin_by_node(target
->node
)->update_item_key(target
, &key
,
214 /* plugin->u.item.b.create_hook */
216 /* item_plugin->b.kill_hook
217 this is called when @count units starting from @from-th one are going to be removed
220 kill_hook_tail(const coord_t
* coord
, pos_in_node_t from
,
221 pos_in_node_t count
, struct carry_kill_data
*kdata
)
226 assert("vs-1577", kdata
);
227 assert("vs-1579", kdata
->inode
);
229 item_key_by_coord(coord
, &key
);
230 start
= get_key_offset(&key
) + from
;
232 fake_kill_hook_tail(kdata
->inode
, start
, end
, kdata
->params
.truncate
);
236 /* plugin->u.item.b.shift_hook */
238 /* helper for kill_units_tail and cut_units_tail */
240 do_cut_or_kill(coord_t
* coord
, pos_in_node_t from
, pos_in_node_t to
,
241 reiser4_key
* smallest_removed
, reiser4_key
* new_first
)
245 /* this method is only called to remove part of item */
246 assert("vs-374", (to
- from
+ 1) < item_length_by_coord(coord
));
247 /* tails items are never cut from the middle of an item */
248 assert("vs-396", ergo(from
!= 0, to
== coord_last_unit_pos(coord
)));
249 assert("vs-1558", ergo(from
== 0, to
< coord_last_unit_pos(coord
)));
251 count
= to
- from
+ 1;
253 if (smallest_removed
) {
254 /* store smallest key removed */
255 item_key_by_coord(coord
, smallest_removed
);
256 set_key_offset(smallest_removed
,
257 get_key_offset(smallest_removed
) + from
);
260 /* head of item is cut */
261 assert("vs-1529", from
== 0);
263 item_key_by_coord(coord
, new_first
);
264 set_key_offset(new_first
,
265 get_key_offset(new_first
) + from
+ count
);
269 memset((char *)item_body_by_coord(coord
) + from
, 0, count
);
273 /* plugin->u.item.b.cut_units */
275 cut_units_tail(coord_t
* coord
, pos_in_node_t from
, pos_in_node_t to
,
276 struct carry_cut_data
*cdata UNUSED_ARG
,
277 reiser4_key
* smallest_removed
, reiser4_key
* new_first
)
279 return do_cut_or_kill(coord
, from
, to
, smallest_removed
, new_first
);
282 /* plugin->u.item.b.kill_units */
284 kill_units_tail(coord_t
* coord
, pos_in_node_t from
, pos_in_node_t to
,
285 struct carry_kill_data
*kdata
, reiser4_key
* smallest_removed
,
286 reiser4_key
* new_first
)
288 kill_hook_tail(coord
, from
, to
- from
+ 1, kdata
);
289 return do_cut_or_kill(coord
, from
, to
, smallest_removed
, new_first
);
292 /* plugin->u.item.b.unit_key */
293 reiser4_key
*unit_key_tail(const coord_t
* coord
, reiser4_key
* key
)
295 assert("vs-375", coord_is_existing_unit(coord
));
297 item_key_by_coord(coord
, key
);
298 set_key_offset(key
, (get_key_offset(key
) + coord
->unit_pos
));
303 /* plugin->u.item.b.estimate
304 plugin->u.item.b.item_data_by_flow */
306 /* tail redpage function. It is called from readpage_tail(). */
307 static int do_readpage_tail(uf_coord_t
*uf_coord
, struct page
*page
)
317 /* saving passed coord in order to do not move it by tap. */
319 copy_lh(&lh
, uf_coord
->lh
);
320 inode
= page
->mapping
->host
;
321 coord_dup(&coord
, &uf_coord
->coord
);
323 reiser4_tap_init(&tap
, &coord
, &lh
, ZNODE_READ_LOCK
);
325 if ((result
= reiser4_tap_load(&tap
)))
328 /* lookup until page is filled up. */
329 for (mapped
= 0; mapped
< PAGE_CACHE_SIZE
; ) {
330 /* number of bytes to be copied to page */
331 count
= item_length_by_coord(&coord
) - coord
.unit_pos
;
332 if (count
> PAGE_CACHE_SIZE
- mapped
)
333 count
= PAGE_CACHE_SIZE
- mapped
;
335 /* attach @page to address space and get data address */
336 pagedata
= kmap_atomic(page
, KM_USER0
);
338 /* copy tail item to page */
339 memcpy(pagedata
+ mapped
,
340 ((char *)item_body_by_coord(&coord
) + coord
.unit_pos
),
344 flush_dcache_page(page
);
346 /* dettach page from address space */
347 kunmap_atomic(pagedata
, KM_USER0
);
349 /* Getting next tail item. */
350 if (mapped
< PAGE_CACHE_SIZE
) {
352 * unlock page in order to avoid keep it locked
353 * during tree lookup, which takes long term locks
357 /* getting right neighbour. */
358 result
= go_dir_el(&tap
, RIGHT_SIDE
, 0);
362 if (PageUptodate(page
)) {
364 * another thread read the page, we have
368 goto out_unlock_page
;
372 if (result
== -E_NO_NEIGHBOR
) {
374 * rigth neighbor is not a formatted
383 if (!inode_file_plugin(inode
)->
384 owns_item(inode
, &coord
)) {
385 /* item of another file is found */
394 if (mapped
!= PAGE_CACHE_SIZE
)
395 zero_user_segment(page
, mapped
, PAGE_CACHE_SIZE
);
396 SetPageUptodate(page
);
400 reiser4_tap_relse(&tap
);
402 reiser4_tap_done(&tap
);
407 plugin->s.file.readpage
408 reiser4_read->unix_file_read->page_cache_readahead->reiser4_readpage->unix_file_readpage->readpage_tail
410 filemap_fault->reiser4_readpage->readpage_unix_file->->readpage_tail
412 At the beginning: coord->node is read locked, zloaded, page is locked, coord is set to existing unit inside of tail
414 int readpage_tail(void *vp
, struct page
*page
)
416 uf_coord_t
*uf_coord
= vp
;
417 ON_DEBUG(coord_t
* coord
= &uf_coord
->coord
);
418 ON_DEBUG(reiser4_key key
);
420 assert("umka-2515", PageLocked(page
));
421 assert("umka-2516", !PageUptodate(page
));
422 assert("umka-2517", !jprivate(page
) && !PagePrivate(page
));
423 assert("umka-2518", page
->mapping
&& page
->mapping
->host
);
425 assert("umka-2519", znode_is_loaded(coord
->node
));
426 assert("umka-2520", item_is_tail(coord
));
427 assert("umka-2521", coord_is_existing_unit(coord
));
428 assert("umka-2522", znode_is_rlocked(coord
->node
));
430 page
->mapping
->host
->i_ino
==
431 get_key_objectid(item_key_by_coord(coord
, &key
)));
433 return do_readpage_tail(uf_coord
, page
);
441 * Overwrites tail item or its part by user data. Returns number of bytes
442 * written or error code.
444 static int overwrite_tail(flow_t
*flow
, coord_t
*coord
)
448 assert("vs-570", flow
->user
== 1);
449 assert("vs-946", flow
->data
);
450 assert("vs-947", coord_is_existing_unit(coord
));
451 assert("vs-948", znode_is_write_locked(coord
->node
));
452 assert("nikita-3036", reiser4_schedulable());
454 count
= item_length_by_coord(coord
) - coord
->unit_pos
;
455 if (count
> flow
->length
)
456 count
= flow
->length
;
458 if (__copy_from_user((char *)item_body_by_coord(coord
) + coord
->unit_pos
,
459 (const char __user
*)flow
->data
, count
))
460 return RETERR(-EFAULT
);
462 znode_make_dirty(coord
->node
);
473 * Returns number of bytes written or error code.
475 static ssize_t
insert_first_tail(struct inode
*inode
, flow_t
*flow
,
476 coord_t
*coord
, lock_handle
*lh
)
480 struct unix_file_info
*uf_info
;
482 if (get_key_offset(&flow
->key
) != 0) {
484 * file is empty and we have to write not to the beginning of
485 * file. Create a hole at the beginning of file. On success
486 * insert_flow returns 0 as number of written bytes which is
487 * what we have to return on padding a file with holes
490 flow
->length
= get_key_offset(&flow
->key
);
491 set_key_offset(&flow
->key
, 0);
493 * holes in files built of tails are stored just like if there
494 * were real data which are all zeros. Therefore we have to
495 * allocate quota here as well
497 if (vfs_dq_alloc_space_nodirty(inode
, flow
->length
))
498 return RETERR(-EDQUOT
);
499 result
= reiser4_insert_flow(coord
, lh
, flow
);
501 vfs_dq_free_space_nodirty(inode
, flow
->length
);
503 uf_info
= unix_file_inode_data(inode
);
506 * first item insertion is only possible when writing to empty
507 * file or performing tail conversion
509 assert("", (uf_info
->container
== UF_CONTAINER_EMPTY
||
510 (reiser4_inode_get_flag(inode
,
511 REISER4_PART_MIXED
) &&
512 reiser4_inode_get_flag(inode
,
513 REISER4_PART_IN_CONV
))));
514 /* if file was empty - update its state */
515 if (result
== 0 && uf_info
->container
== UF_CONTAINER_EMPTY
)
516 uf_info
->container
= UF_CONTAINER_TAILS
;
520 /* check quota before appending data */
521 if (vfs_dq_alloc_space_nodirty(inode
, flow
->length
))
522 return RETERR(-EDQUOT
);
524 to_write
= flow
->length
;
525 result
= reiser4_insert_flow(coord
, lh
, flow
);
527 vfs_dq_free_space_nodirty(inode
, flow
->length
);
528 return (to_write
- flow
->length
) ? (to_write
- flow
->length
) : result
;
538 * Returns number of bytes written or error code.
540 static ssize_t
append_tail(struct inode
*inode
,
541 flow_t
*flow
, coord_t
*coord
, lock_handle
*lh
)
544 reiser4_key append_key
;
547 if (!keyeq(&flow
->key
, append_key_tail(coord
, &append_key
))) {
549 flow
->length
= get_key_offset(&flow
->key
) - get_key_offset(&append_key
);
550 set_key_offset(&flow
->key
, get_key_offset(&append_key
));
552 * holes in files built of tails are stored just like if there
553 * were real data which are all zeros. Therefore we have to
554 * allocate quota here as well
556 if (vfs_dq_alloc_space_nodirty(inode
, flow
->length
))
557 return RETERR(-EDQUOT
);
558 result
= reiser4_insert_flow(coord
, lh
, flow
);
560 vfs_dq_free_space_nodirty(inode
, flow
->length
);
564 /* check quota before appending data */
565 if (vfs_dq_alloc_space_nodirty(inode
, flow
->length
))
566 return RETERR(-EDQUOT
);
568 to_write
= flow
->length
;
569 result
= reiser4_insert_flow(coord
, lh
, flow
);
571 vfs_dq_free_space_nodirty(inode
, flow
->length
);
572 return (to_write
- flow
->length
) ? (to_write
- flow
->length
) : result
;
576 * write_tail_reserve_space - reserve space for tail write operation
579 * Estimates and reserves space which may be required for writing one flow to a
582 static int write_extent_reserve_space(struct inode
*inode
)
588 * to write one flow to a file by tails we have to reserve disk space for:
590 * 1. find_file_item may have to insert empty node to the tree (empty
591 * leaf node between two extent items). This requires 1 block and
592 * number of blocks which are necessary to perform insertion of an
593 * internal item into twig level.
597 * 3. stat data update
599 tree
= reiser4_tree_by_inode(inode
);
600 count
= estimate_one_insert_item(tree
) +
601 estimate_insert_flow(tree
->height
) +
602 estimate_one_insert_item(tree
);
604 return reiser4_grab_space(count
, 0 /* flags */);
607 #define PAGE_PER_FLOW 4
609 static loff_t
faultin_user_pages(const char __user
*buf
, size_t count
)
614 if (count
> PAGE_PER_FLOW
* PAGE_CACHE_SIZE
)
615 count
= PAGE_PER_FLOW
* PAGE_CACHE_SIZE
;
618 to_fault
= PAGE_CACHE_SIZE
;
619 if (count
< to_fault
)
621 fault_in_pages_readable(buf
+ faulted
, to_fault
);
629 * reiser4_write_tail - write method of tail item plugin
630 * @file: file to write to
631 * @buf: address of user-space buffer
632 * @count: number of bytes to write
633 * @pos: position in file to write to
635 * Returns number of written bytes or error code.
637 ssize_t
reiser4_write_tail(struct file
*file
, struct inode
* inode
,
638 const char __user
*buf
, size_t count
, loff_t
*pos
)
647 assert("edward-1548", inode
!= NULL
);
649 if (write_extent_reserve_space(inode
))
650 return RETERR(-ENOSPC
);
652 result
= load_file_hint(file
, &hint
);
655 flow
.length
= faultin_user_pages(buf
, count
);
657 memcpy(&flow
.data
, &buf
, sizeof(buf
));
659 key_by_inode_and_offset_common(inode
, *pos
, &flow
.key
);
661 result
= find_file_item(&hint
, &flow
.key
, ZNODE_WRITE_LOCK
, inode
);
662 if (IS_CBKERR(result
))
665 coord
= &hint
.ext_coord
.coord
;
666 lh
= hint
.ext_coord
.lh
;
668 result
= zload(coord
->node
);
670 loaded
= coord
->node
;
672 if (coord
->between
== AFTER_UNIT
) {
673 /* append with data or hole */
674 result
= append_tail(inode
, &flow
, coord
, lh
);
675 } else if (coord
->between
== AT_UNIT
) {
677 result
= overwrite_tail(&flow
, coord
);
679 /* no items of this file yet. insert data or hole */
680 result
= insert_first_tail(inode
, &flow
, coord
, lh
);
688 /* seal and unlock znode */
689 hint
.ext_coord
.valid
= 0;
690 if (hint
.ext_coord
.valid
)
691 reiser4_set_hint(&hint
, &flow
.key
, ZNODE_WRITE_LOCK
);
693 reiser4_unset_hint(&hint
);
695 save_file_hint(file
, &hint
);
702 coord_matches_key_tail(const coord_t
* coord
, const reiser4_key
* key
)
704 reiser4_key item_key
;
706 assert("vs-1356", coord_is_existing_unit(coord
));
707 assert("vs-1354", keylt(key
, append_key_tail(coord
, &item_key
)));
708 assert("vs-1355", keyge(key
, item_key_by_coord(coord
, &item_key
)));
709 return get_key_offset(key
) ==
710 get_key_offset(&item_key
) + coord
->unit_pos
;
716 /* plugin->u.item.s.file.read */
717 int reiser4_read_tail(struct file
*file UNUSED_ARG
, flow_t
*f
, hint_t
*hint
)
722 uf_coord_t
*uf_coord
;
724 uf_coord
= &hint
->ext_coord
;
725 coord
= &uf_coord
->coord
;
727 assert("vs-571", f
->user
== 1);
728 assert("vs-571", f
->data
);
729 assert("vs-967", coord
&& coord
->node
);
730 assert("vs-1117", znode_is_rlocked(coord
->node
));
731 assert("vs-1118", znode_is_loaded(coord
->node
));
733 assert("nikita-3037", reiser4_schedulable());
734 assert("vs-1357", coord_matches_key_tail(coord
, &f
->key
));
736 /* calculate number of bytes to read off the item */
737 item_length
= item_length_by_coord(coord
);
738 count
= item_length_by_coord(coord
) - coord
->unit_pos
;
739 if (count
> f
->length
)
742 /* user page has to be brought in so that major page fault does not
743 * occur here when longtem lock is held */
744 if (__copy_to_user((char __user
*)f
->data
,
745 ((char *)item_body_by_coord(coord
) + coord
->unit_pos
),
747 return RETERR(-EFAULT
);
749 /* probably mark_page_accessed() should only be called if
750 * coord->unit_pos is zero. */
751 mark_page_accessed(znode_page(coord
->node
));
752 move_flow_forward(f
, count
);
754 coord
->unit_pos
+= count
;
755 if (item_length
== coord
->unit_pos
) {
757 coord
->between
= AFTER_UNIT
;
759 reiser4_set_hint(hint
, &f
->key
, ZNODE_READ_LOCK
);
764 plugin->u.item.s.file.append_key
765 key of first byte which is the next to last byte by addressed by this item
767 reiser4_key
*append_key_tail(const coord_t
* coord
, reiser4_key
* key
)
769 item_key_by_coord(coord
, key
);
770 set_key_offset(key
, get_key_offset(key
) + item_length_by_coord(coord
));
774 /* plugin->u.item.s.file.init_coord_extension */
775 void init_coord_extension_tail(uf_coord_t
* uf_coord
, loff_t lookuped
)
781 plugin->u.item.s.file.get_block
784 get_block_address_tail(const coord_t
* coord
, sector_t lblock
, sector_t
* block
)
786 assert("nikita-3252", znode_get_level(coord
->node
) == LEAF_LEVEL
);
788 if (reiser4_blocknr_is_fake(znode_get_block(coord
->node
)))
789 /* if node has'nt obtainet its block number yet, return 0.
790 * Lets avoid upsetting users with some cosmic numbers beyond
791 * the device capacity.*/
794 *block
= *znode_get_block(coord
->node
);
800 * c-indentation-style: "K&R"