2 * Copyright (C) 2009 Oracle. All rights reserved.
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public
6 * License v2 as published by the Free Software Foundation.
8 * This program is distributed in the hope that it will be useful,
9 * but WITHOUT ANY WARRANTY; without even the implied warranty of
10 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
11 * General Public License for more details.
13 * You should have received a copy of the GNU General Public
14 * License along with this program; if not, write to the
15 * Free Software Foundation, Inc., 59 Temple Place - Suite 330,
16 * Boston, MA 021110-1307, USA.
19 #include <linux/sched.h>
20 #include <linux/slab.h>
21 #include <linux/sort.h>
23 #include "delayed-ref.h"
24 #include "transaction.h"
27 struct kmem_cache
*btrfs_delayed_ref_head_cachep
;
28 struct kmem_cache
*btrfs_delayed_tree_ref_cachep
;
29 struct kmem_cache
*btrfs_delayed_data_ref_cachep
;
30 struct kmem_cache
*btrfs_delayed_extent_op_cachep
;
32 * delayed back reference update tracking. For subvolume trees
33 * we queue up extent allocations and backref maintenance for
34 * delayed processing. This avoids deep call chains where we
35 * add extents in the middle of btrfs_search_slot, and it allows
36 * us to buffer up frequently modified backrefs in an rb tree instead
37 * of hammering updates on the extent allocation tree.
41 * compare two delayed tree backrefs with same bytenr and type
43 static int comp_tree_refs(struct btrfs_delayed_tree_ref
*ref1
,
44 struct btrfs_delayed_tree_ref
*ref2
)
46 if (ref1
->node
.type
== BTRFS_TREE_BLOCK_REF_KEY
) {
47 if (ref1
->root
< ref2
->root
)
49 if (ref1
->root
> ref2
->root
)
52 if (ref1
->parent
< ref2
->parent
)
54 if (ref1
->parent
> ref2
->parent
)
61 * compare two delayed data backrefs with same bytenr and type
63 static int comp_data_refs(struct btrfs_delayed_data_ref
*ref1
,
64 struct btrfs_delayed_data_ref
*ref2
)
66 if (ref1
->node
.type
== BTRFS_EXTENT_DATA_REF_KEY
) {
67 if (ref1
->root
< ref2
->root
)
69 if (ref1
->root
> ref2
->root
)
71 if (ref1
->objectid
< ref2
->objectid
)
73 if (ref1
->objectid
> ref2
->objectid
)
75 if (ref1
->offset
< ref2
->offset
)
77 if (ref1
->offset
> ref2
->offset
)
80 if (ref1
->parent
< ref2
->parent
)
82 if (ref1
->parent
> ref2
->parent
)
88 static int comp_refs(struct btrfs_delayed_ref_node
*ref1
,
89 struct btrfs_delayed_ref_node
*ref2
,
94 if (ref1
->type
< ref2
->type
)
96 if (ref1
->type
> ref2
->type
)
98 if (ref1
->type
== BTRFS_TREE_BLOCK_REF_KEY
||
99 ref1
->type
== BTRFS_SHARED_BLOCK_REF_KEY
)
100 ret
= comp_tree_refs(btrfs_delayed_node_to_tree_ref(ref1
),
101 btrfs_delayed_node_to_tree_ref(ref2
));
103 ret
= comp_data_refs(btrfs_delayed_node_to_data_ref(ref1
),
104 btrfs_delayed_node_to_data_ref(ref2
));
108 if (ref1
->seq
< ref2
->seq
)
110 if (ref1
->seq
> ref2
->seq
)
116 /* insert a new ref to head ref rbtree */
117 static struct btrfs_delayed_ref_head
*htree_insert(struct rb_root
*root
,
118 struct rb_node
*node
)
120 struct rb_node
**p
= &root
->rb_node
;
121 struct rb_node
*parent_node
= NULL
;
122 struct btrfs_delayed_ref_head
*entry
;
123 struct btrfs_delayed_ref_head
*ins
;
126 ins
= rb_entry(node
, struct btrfs_delayed_ref_head
, href_node
);
127 bytenr
= ins
->bytenr
;
130 entry
= rb_entry(parent_node
, struct btrfs_delayed_ref_head
,
133 if (bytenr
< entry
->bytenr
)
135 else if (bytenr
> entry
->bytenr
)
141 rb_link_node(node
, parent_node
, p
);
142 rb_insert_color(node
, root
);
146 static struct btrfs_delayed_ref_node
* tree_insert(struct rb_root
*root
,
147 struct btrfs_delayed_ref_node
*ins
)
149 struct rb_node
**p
= &root
->rb_node
;
150 struct rb_node
*node
= &ins
->ref_node
;
151 struct rb_node
*parent_node
= NULL
;
152 struct btrfs_delayed_ref_node
*entry
;
158 entry
= rb_entry(parent_node
, struct btrfs_delayed_ref_node
,
160 comp
= comp_refs(ins
, entry
, true);
169 rb_link_node(node
, parent_node
, p
);
170 rb_insert_color(node
, root
);
175 * find an head entry based on bytenr. This returns the delayed ref
176 * head if it was able to find one, or NULL if nothing was in that spot.
177 * If return_bigger is given, the next bigger entry is returned if no exact
180 static struct btrfs_delayed_ref_head
*
181 find_ref_head(struct rb_root
*root
, u64 bytenr
,
185 struct btrfs_delayed_ref_head
*entry
;
190 entry
= rb_entry(n
, struct btrfs_delayed_ref_head
, href_node
);
192 if (bytenr
< entry
->bytenr
)
194 else if (bytenr
> entry
->bytenr
)
199 if (entry
&& return_bigger
) {
200 if (bytenr
> entry
->bytenr
) {
201 n
= rb_next(&entry
->href_node
);
204 entry
= rb_entry(n
, struct btrfs_delayed_ref_head
,
213 int btrfs_delayed_ref_lock(struct btrfs_trans_handle
*trans
,
214 struct btrfs_delayed_ref_head
*head
)
216 struct btrfs_delayed_ref_root
*delayed_refs
;
218 delayed_refs
= &trans
->transaction
->delayed_refs
;
219 assert_spin_locked(&delayed_refs
->lock
);
220 if (mutex_trylock(&head
->mutex
))
223 refcount_inc(&head
->refs
);
224 spin_unlock(&delayed_refs
->lock
);
226 mutex_lock(&head
->mutex
);
227 spin_lock(&delayed_refs
->lock
);
228 if (RB_EMPTY_NODE(&head
->href_node
)) {
229 mutex_unlock(&head
->mutex
);
230 btrfs_put_delayed_ref_head(head
);
233 btrfs_put_delayed_ref_head(head
);
237 static inline void drop_delayed_ref(struct btrfs_trans_handle
*trans
,
238 struct btrfs_delayed_ref_root
*delayed_refs
,
239 struct btrfs_delayed_ref_head
*head
,
240 struct btrfs_delayed_ref_node
*ref
)
242 assert_spin_locked(&head
->lock
);
243 rb_erase(&ref
->ref_node
, &head
->ref_tree
);
244 RB_CLEAR_NODE(&ref
->ref_node
);
245 if (!list_empty(&ref
->add_list
))
246 list_del(&ref
->add_list
);
248 btrfs_put_delayed_ref(ref
);
249 atomic_dec(&delayed_refs
->num_entries
);
250 if (trans
->delayed_ref_updates
)
251 trans
->delayed_ref_updates
--;
254 static bool merge_ref(struct btrfs_trans_handle
*trans
,
255 struct btrfs_delayed_ref_root
*delayed_refs
,
256 struct btrfs_delayed_ref_head
*head
,
257 struct btrfs_delayed_ref_node
*ref
,
260 struct btrfs_delayed_ref_node
*next
;
261 struct rb_node
*node
= rb_next(&ref
->ref_node
);
264 while (!done
&& node
) {
267 next
= rb_entry(node
, struct btrfs_delayed_ref_node
, ref_node
);
268 node
= rb_next(node
);
269 if (seq
&& next
->seq
>= seq
)
271 if (comp_refs(ref
, next
, false))
274 if (ref
->action
== next
->action
) {
277 if (ref
->ref_mod
< next
->ref_mod
) {
281 mod
= -next
->ref_mod
;
284 drop_delayed_ref(trans
, delayed_refs
, head
, next
);
286 if (ref
->ref_mod
== 0) {
287 drop_delayed_ref(trans
, delayed_refs
, head
, ref
);
291 * Can't have multiples of the same ref on a tree block.
293 WARN_ON(ref
->type
== BTRFS_TREE_BLOCK_REF_KEY
||
294 ref
->type
== BTRFS_SHARED_BLOCK_REF_KEY
);
301 void btrfs_merge_delayed_refs(struct btrfs_trans_handle
*trans
,
302 struct btrfs_fs_info
*fs_info
,
303 struct btrfs_delayed_ref_root
*delayed_refs
,
304 struct btrfs_delayed_ref_head
*head
)
306 struct btrfs_delayed_ref_node
*ref
;
307 struct rb_node
*node
;
310 assert_spin_locked(&head
->lock
);
312 if (RB_EMPTY_ROOT(&head
->ref_tree
))
315 /* We don't have too many refs to merge for data. */
319 spin_lock(&fs_info
->tree_mod_seq_lock
);
320 if (!list_empty(&fs_info
->tree_mod_seq_list
)) {
321 struct seq_list
*elem
;
323 elem
= list_first_entry(&fs_info
->tree_mod_seq_list
,
324 struct seq_list
, list
);
327 spin_unlock(&fs_info
->tree_mod_seq_lock
);
330 for (node
= rb_first(&head
->ref_tree
); node
; node
= rb_next(node
)) {
331 ref
= rb_entry(node
, struct btrfs_delayed_ref_node
, ref_node
);
332 if (seq
&& ref
->seq
>= seq
)
334 if (merge_ref(trans
, delayed_refs
, head
, ref
, seq
))
339 int btrfs_check_delayed_seq(struct btrfs_fs_info
*fs_info
,
340 struct btrfs_delayed_ref_root
*delayed_refs
,
343 struct seq_list
*elem
;
346 spin_lock(&fs_info
->tree_mod_seq_lock
);
347 if (!list_empty(&fs_info
->tree_mod_seq_list
)) {
348 elem
= list_first_entry(&fs_info
->tree_mod_seq_list
,
349 struct seq_list
, list
);
350 if (seq
>= elem
->seq
) {
352 "holding back delayed_ref %#x.%x, lowest is %#x.%x (%p)",
353 (u32
)(seq
>> 32), (u32
)seq
,
354 (u32
)(elem
->seq
>> 32), (u32
)elem
->seq
,
360 spin_unlock(&fs_info
->tree_mod_seq_lock
);
364 struct btrfs_delayed_ref_head
*
365 btrfs_select_ref_head(struct btrfs_trans_handle
*trans
)
367 struct btrfs_delayed_ref_root
*delayed_refs
;
368 struct btrfs_delayed_ref_head
*head
;
372 delayed_refs
= &trans
->transaction
->delayed_refs
;
375 start
= delayed_refs
->run_delayed_start
;
376 head
= find_ref_head(&delayed_refs
->href_root
, start
, 1);
377 if (!head
&& !loop
) {
378 delayed_refs
->run_delayed_start
= 0;
381 head
= find_ref_head(&delayed_refs
->href_root
, start
, 1);
384 } else if (!head
&& loop
) {
388 while (head
->processing
) {
389 struct rb_node
*node
;
391 node
= rb_next(&head
->href_node
);
395 delayed_refs
->run_delayed_start
= 0;
400 head
= rb_entry(node
, struct btrfs_delayed_ref_head
,
404 head
->processing
= 1;
405 WARN_ON(delayed_refs
->num_heads_ready
== 0);
406 delayed_refs
->num_heads_ready
--;
407 delayed_refs
->run_delayed_start
= head
->bytenr
+
413 * Helper to insert the ref_node to the tail or merge with tail.
415 * Return 0 for insert.
416 * Return >0 for merge.
418 static int insert_delayed_ref(struct btrfs_trans_handle
*trans
,
419 struct btrfs_delayed_ref_root
*root
,
420 struct btrfs_delayed_ref_head
*href
,
421 struct btrfs_delayed_ref_node
*ref
)
423 struct btrfs_delayed_ref_node
*exist
;
427 spin_lock(&href
->lock
);
428 exist
= tree_insert(&href
->ref_tree
, ref
);
432 /* Now we are sure we can merge */
434 if (exist
->action
== ref
->action
) {
437 /* Need to change action */
438 if (exist
->ref_mod
< ref
->ref_mod
) {
439 exist
->action
= ref
->action
;
440 mod
= -exist
->ref_mod
;
441 exist
->ref_mod
= ref
->ref_mod
;
442 if (ref
->action
== BTRFS_ADD_DELAYED_REF
)
443 list_add_tail(&exist
->add_list
,
444 &href
->ref_add_list
);
445 else if (ref
->action
== BTRFS_DROP_DELAYED_REF
) {
446 ASSERT(!list_empty(&exist
->add_list
));
447 list_del(&exist
->add_list
);
454 exist
->ref_mod
+= mod
;
456 /* remove existing tail if its ref_mod is zero */
457 if (exist
->ref_mod
== 0)
458 drop_delayed_ref(trans
, root
, href
, exist
);
459 spin_unlock(&href
->lock
);
462 if (ref
->action
== BTRFS_ADD_DELAYED_REF
)
463 list_add_tail(&ref
->add_list
, &href
->ref_add_list
);
464 atomic_inc(&root
->num_entries
);
465 trans
->delayed_ref_updates
++;
466 spin_unlock(&href
->lock
);
471 * helper function to update the accounting in the head ref
472 * existing and update must have the same bytenr
475 update_existing_head_ref(struct btrfs_delayed_ref_root
*delayed_refs
,
476 struct btrfs_delayed_ref_head
*existing
,
477 struct btrfs_delayed_ref_head
*update
,
478 int *old_ref_mod_ret
)
482 BUG_ON(existing
->is_data
!= update
->is_data
);
484 spin_lock(&existing
->lock
);
485 if (update
->must_insert_reserved
) {
486 /* if the extent was freed and then
487 * reallocated before the delayed ref
488 * entries were processed, we can end up
489 * with an existing head ref without
490 * the must_insert_reserved flag set.
493 existing
->must_insert_reserved
= update
->must_insert_reserved
;
496 * update the num_bytes so we make sure the accounting
499 existing
->num_bytes
= update
->num_bytes
;
503 if (update
->extent_op
) {
504 if (!existing
->extent_op
) {
505 existing
->extent_op
= update
->extent_op
;
507 if (update
->extent_op
->update_key
) {
508 memcpy(&existing
->extent_op
->key
,
509 &update
->extent_op
->key
,
510 sizeof(update
->extent_op
->key
));
511 existing
->extent_op
->update_key
= true;
513 if (update
->extent_op
->update_flags
) {
514 existing
->extent_op
->flags_to_set
|=
515 update
->extent_op
->flags_to_set
;
516 existing
->extent_op
->update_flags
= true;
518 btrfs_free_delayed_extent_op(update
->extent_op
);
522 * update the reference mod on the head to reflect this new operation,
523 * only need the lock for this case cause we could be processing it
524 * currently, for refs we just added we know we're a-ok.
526 old_ref_mod
= existing
->total_ref_mod
;
528 *old_ref_mod_ret
= old_ref_mod
;
529 existing
->ref_mod
+= update
->ref_mod
;
530 existing
->total_ref_mod
+= update
->ref_mod
;
533 * If we are going to from a positive ref mod to a negative or vice
534 * versa we need to make sure to adjust pending_csums accordingly.
536 if (existing
->is_data
) {
537 if (existing
->total_ref_mod
>= 0 && old_ref_mod
< 0)
538 delayed_refs
->pending_csums
-= existing
->num_bytes
;
539 if (existing
->total_ref_mod
< 0 && old_ref_mod
>= 0)
540 delayed_refs
->pending_csums
+= existing
->num_bytes
;
542 spin_unlock(&existing
->lock
);
546 * helper function to actually insert a head node into the rbtree.
547 * this does all the dirty work in terms of maintaining the correct
548 * overall modification count.
550 static noinline
struct btrfs_delayed_ref_head
*
551 add_delayed_ref_head(struct btrfs_fs_info
*fs_info
,
552 struct btrfs_trans_handle
*trans
,
553 struct btrfs_delayed_ref_head
*head_ref
,
554 struct btrfs_qgroup_extent_record
*qrecord
,
555 u64 bytenr
, u64 num_bytes
, u64 ref_root
, u64 reserved
,
556 int action
, int is_data
, int is_system
,
557 int *qrecord_inserted_ret
,
558 int *old_ref_mod
, int *new_ref_mod
)
561 struct btrfs_delayed_ref_head
*existing
;
562 struct btrfs_delayed_ref_root
*delayed_refs
;
564 int must_insert_reserved
= 0;
565 int qrecord_inserted
= 0;
567 /* If reserved is provided, it must be a data extent. */
568 BUG_ON(!is_data
&& reserved
);
571 * the head node stores the sum of all the mods, so dropping a ref
572 * should drop the sum in the head node by one.
574 if (action
== BTRFS_UPDATE_DELAYED_HEAD
)
576 else if (action
== BTRFS_DROP_DELAYED_REF
)
580 * BTRFS_ADD_DELAYED_EXTENT means that we need to update
581 * the reserved accounting when the extent is finally added, or
582 * if a later modification deletes the delayed ref without ever
583 * inserting the extent into the extent allocation tree.
584 * ref->must_insert_reserved is the flag used to record
585 * that accounting mods are required.
587 * Once we record must_insert_reserved, switch the action to
588 * BTRFS_ADD_DELAYED_REF because other special casing is not required.
590 if (action
== BTRFS_ADD_DELAYED_EXTENT
)
591 must_insert_reserved
= 1;
593 must_insert_reserved
= 0;
595 delayed_refs
= &trans
->transaction
->delayed_refs
;
597 refcount_set(&head_ref
->refs
, 1);
598 head_ref
->bytenr
= bytenr
;
599 head_ref
->num_bytes
= num_bytes
;
600 head_ref
->ref_mod
= count_mod
;
601 head_ref
->must_insert_reserved
= must_insert_reserved
;
602 head_ref
->is_data
= is_data
;
603 head_ref
->is_system
= is_system
;
604 head_ref
->ref_tree
= RB_ROOT
;
605 INIT_LIST_HEAD(&head_ref
->ref_add_list
);
606 RB_CLEAR_NODE(&head_ref
->href_node
);
607 head_ref
->processing
= 0;
608 head_ref
->total_ref_mod
= count_mod
;
609 head_ref
->qgroup_reserved
= 0;
610 head_ref
->qgroup_ref_root
= 0;
611 spin_lock_init(&head_ref
->lock
);
612 mutex_init(&head_ref
->mutex
);
614 /* Record qgroup extent info if provided */
616 if (ref_root
&& reserved
) {
617 head_ref
->qgroup_ref_root
= ref_root
;
618 head_ref
->qgroup_reserved
= reserved
;
621 qrecord
->bytenr
= bytenr
;
622 qrecord
->num_bytes
= num_bytes
;
623 qrecord
->old_roots
= NULL
;
625 if(btrfs_qgroup_trace_extent_nolock(fs_info
,
626 delayed_refs
, qrecord
))
629 qrecord_inserted
= 1;
632 trace_add_delayed_ref_head(fs_info
, head_ref
, action
);
634 existing
= htree_insert(&delayed_refs
->href_root
,
635 &head_ref
->href_node
);
637 WARN_ON(ref_root
&& reserved
&& existing
->qgroup_ref_root
638 && existing
->qgroup_reserved
);
639 update_existing_head_ref(delayed_refs
, existing
, head_ref
,
642 * we've updated the existing ref, free the newly
645 kmem_cache_free(btrfs_delayed_ref_head_cachep
, head_ref
);
650 if (is_data
&& count_mod
< 0)
651 delayed_refs
->pending_csums
+= num_bytes
;
652 delayed_refs
->num_heads
++;
653 delayed_refs
->num_heads_ready
++;
654 atomic_inc(&delayed_refs
->num_entries
);
655 trans
->delayed_ref_updates
++;
657 if (qrecord_inserted_ret
)
658 *qrecord_inserted_ret
= qrecord_inserted
;
660 *new_ref_mod
= head_ref
->total_ref_mod
;
665 * helper to insert a delayed tree ref into the rbtree.
668 add_delayed_tree_ref(struct btrfs_fs_info
*fs_info
,
669 struct btrfs_trans_handle
*trans
,
670 struct btrfs_delayed_ref_head
*head_ref
,
671 struct btrfs_delayed_ref_node
*ref
, u64 bytenr
,
672 u64 num_bytes
, u64 parent
, u64 ref_root
, int level
,
675 struct btrfs_delayed_tree_ref
*full_ref
;
676 struct btrfs_delayed_ref_root
*delayed_refs
;
680 if (action
== BTRFS_ADD_DELAYED_EXTENT
)
681 action
= BTRFS_ADD_DELAYED_REF
;
683 if (is_fstree(ref_root
))
684 seq
= atomic64_read(&fs_info
->tree_mod_seq
);
685 delayed_refs
= &trans
->transaction
->delayed_refs
;
687 /* first set the basic ref node struct up */
688 refcount_set(&ref
->refs
, 1);
689 ref
->bytenr
= bytenr
;
690 ref
->num_bytes
= num_bytes
;
692 ref
->action
= action
;
696 RB_CLEAR_NODE(&ref
->ref_node
);
697 INIT_LIST_HEAD(&ref
->add_list
);
699 full_ref
= btrfs_delayed_node_to_tree_ref(ref
);
700 full_ref
->parent
= parent
;
701 full_ref
->root
= ref_root
;
703 ref
->type
= BTRFS_SHARED_BLOCK_REF_KEY
;
705 ref
->type
= BTRFS_TREE_BLOCK_REF_KEY
;
706 full_ref
->level
= level
;
708 trace_add_delayed_tree_ref(fs_info
, ref
, full_ref
, action
);
710 ret
= insert_delayed_ref(trans
, delayed_refs
, head_ref
, ref
);
713 * XXX: memory should be freed at the same level allocated.
714 * But bad practice is anywhere... Follow it now. Need cleanup.
717 kmem_cache_free(btrfs_delayed_tree_ref_cachep
, full_ref
);
721 * helper to insert a delayed data ref into the rbtree.
724 add_delayed_data_ref(struct btrfs_fs_info
*fs_info
,
725 struct btrfs_trans_handle
*trans
,
726 struct btrfs_delayed_ref_head
*head_ref
,
727 struct btrfs_delayed_ref_node
*ref
, u64 bytenr
,
728 u64 num_bytes
, u64 parent
, u64 ref_root
, u64 owner
,
729 u64 offset
, int action
)
731 struct btrfs_delayed_data_ref
*full_ref
;
732 struct btrfs_delayed_ref_root
*delayed_refs
;
736 if (action
== BTRFS_ADD_DELAYED_EXTENT
)
737 action
= BTRFS_ADD_DELAYED_REF
;
739 delayed_refs
= &trans
->transaction
->delayed_refs
;
741 if (is_fstree(ref_root
))
742 seq
= atomic64_read(&fs_info
->tree_mod_seq
);
744 /* first set the basic ref node struct up */
745 refcount_set(&ref
->refs
, 1);
746 ref
->bytenr
= bytenr
;
747 ref
->num_bytes
= num_bytes
;
749 ref
->action
= action
;
753 RB_CLEAR_NODE(&ref
->ref_node
);
754 INIT_LIST_HEAD(&ref
->add_list
);
756 full_ref
= btrfs_delayed_node_to_data_ref(ref
);
757 full_ref
->parent
= parent
;
758 full_ref
->root
= ref_root
;
760 ref
->type
= BTRFS_SHARED_DATA_REF_KEY
;
762 ref
->type
= BTRFS_EXTENT_DATA_REF_KEY
;
764 full_ref
->objectid
= owner
;
765 full_ref
->offset
= offset
;
767 trace_add_delayed_data_ref(fs_info
, ref
, full_ref
, action
);
769 ret
= insert_delayed_ref(trans
, delayed_refs
, head_ref
, ref
);
771 kmem_cache_free(btrfs_delayed_data_ref_cachep
, full_ref
);
775 * add a delayed tree ref. This does all of the accounting required
776 * to make sure the delayed ref is eventually processed before this
777 * transaction commits.
779 int btrfs_add_delayed_tree_ref(struct btrfs_fs_info
*fs_info
,
780 struct btrfs_trans_handle
*trans
,
781 u64 bytenr
, u64 num_bytes
, u64 parent
,
782 u64 ref_root
, int level
, int action
,
783 struct btrfs_delayed_extent_op
*extent_op
,
784 int *old_ref_mod
, int *new_ref_mod
)
786 struct btrfs_delayed_tree_ref
*ref
;
787 struct btrfs_delayed_ref_head
*head_ref
;
788 struct btrfs_delayed_ref_root
*delayed_refs
;
789 struct btrfs_qgroup_extent_record
*record
= NULL
;
790 int qrecord_inserted
;
791 int is_system
= (ref_root
== BTRFS_CHUNK_TREE_OBJECTID
);
793 BUG_ON(extent_op
&& extent_op
->is_data
);
794 ref
= kmem_cache_alloc(btrfs_delayed_tree_ref_cachep
, GFP_NOFS
);
798 head_ref
= kmem_cache_alloc(btrfs_delayed_ref_head_cachep
, GFP_NOFS
);
802 if (test_bit(BTRFS_FS_QUOTA_ENABLED
, &fs_info
->flags
) &&
803 is_fstree(ref_root
)) {
804 record
= kmalloc(sizeof(*record
), GFP_NOFS
);
809 head_ref
->extent_op
= extent_op
;
811 delayed_refs
= &trans
->transaction
->delayed_refs
;
812 spin_lock(&delayed_refs
->lock
);
815 * insert both the head node and the new ref without dropping
818 head_ref
= add_delayed_ref_head(fs_info
, trans
, head_ref
, record
,
819 bytenr
, num_bytes
, 0, 0, action
, 0,
820 is_system
, &qrecord_inserted
,
821 old_ref_mod
, new_ref_mod
);
823 add_delayed_tree_ref(fs_info
, trans
, head_ref
, &ref
->node
, bytenr
,
824 num_bytes
, parent
, ref_root
, level
, action
);
825 spin_unlock(&delayed_refs
->lock
);
827 if (qrecord_inserted
)
828 btrfs_qgroup_trace_extent_post(fs_info
, record
);
833 kmem_cache_free(btrfs_delayed_ref_head_cachep
, head_ref
);
835 kmem_cache_free(btrfs_delayed_tree_ref_cachep
, ref
);
841 * add a delayed data ref. it's similar to btrfs_add_delayed_tree_ref.
843 int btrfs_add_delayed_data_ref(struct btrfs_fs_info
*fs_info
,
844 struct btrfs_trans_handle
*trans
,
845 u64 bytenr
, u64 num_bytes
,
846 u64 parent
, u64 ref_root
,
847 u64 owner
, u64 offset
, u64 reserved
, int action
,
848 int *old_ref_mod
, int *new_ref_mod
)
850 struct btrfs_delayed_data_ref
*ref
;
851 struct btrfs_delayed_ref_head
*head_ref
;
852 struct btrfs_delayed_ref_root
*delayed_refs
;
853 struct btrfs_qgroup_extent_record
*record
= NULL
;
854 int qrecord_inserted
;
856 ref
= kmem_cache_alloc(btrfs_delayed_data_ref_cachep
, GFP_NOFS
);
860 head_ref
= kmem_cache_alloc(btrfs_delayed_ref_head_cachep
, GFP_NOFS
);
862 kmem_cache_free(btrfs_delayed_data_ref_cachep
, ref
);
866 if (test_bit(BTRFS_FS_QUOTA_ENABLED
, &fs_info
->flags
) &&
867 is_fstree(ref_root
)) {
868 record
= kmalloc(sizeof(*record
), GFP_NOFS
);
870 kmem_cache_free(btrfs_delayed_data_ref_cachep
, ref
);
871 kmem_cache_free(btrfs_delayed_ref_head_cachep
,
877 head_ref
->extent_op
= NULL
;
879 delayed_refs
= &trans
->transaction
->delayed_refs
;
880 spin_lock(&delayed_refs
->lock
);
883 * insert both the head node and the new ref without dropping
886 head_ref
= add_delayed_ref_head(fs_info
, trans
, head_ref
, record
,
887 bytenr
, num_bytes
, ref_root
, reserved
,
888 action
, 1, 0, &qrecord_inserted
,
889 old_ref_mod
, new_ref_mod
);
891 add_delayed_data_ref(fs_info
, trans
, head_ref
, &ref
->node
, bytenr
,
892 num_bytes
, parent
, ref_root
, owner
, offset
,
894 spin_unlock(&delayed_refs
->lock
);
896 if (qrecord_inserted
)
897 return btrfs_qgroup_trace_extent_post(fs_info
, record
);
901 int btrfs_add_delayed_extent_op(struct btrfs_fs_info
*fs_info
,
902 struct btrfs_trans_handle
*trans
,
903 u64 bytenr
, u64 num_bytes
,
904 struct btrfs_delayed_extent_op
*extent_op
)
906 struct btrfs_delayed_ref_head
*head_ref
;
907 struct btrfs_delayed_ref_root
*delayed_refs
;
909 head_ref
= kmem_cache_alloc(btrfs_delayed_ref_head_cachep
, GFP_NOFS
);
913 head_ref
->extent_op
= extent_op
;
915 delayed_refs
= &trans
->transaction
->delayed_refs
;
916 spin_lock(&delayed_refs
->lock
);
919 * extent_ops just modify the flags of an extent and they don't result
920 * in ref count changes, hence it's safe to pass false/0 for is_system
923 add_delayed_ref_head(fs_info
, trans
, head_ref
, NULL
, bytenr
,
924 num_bytes
, 0, 0, BTRFS_UPDATE_DELAYED_HEAD
,
925 extent_op
->is_data
, 0, NULL
, NULL
, NULL
);
927 spin_unlock(&delayed_refs
->lock
);
932 * this does a simple search for the head node for a given extent.
933 * It must be called with the delayed ref spinlock held, and it returns
934 * the head node if any where found, or NULL if not.
936 struct btrfs_delayed_ref_head
*
937 btrfs_find_delayed_ref_head(struct btrfs_delayed_ref_root
*delayed_refs
, u64 bytenr
)
939 return find_ref_head(&delayed_refs
->href_root
, bytenr
, 0);
942 void btrfs_delayed_ref_exit(void)
944 kmem_cache_destroy(btrfs_delayed_ref_head_cachep
);
945 kmem_cache_destroy(btrfs_delayed_tree_ref_cachep
);
946 kmem_cache_destroy(btrfs_delayed_data_ref_cachep
);
947 kmem_cache_destroy(btrfs_delayed_extent_op_cachep
);
950 int __init
btrfs_delayed_ref_init(void)
952 btrfs_delayed_ref_head_cachep
= kmem_cache_create(
953 "btrfs_delayed_ref_head",
954 sizeof(struct btrfs_delayed_ref_head
), 0,
955 SLAB_MEM_SPREAD
, NULL
);
956 if (!btrfs_delayed_ref_head_cachep
)
959 btrfs_delayed_tree_ref_cachep
= kmem_cache_create(
960 "btrfs_delayed_tree_ref",
961 sizeof(struct btrfs_delayed_tree_ref
), 0,
962 SLAB_MEM_SPREAD
, NULL
);
963 if (!btrfs_delayed_tree_ref_cachep
)
966 btrfs_delayed_data_ref_cachep
= kmem_cache_create(
967 "btrfs_delayed_data_ref",
968 sizeof(struct btrfs_delayed_data_ref
), 0,
969 SLAB_MEM_SPREAD
, NULL
);
970 if (!btrfs_delayed_data_ref_cachep
)
973 btrfs_delayed_extent_op_cachep
= kmem_cache_create(
974 "btrfs_delayed_extent_op",
975 sizeof(struct btrfs_delayed_extent_op
), 0,
976 SLAB_MEM_SPREAD
, NULL
);
977 if (!btrfs_delayed_extent_op_cachep
)
982 btrfs_delayed_ref_exit();