2 * Copyright (C) 2009 Oracle. All rights reserved.
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public
6 * License v2 as published by the Free Software Foundation.
8 * This program is distributed in the hope that it will be useful,
9 * but WITHOUT ANY WARRANTY; without even the implied warranty of
10 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
11 * General Public License for more details.
13 * You should have received a copy of the GNU General Public
14 * License along with this program; if not, write to the
15 * Free Software Foundation, Inc., 59 Temple Place - Suite 330,
16 * Boston, MA 021110-1307, USA.
19 #include <linux/sched.h>
20 #include <linux/slab.h>
21 #include <linux/sort.h>
23 #include "delayed-ref.h"
24 #include "transaction.h"
27 struct kmem_cache
*btrfs_delayed_ref_head_cachep
;
28 struct kmem_cache
*btrfs_delayed_tree_ref_cachep
;
29 struct kmem_cache
*btrfs_delayed_data_ref_cachep
;
30 struct kmem_cache
*btrfs_delayed_extent_op_cachep
;
32 * delayed back reference update tracking. For subvolume trees
33 * we queue up extent allocations and backref maintenance for
34 * delayed processing. This avoids deep call chains where we
35 * add extents in the middle of btrfs_search_slot, and it allows
36 * us to buffer up frequently modified backrefs in an rb tree instead
37 * of hammering updates on the extent allocation tree.
41 * compare two delayed tree backrefs with same bytenr and type
43 static int comp_tree_refs(struct btrfs_delayed_tree_ref
*ref2
,
44 struct btrfs_delayed_tree_ref
*ref1
, int type
)
46 if (type
== BTRFS_TREE_BLOCK_REF_KEY
) {
47 if (ref1
->root
< ref2
->root
)
49 if (ref1
->root
> ref2
->root
)
52 if (ref1
->parent
< ref2
->parent
)
54 if (ref1
->parent
> ref2
->parent
)
61 * compare two delayed data backrefs with same bytenr and type
63 static int comp_data_refs(struct btrfs_delayed_data_ref
*ref2
,
64 struct btrfs_delayed_data_ref
*ref1
)
66 if (ref1
->node
.type
== BTRFS_EXTENT_DATA_REF_KEY
) {
67 if (ref1
->root
< ref2
->root
)
69 if (ref1
->root
> ref2
->root
)
71 if (ref1
->objectid
< ref2
->objectid
)
73 if (ref1
->objectid
> ref2
->objectid
)
75 if (ref1
->offset
< ref2
->offset
)
77 if (ref1
->offset
> ref2
->offset
)
80 if (ref1
->parent
< ref2
->parent
)
82 if (ref1
->parent
> ref2
->parent
)
88 /* insert a new ref to head ref rbtree */
89 static struct btrfs_delayed_ref_head
*htree_insert(struct rb_root
*root
,
92 struct rb_node
**p
= &root
->rb_node
;
93 struct rb_node
*parent_node
= NULL
;
94 struct btrfs_delayed_ref_head
*entry
;
95 struct btrfs_delayed_ref_head
*ins
;
98 ins
= rb_entry(node
, struct btrfs_delayed_ref_head
, href_node
);
99 bytenr
= ins
->node
.bytenr
;
102 entry
= rb_entry(parent_node
, struct btrfs_delayed_ref_head
,
105 if (bytenr
< entry
->node
.bytenr
)
107 else if (bytenr
> entry
->node
.bytenr
)
113 rb_link_node(node
, parent_node
, p
);
114 rb_insert_color(node
, root
);
119 * find an head entry based on bytenr. This returns the delayed ref
120 * head if it was able to find one, or NULL if nothing was in that spot.
121 * If return_bigger is given, the next bigger entry is returned if no exact
124 static struct btrfs_delayed_ref_head
*
125 find_ref_head(struct rb_root
*root
, u64 bytenr
,
129 struct btrfs_delayed_ref_head
*entry
;
134 entry
= rb_entry(n
, struct btrfs_delayed_ref_head
, href_node
);
136 if (bytenr
< entry
->node
.bytenr
)
138 else if (bytenr
> entry
->node
.bytenr
)
143 if (entry
&& return_bigger
) {
144 if (bytenr
> entry
->node
.bytenr
) {
145 n
= rb_next(&entry
->href_node
);
148 entry
= rb_entry(n
, struct btrfs_delayed_ref_head
,
157 int btrfs_delayed_ref_lock(struct btrfs_trans_handle
*trans
,
158 struct btrfs_delayed_ref_head
*head
)
160 struct btrfs_delayed_ref_root
*delayed_refs
;
162 delayed_refs
= &trans
->transaction
->delayed_refs
;
163 assert_spin_locked(&delayed_refs
->lock
);
164 if (mutex_trylock(&head
->mutex
))
167 refcount_inc(&head
->node
.refs
);
168 spin_unlock(&delayed_refs
->lock
);
170 mutex_lock(&head
->mutex
);
171 spin_lock(&delayed_refs
->lock
);
172 if (!head
->node
.in_tree
) {
173 mutex_unlock(&head
->mutex
);
174 btrfs_put_delayed_ref(&head
->node
);
177 btrfs_put_delayed_ref(&head
->node
);
181 static inline void drop_delayed_ref(struct btrfs_trans_handle
*trans
,
182 struct btrfs_delayed_ref_root
*delayed_refs
,
183 struct btrfs_delayed_ref_head
*head
,
184 struct btrfs_delayed_ref_node
*ref
)
186 if (btrfs_delayed_ref_is_head(ref
)) {
187 head
= btrfs_delayed_node_to_head(ref
);
188 rb_erase(&head
->href_node
, &delayed_refs
->href_root
);
190 assert_spin_locked(&head
->lock
);
191 list_del(&ref
->list
);
192 if (!list_empty(&ref
->add_list
))
193 list_del(&ref
->add_list
);
196 btrfs_put_delayed_ref(ref
);
197 atomic_dec(&delayed_refs
->num_entries
);
198 if (trans
->delayed_ref_updates
)
199 trans
->delayed_ref_updates
--;
202 static bool merge_ref(struct btrfs_trans_handle
*trans
,
203 struct btrfs_delayed_ref_root
*delayed_refs
,
204 struct btrfs_delayed_ref_head
*head
,
205 struct btrfs_delayed_ref_node
*ref
,
208 struct btrfs_delayed_ref_node
*next
;
211 next
= list_first_entry(&head
->ref_list
, struct btrfs_delayed_ref_node
,
213 while (!done
&& &next
->list
!= &head
->ref_list
) {
215 struct btrfs_delayed_ref_node
*next2
;
217 next2
= list_next_entry(next
, list
);
222 if (seq
&& next
->seq
>= seq
)
225 if (next
->type
!= ref
->type
)
228 if ((ref
->type
== BTRFS_TREE_BLOCK_REF_KEY
||
229 ref
->type
== BTRFS_SHARED_BLOCK_REF_KEY
) &&
230 comp_tree_refs(btrfs_delayed_node_to_tree_ref(ref
),
231 btrfs_delayed_node_to_tree_ref(next
),
234 if ((ref
->type
== BTRFS_EXTENT_DATA_REF_KEY
||
235 ref
->type
== BTRFS_SHARED_DATA_REF_KEY
) &&
236 comp_data_refs(btrfs_delayed_node_to_data_ref(ref
),
237 btrfs_delayed_node_to_data_ref(next
)))
240 if (ref
->action
== next
->action
) {
243 if (ref
->ref_mod
< next
->ref_mod
) {
247 mod
= -next
->ref_mod
;
250 drop_delayed_ref(trans
, delayed_refs
, head
, next
);
252 if (ref
->ref_mod
== 0) {
253 drop_delayed_ref(trans
, delayed_refs
, head
, ref
);
257 * Can't have multiples of the same ref on a tree block.
259 WARN_ON(ref
->type
== BTRFS_TREE_BLOCK_REF_KEY
||
260 ref
->type
== BTRFS_SHARED_BLOCK_REF_KEY
);
269 void btrfs_merge_delayed_refs(struct btrfs_trans_handle
*trans
,
270 struct btrfs_fs_info
*fs_info
,
271 struct btrfs_delayed_ref_root
*delayed_refs
,
272 struct btrfs_delayed_ref_head
*head
)
274 struct btrfs_delayed_ref_node
*ref
;
277 assert_spin_locked(&head
->lock
);
279 if (list_empty(&head
->ref_list
))
282 /* We don't have too many refs to merge for data. */
286 spin_lock(&fs_info
->tree_mod_seq_lock
);
287 if (!list_empty(&fs_info
->tree_mod_seq_list
)) {
288 struct seq_list
*elem
;
290 elem
= list_first_entry(&fs_info
->tree_mod_seq_list
,
291 struct seq_list
, list
);
294 spin_unlock(&fs_info
->tree_mod_seq_lock
);
296 ref
= list_first_entry(&head
->ref_list
, struct btrfs_delayed_ref_node
,
298 while (&ref
->list
!= &head
->ref_list
) {
299 if (seq
&& ref
->seq
>= seq
)
302 if (merge_ref(trans
, delayed_refs
, head
, ref
, seq
)) {
303 if (list_empty(&head
->ref_list
))
305 ref
= list_first_entry(&head
->ref_list
,
306 struct btrfs_delayed_ref_node
,
311 ref
= list_next_entry(ref
, list
);
315 int btrfs_check_delayed_seq(struct btrfs_fs_info
*fs_info
,
316 struct btrfs_delayed_ref_root
*delayed_refs
,
319 struct seq_list
*elem
;
322 spin_lock(&fs_info
->tree_mod_seq_lock
);
323 if (!list_empty(&fs_info
->tree_mod_seq_list
)) {
324 elem
= list_first_entry(&fs_info
->tree_mod_seq_list
,
325 struct seq_list
, list
);
326 if (seq
>= elem
->seq
) {
328 "holding back delayed_ref %#x.%x, lowest is %#x.%x (%p)",
329 (u32
)(seq
>> 32), (u32
)seq
,
330 (u32
)(elem
->seq
>> 32), (u32
)elem
->seq
,
336 spin_unlock(&fs_info
->tree_mod_seq_lock
);
340 struct btrfs_delayed_ref_head
*
341 btrfs_select_ref_head(struct btrfs_trans_handle
*trans
)
343 struct btrfs_delayed_ref_root
*delayed_refs
;
344 struct btrfs_delayed_ref_head
*head
;
348 delayed_refs
= &trans
->transaction
->delayed_refs
;
351 start
= delayed_refs
->run_delayed_start
;
352 head
= find_ref_head(&delayed_refs
->href_root
, start
, 1);
353 if (!head
&& !loop
) {
354 delayed_refs
->run_delayed_start
= 0;
357 head
= find_ref_head(&delayed_refs
->href_root
, start
, 1);
360 } else if (!head
&& loop
) {
364 while (head
->processing
) {
365 struct rb_node
*node
;
367 node
= rb_next(&head
->href_node
);
371 delayed_refs
->run_delayed_start
= 0;
376 head
= rb_entry(node
, struct btrfs_delayed_ref_head
,
380 head
->processing
= 1;
381 WARN_ON(delayed_refs
->num_heads_ready
== 0);
382 delayed_refs
->num_heads_ready
--;
383 delayed_refs
->run_delayed_start
= head
->node
.bytenr
+
384 head
->node
.num_bytes
;
389 * Helper to insert the ref_node to the tail or merge with tail.
391 * Return 0 for insert.
392 * Return >0 for merge.
395 add_delayed_ref_tail_merge(struct btrfs_trans_handle
*trans
,
396 struct btrfs_delayed_ref_root
*root
,
397 struct btrfs_delayed_ref_head
*href
,
398 struct btrfs_delayed_ref_node
*ref
)
400 struct btrfs_delayed_ref_node
*exist
;
404 spin_lock(&href
->lock
);
405 /* Check whether we can merge the tail node with ref */
406 if (list_empty(&href
->ref_list
))
408 exist
= list_entry(href
->ref_list
.prev
, struct btrfs_delayed_ref_node
,
410 /* No need to compare bytenr nor is_head */
411 if (exist
->type
!= ref
->type
|| exist
->seq
!= ref
->seq
)
414 if ((exist
->type
== BTRFS_TREE_BLOCK_REF_KEY
||
415 exist
->type
== BTRFS_SHARED_BLOCK_REF_KEY
) &&
416 comp_tree_refs(btrfs_delayed_node_to_tree_ref(exist
),
417 btrfs_delayed_node_to_tree_ref(ref
),
420 if ((exist
->type
== BTRFS_EXTENT_DATA_REF_KEY
||
421 exist
->type
== BTRFS_SHARED_DATA_REF_KEY
) &&
422 comp_data_refs(btrfs_delayed_node_to_data_ref(exist
),
423 btrfs_delayed_node_to_data_ref(ref
)))
426 /* Now we are sure we can merge */
428 if (exist
->action
== ref
->action
) {
431 /* Need to change action */
432 if (exist
->ref_mod
< ref
->ref_mod
) {
433 exist
->action
= ref
->action
;
434 mod
= -exist
->ref_mod
;
435 exist
->ref_mod
= ref
->ref_mod
;
436 if (ref
->action
== BTRFS_ADD_DELAYED_REF
)
437 list_add_tail(&exist
->add_list
,
438 &href
->ref_add_list
);
439 else if (ref
->action
== BTRFS_DROP_DELAYED_REF
) {
440 ASSERT(!list_empty(&exist
->add_list
));
441 list_del(&exist
->add_list
);
448 exist
->ref_mod
+= mod
;
450 /* remove existing tail if its ref_mod is zero */
451 if (exist
->ref_mod
== 0)
452 drop_delayed_ref(trans
, root
, href
, exist
);
453 spin_unlock(&href
->lock
);
457 list_add_tail(&ref
->list
, &href
->ref_list
);
458 if (ref
->action
== BTRFS_ADD_DELAYED_REF
)
459 list_add_tail(&ref
->add_list
, &href
->ref_add_list
);
460 atomic_inc(&root
->num_entries
);
461 trans
->delayed_ref_updates
++;
462 spin_unlock(&href
->lock
);
467 * helper function to update the accounting in the head ref
468 * existing and update must have the same bytenr
471 update_existing_head_ref(struct btrfs_delayed_ref_root
*delayed_refs
,
472 struct btrfs_delayed_ref_node
*existing
,
473 struct btrfs_delayed_ref_node
*update
,
474 int *old_ref_mod_ret
)
476 struct btrfs_delayed_ref_head
*existing_ref
;
477 struct btrfs_delayed_ref_head
*ref
;
480 existing_ref
= btrfs_delayed_node_to_head(existing
);
481 ref
= btrfs_delayed_node_to_head(update
);
482 BUG_ON(existing_ref
->is_data
!= ref
->is_data
);
484 spin_lock(&existing_ref
->lock
);
485 if (ref
->must_insert_reserved
) {
486 /* if the extent was freed and then
487 * reallocated before the delayed ref
488 * entries were processed, we can end up
489 * with an existing head ref without
490 * the must_insert_reserved flag set.
493 existing_ref
->must_insert_reserved
= ref
->must_insert_reserved
;
496 * update the num_bytes so we make sure the accounting
499 existing
->num_bytes
= update
->num_bytes
;
503 if (ref
->extent_op
) {
504 if (!existing_ref
->extent_op
) {
505 existing_ref
->extent_op
= ref
->extent_op
;
507 if (ref
->extent_op
->update_key
) {
508 memcpy(&existing_ref
->extent_op
->key
,
509 &ref
->extent_op
->key
,
510 sizeof(ref
->extent_op
->key
));
511 existing_ref
->extent_op
->update_key
= true;
513 if (ref
->extent_op
->update_flags
) {
514 existing_ref
->extent_op
->flags_to_set
|=
515 ref
->extent_op
->flags_to_set
;
516 existing_ref
->extent_op
->update_flags
= true;
518 btrfs_free_delayed_extent_op(ref
->extent_op
);
522 * update the reference mod on the head to reflect this new operation,
523 * only need the lock for this case cause we could be processing it
524 * currently, for refs we just added we know we're a-ok.
526 old_ref_mod
= existing_ref
->total_ref_mod
;
528 *old_ref_mod_ret
= old_ref_mod
;
529 existing
->ref_mod
+= update
->ref_mod
;
530 existing_ref
->total_ref_mod
+= update
->ref_mod
;
533 * If we are going to from a positive ref mod to a negative or vice
534 * versa we need to make sure to adjust pending_csums accordingly.
536 if (existing_ref
->is_data
) {
537 if (existing_ref
->total_ref_mod
>= 0 && old_ref_mod
< 0)
538 delayed_refs
->pending_csums
-= existing
->num_bytes
;
539 if (existing_ref
->total_ref_mod
< 0 && old_ref_mod
>= 0)
540 delayed_refs
->pending_csums
+= existing
->num_bytes
;
542 spin_unlock(&existing_ref
->lock
);
546 * helper function to actually insert a head node into the rbtree.
547 * this does all the dirty work in terms of maintaining the correct
548 * overall modification count.
550 static noinline
struct btrfs_delayed_ref_head
*
551 add_delayed_ref_head(struct btrfs_fs_info
*fs_info
,
552 struct btrfs_trans_handle
*trans
,
553 struct btrfs_delayed_ref_node
*ref
,
554 struct btrfs_qgroup_extent_record
*qrecord
,
555 u64 bytenr
, u64 num_bytes
, u64 ref_root
, u64 reserved
,
556 int action
, int is_data
, int *qrecord_inserted_ret
,
557 int *old_ref_mod
, int *new_ref_mod
)
559 struct btrfs_delayed_ref_head
*existing
;
560 struct btrfs_delayed_ref_head
*head_ref
= NULL
;
561 struct btrfs_delayed_ref_root
*delayed_refs
;
563 int must_insert_reserved
= 0;
564 int qrecord_inserted
= 0;
566 /* If reserved is provided, it must be a data extent. */
567 BUG_ON(!is_data
&& reserved
);
570 * the head node stores the sum of all the mods, so dropping a ref
571 * should drop the sum in the head node by one.
573 if (action
== BTRFS_UPDATE_DELAYED_HEAD
)
575 else if (action
== BTRFS_DROP_DELAYED_REF
)
579 * BTRFS_ADD_DELAYED_EXTENT means that we need to update
580 * the reserved accounting when the extent is finally added, or
581 * if a later modification deletes the delayed ref without ever
582 * inserting the extent into the extent allocation tree.
583 * ref->must_insert_reserved is the flag used to record
584 * that accounting mods are required.
586 * Once we record must_insert_reserved, switch the action to
587 * BTRFS_ADD_DELAYED_REF because other special casing is not required.
589 if (action
== BTRFS_ADD_DELAYED_EXTENT
)
590 must_insert_reserved
= 1;
592 must_insert_reserved
= 0;
594 delayed_refs
= &trans
->transaction
->delayed_refs
;
596 /* first set the basic ref node struct up */
597 refcount_set(&ref
->refs
, 1);
598 ref
->bytenr
= bytenr
;
599 ref
->num_bytes
= num_bytes
;
600 ref
->ref_mod
= count_mod
;
607 head_ref
= btrfs_delayed_node_to_head(ref
);
608 head_ref
->must_insert_reserved
= must_insert_reserved
;
609 head_ref
->is_data
= is_data
;
610 INIT_LIST_HEAD(&head_ref
->ref_list
);
611 INIT_LIST_HEAD(&head_ref
->ref_add_list
);
612 head_ref
->processing
= 0;
613 head_ref
->total_ref_mod
= count_mod
;
614 head_ref
->qgroup_reserved
= 0;
615 head_ref
->qgroup_ref_root
= 0;
617 /* Record qgroup extent info if provided */
619 if (ref_root
&& reserved
) {
620 head_ref
->qgroup_ref_root
= ref_root
;
621 head_ref
->qgroup_reserved
= reserved
;
624 qrecord
->bytenr
= bytenr
;
625 qrecord
->num_bytes
= num_bytes
;
626 qrecord
->old_roots
= NULL
;
628 if(btrfs_qgroup_trace_extent_nolock(fs_info
,
629 delayed_refs
, qrecord
))
632 qrecord_inserted
= 1;
635 spin_lock_init(&head_ref
->lock
);
636 mutex_init(&head_ref
->mutex
);
638 trace_add_delayed_ref_head(fs_info
, ref
, head_ref
, action
);
640 existing
= htree_insert(&delayed_refs
->href_root
,
641 &head_ref
->href_node
);
643 WARN_ON(ref_root
&& reserved
&& existing
->qgroup_ref_root
644 && existing
->qgroup_reserved
);
645 update_existing_head_ref(delayed_refs
, &existing
->node
, ref
,
648 * we've updated the existing ref, free the newly
651 kmem_cache_free(btrfs_delayed_ref_head_cachep
, head_ref
);
656 if (is_data
&& count_mod
< 0)
657 delayed_refs
->pending_csums
+= num_bytes
;
658 delayed_refs
->num_heads
++;
659 delayed_refs
->num_heads_ready
++;
660 atomic_inc(&delayed_refs
->num_entries
);
661 trans
->delayed_ref_updates
++;
663 if (qrecord_inserted_ret
)
664 *qrecord_inserted_ret
= qrecord_inserted
;
666 *new_ref_mod
= head_ref
->total_ref_mod
;
671 * helper to insert a delayed tree ref into the rbtree.
674 add_delayed_tree_ref(struct btrfs_fs_info
*fs_info
,
675 struct btrfs_trans_handle
*trans
,
676 struct btrfs_delayed_ref_head
*head_ref
,
677 struct btrfs_delayed_ref_node
*ref
, u64 bytenr
,
678 u64 num_bytes
, u64 parent
, u64 ref_root
, int level
,
681 struct btrfs_delayed_tree_ref
*full_ref
;
682 struct btrfs_delayed_ref_root
*delayed_refs
;
686 if (action
== BTRFS_ADD_DELAYED_EXTENT
)
687 action
= BTRFS_ADD_DELAYED_REF
;
689 if (is_fstree(ref_root
))
690 seq
= atomic64_read(&fs_info
->tree_mod_seq
);
691 delayed_refs
= &trans
->transaction
->delayed_refs
;
693 /* first set the basic ref node struct up */
694 refcount_set(&ref
->refs
, 1);
695 ref
->bytenr
= bytenr
;
696 ref
->num_bytes
= num_bytes
;
698 ref
->action
= action
;
702 INIT_LIST_HEAD(&ref
->list
);
703 INIT_LIST_HEAD(&ref
->add_list
);
705 full_ref
= btrfs_delayed_node_to_tree_ref(ref
);
706 full_ref
->parent
= parent
;
707 full_ref
->root
= ref_root
;
709 ref
->type
= BTRFS_SHARED_BLOCK_REF_KEY
;
711 ref
->type
= BTRFS_TREE_BLOCK_REF_KEY
;
712 full_ref
->level
= level
;
714 trace_add_delayed_tree_ref(fs_info
, ref
, full_ref
, action
);
716 ret
= add_delayed_ref_tail_merge(trans
, delayed_refs
, head_ref
, ref
);
719 * XXX: memory should be freed at the same level allocated.
720 * But bad practice is anywhere... Follow it now. Need cleanup.
723 kmem_cache_free(btrfs_delayed_tree_ref_cachep
, full_ref
);
727 * helper to insert a delayed data ref into the rbtree.
730 add_delayed_data_ref(struct btrfs_fs_info
*fs_info
,
731 struct btrfs_trans_handle
*trans
,
732 struct btrfs_delayed_ref_head
*head_ref
,
733 struct btrfs_delayed_ref_node
*ref
, u64 bytenr
,
734 u64 num_bytes
, u64 parent
, u64 ref_root
, u64 owner
,
735 u64 offset
, int action
)
737 struct btrfs_delayed_data_ref
*full_ref
;
738 struct btrfs_delayed_ref_root
*delayed_refs
;
742 if (action
== BTRFS_ADD_DELAYED_EXTENT
)
743 action
= BTRFS_ADD_DELAYED_REF
;
745 delayed_refs
= &trans
->transaction
->delayed_refs
;
747 if (is_fstree(ref_root
))
748 seq
= atomic64_read(&fs_info
->tree_mod_seq
);
750 /* first set the basic ref node struct up */
751 refcount_set(&ref
->refs
, 1);
752 ref
->bytenr
= bytenr
;
753 ref
->num_bytes
= num_bytes
;
755 ref
->action
= action
;
759 INIT_LIST_HEAD(&ref
->list
);
760 INIT_LIST_HEAD(&ref
->add_list
);
762 full_ref
= btrfs_delayed_node_to_data_ref(ref
);
763 full_ref
->parent
= parent
;
764 full_ref
->root
= ref_root
;
766 ref
->type
= BTRFS_SHARED_DATA_REF_KEY
;
768 ref
->type
= BTRFS_EXTENT_DATA_REF_KEY
;
770 full_ref
->objectid
= owner
;
771 full_ref
->offset
= offset
;
773 trace_add_delayed_data_ref(fs_info
, ref
, full_ref
, action
);
775 ret
= add_delayed_ref_tail_merge(trans
, delayed_refs
, head_ref
, ref
);
778 kmem_cache_free(btrfs_delayed_data_ref_cachep
, full_ref
);
782 * add a delayed tree ref. This does all of the accounting required
783 * to make sure the delayed ref is eventually processed before this
784 * transaction commits.
786 int btrfs_add_delayed_tree_ref(struct btrfs_fs_info
*fs_info
,
787 struct btrfs_trans_handle
*trans
,
788 u64 bytenr
, u64 num_bytes
, u64 parent
,
789 u64 ref_root
, int level
, int action
,
790 struct btrfs_delayed_extent_op
*extent_op
,
791 int *old_ref_mod
, int *new_ref_mod
)
793 struct btrfs_delayed_tree_ref
*ref
;
794 struct btrfs_delayed_ref_head
*head_ref
;
795 struct btrfs_delayed_ref_root
*delayed_refs
;
796 struct btrfs_qgroup_extent_record
*record
= NULL
;
797 int qrecord_inserted
;
799 BUG_ON(extent_op
&& extent_op
->is_data
);
800 ref
= kmem_cache_alloc(btrfs_delayed_tree_ref_cachep
, GFP_NOFS
);
804 head_ref
= kmem_cache_alloc(btrfs_delayed_ref_head_cachep
, GFP_NOFS
);
808 if (test_bit(BTRFS_FS_QUOTA_ENABLED
, &fs_info
->flags
) &&
809 is_fstree(ref_root
)) {
810 record
= kmalloc(sizeof(*record
), GFP_NOFS
);
815 head_ref
->extent_op
= extent_op
;
817 delayed_refs
= &trans
->transaction
->delayed_refs
;
818 spin_lock(&delayed_refs
->lock
);
821 * insert both the head node and the new ref without dropping
824 head_ref
= add_delayed_ref_head(fs_info
, trans
, &head_ref
->node
, record
,
825 bytenr
, num_bytes
, 0, 0, action
, 0,
826 &qrecord_inserted
, old_ref_mod
,
829 add_delayed_tree_ref(fs_info
, trans
, head_ref
, &ref
->node
, bytenr
,
830 num_bytes
, parent
, ref_root
, level
, action
);
831 spin_unlock(&delayed_refs
->lock
);
833 if (qrecord_inserted
)
834 return btrfs_qgroup_trace_extent_post(fs_info
, record
);
838 kmem_cache_free(btrfs_delayed_ref_head_cachep
, head_ref
);
840 kmem_cache_free(btrfs_delayed_tree_ref_cachep
, ref
);
846 * add a delayed data ref. it's similar to btrfs_add_delayed_tree_ref.
848 int btrfs_add_delayed_data_ref(struct btrfs_fs_info
*fs_info
,
849 struct btrfs_trans_handle
*trans
,
850 u64 bytenr
, u64 num_bytes
,
851 u64 parent
, u64 ref_root
,
852 u64 owner
, u64 offset
, u64 reserved
, int action
,
853 int *old_ref_mod
, int *new_ref_mod
)
855 struct btrfs_delayed_data_ref
*ref
;
856 struct btrfs_delayed_ref_head
*head_ref
;
857 struct btrfs_delayed_ref_root
*delayed_refs
;
858 struct btrfs_qgroup_extent_record
*record
= NULL
;
859 int qrecord_inserted
;
861 ref
= kmem_cache_alloc(btrfs_delayed_data_ref_cachep
, GFP_NOFS
);
865 head_ref
= kmem_cache_alloc(btrfs_delayed_ref_head_cachep
, GFP_NOFS
);
867 kmem_cache_free(btrfs_delayed_data_ref_cachep
, ref
);
871 if (test_bit(BTRFS_FS_QUOTA_ENABLED
, &fs_info
->flags
) &&
872 is_fstree(ref_root
)) {
873 record
= kmalloc(sizeof(*record
), GFP_NOFS
);
875 kmem_cache_free(btrfs_delayed_data_ref_cachep
, ref
);
876 kmem_cache_free(btrfs_delayed_ref_head_cachep
,
882 head_ref
->extent_op
= NULL
;
884 delayed_refs
= &trans
->transaction
->delayed_refs
;
885 spin_lock(&delayed_refs
->lock
);
888 * insert both the head node and the new ref without dropping
891 head_ref
= add_delayed_ref_head(fs_info
, trans
, &head_ref
->node
, record
,
892 bytenr
, num_bytes
, ref_root
, reserved
,
893 action
, 1, &qrecord_inserted
,
894 old_ref_mod
, new_ref_mod
);
896 add_delayed_data_ref(fs_info
, trans
, head_ref
, &ref
->node
, bytenr
,
897 num_bytes
, parent
, ref_root
, owner
, offset
,
899 spin_unlock(&delayed_refs
->lock
);
901 if (qrecord_inserted
)
902 return btrfs_qgroup_trace_extent_post(fs_info
, record
);
906 int btrfs_add_delayed_extent_op(struct btrfs_fs_info
*fs_info
,
907 struct btrfs_trans_handle
*trans
,
908 u64 bytenr
, u64 num_bytes
,
909 struct btrfs_delayed_extent_op
*extent_op
)
911 struct btrfs_delayed_ref_head
*head_ref
;
912 struct btrfs_delayed_ref_root
*delayed_refs
;
914 head_ref
= kmem_cache_alloc(btrfs_delayed_ref_head_cachep
, GFP_NOFS
);
918 head_ref
->extent_op
= extent_op
;
920 delayed_refs
= &trans
->transaction
->delayed_refs
;
921 spin_lock(&delayed_refs
->lock
);
923 add_delayed_ref_head(fs_info
, trans
, &head_ref
->node
, NULL
, bytenr
,
924 num_bytes
, 0, 0, BTRFS_UPDATE_DELAYED_HEAD
,
925 extent_op
->is_data
, NULL
, NULL
, NULL
);
927 spin_unlock(&delayed_refs
->lock
);
932 * this does a simple search for the head node for a given extent.
933 * It must be called with the delayed ref spinlock held, and it returns
934 * the head node if any where found, or NULL if not.
936 struct btrfs_delayed_ref_head
*
937 btrfs_find_delayed_ref_head(struct btrfs_delayed_ref_root
*delayed_refs
, u64 bytenr
)
939 return find_ref_head(&delayed_refs
->href_root
, bytenr
, 0);
942 void btrfs_delayed_ref_exit(void)
944 kmem_cache_destroy(btrfs_delayed_ref_head_cachep
);
945 kmem_cache_destroy(btrfs_delayed_tree_ref_cachep
);
946 kmem_cache_destroy(btrfs_delayed_data_ref_cachep
);
947 kmem_cache_destroy(btrfs_delayed_extent_op_cachep
);
950 int btrfs_delayed_ref_init(void)
952 btrfs_delayed_ref_head_cachep
= kmem_cache_create(
953 "btrfs_delayed_ref_head",
954 sizeof(struct btrfs_delayed_ref_head
), 0,
955 SLAB_MEM_SPREAD
, NULL
);
956 if (!btrfs_delayed_ref_head_cachep
)
959 btrfs_delayed_tree_ref_cachep
= kmem_cache_create(
960 "btrfs_delayed_tree_ref",
961 sizeof(struct btrfs_delayed_tree_ref
), 0,
962 SLAB_MEM_SPREAD
, NULL
);
963 if (!btrfs_delayed_tree_ref_cachep
)
966 btrfs_delayed_data_ref_cachep
= kmem_cache_create(
967 "btrfs_delayed_data_ref",
968 sizeof(struct btrfs_delayed_data_ref
), 0,
969 SLAB_MEM_SPREAD
, NULL
);
970 if (!btrfs_delayed_data_ref_cachep
)
973 btrfs_delayed_extent_op_cachep
= kmem_cache_create(
974 "btrfs_delayed_extent_op",
975 sizeof(struct btrfs_delayed_extent_op
), 0,
976 SLAB_MEM_SPREAD
, NULL
);
977 if (!btrfs_delayed_extent_op_cachep
)
982 btrfs_delayed_ref_exit();