2 * Copyright (c) 2007-2008 The DragonFly Project. All rights reserved.
4 * This code is derived from software contributed to The DragonFly Project
5 * by Matthew Dillon <dillon@backplane.com>
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions
11 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in
15 * the documentation and/or other materials provided with the
17 * 3. Neither the name of The DragonFly Project nor the names of its
18 * contributors may be used to endorse or promote products derived
19 * from this software without specific, prior written permission.
21 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
22 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
23 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
24 * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
25 * COPYRIGHT HOLDERS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
26 * INCIDENTAL, SPECIAL, EXEMPLARY OR CONSEQUENTIAL DAMAGES (INCLUDING,
27 * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
28 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
29 * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
30 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
31 * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
34 * $DragonFly: src/sys/vfs/hammer/hammer_transaction.c,v 1.25 2008/09/23 21:03:52 dillon Exp $
39 static hammer_tid_t
hammer_alloc_tid(hammer_mount_t hmp
, int count
);
40 static u_int32_t
ocp_allocbit(hammer_objid_cache_t ocp
, u_int32_t n
);
44 * Start a standard transaction.
47 hammer_start_transaction(struct hammer_transaction
*trans
,
48 struct hammer_mount
*hmp
)
53 trans
->type
= HAMMER_TRANS_STD
;
55 trans
->rootvol
= hammer_get_root_volume(hmp
, &error
);
58 trans
->sync_lock_refs
= 0;
62 trans
->time
= (unsigned long)tv
.tv_sec
* 1000000ULL + tv
.tv_usec
;
63 trans
->time32
= (u_int32_t
)tv
.tv_sec
;
67 * Start a simple read-only transaction. This will not stall.
70 hammer_simple_transaction(struct hammer_transaction
*trans
,
71 struct hammer_mount
*hmp
)
76 trans
->type
= HAMMER_TRANS_RO
;
78 trans
->rootvol
= hammer_get_root_volume(hmp
, &error
);
81 trans
->sync_lock_refs
= 0;
85 trans
->time
= (unsigned long)tv
.tv_sec
* 1000000ULL + tv
.tv_usec
;
86 trans
->time32
= (u_int32_t
)tv
.tv_sec
;
90 * Start a transaction using a particular TID. Used by the sync code.
91 * This does not stall.
93 * This routine may only be called from the flusher thread. We predispose
94 * sync_lock_refs, implying serialization against the synchronization stage
95 * (which the flusher is responsible for).
98 hammer_start_transaction_fls(struct hammer_transaction
*trans
,
99 struct hammer_mount
*hmp
)
104 bzero(trans
, sizeof(*trans
));
106 trans
->type
= HAMMER_TRANS_FLS
;
108 trans
->rootvol
= hammer_get_root_volume(hmp
, &error
);
109 KKASSERT(error
== 0);
110 trans
->tid
= hammer_alloc_tid(hmp
, 1);
111 trans
->sync_lock_refs
= 1;
115 trans
->time
= (unsigned long)tv
.tv_sec
* 1000000ULL + tv
.tv_usec
;
116 trans
->time32
= (u_int32_t
)tv
.tv_sec
;
120 hammer_done_transaction(struct hammer_transaction
*trans
)
122 hammer_mount_t hmp
= trans
->hmp
;
123 int expected_lock_refs
;
125 hammer_rel_volume(trans
->rootvol
, 0);
126 trans
->rootvol
= NULL
;
127 expected_lock_refs
= (trans
->type
== HAMMER_TRANS_FLS
) ? 1 : 0;
128 KKASSERT(trans
->sync_lock_refs
== expected_lock_refs
);
129 trans
->sync_lock_refs
= 0;
130 if (trans
->type
!= HAMMER_TRANS_FLS
) {
131 if (trans
->flags
& HAMMER_TRANSF_NEWINODE
)
132 hammer_inode_waitreclaims(hmp
);
133 else if (trans
->flags
& HAMMER_TRANSF_DIDIO
)
134 hammer_inode_waithard(hmp
);
139 * Allocate (count) TIDs. If running in multi-master mode the returned
140 * base will be aligned to a 16-count plus the master id (0-15).
141 * Multi-master mode allows non-conflicting to run and new objects to be
142 * created on multiple masters in parallel. The transaction id identifies
143 * the original master. The object_id is also subject to this rule in
144 * order to allow objects to be created on multiple masters in parallel.
146 * Directories may pre-allocate a large number of object ids (100,000).
148 * NOTE: There is no longer a requirement that successive transaction
149 * ids be 2 apart for separator generation.
152 hammer_alloc_tid(hammer_mount_t hmp
, int count
)
156 if (hmp
->master_id
< 0) {
157 tid
= hmp
->next_tid
+ 1;
158 hmp
->next_tid
= tid
+ count
;
160 tid
= (hmp
->next_tid
+ HAMMER_MAX_MASTERS
) &
161 ~(hammer_tid_t
)(HAMMER_MAX_MASTERS
- 1);
162 hmp
->next_tid
= tid
+ count
* HAMMER_MAX_MASTERS
;
163 tid
|= hmp
->master_id
;
165 if (tid
>= 0xFFFFFFFFFF000000ULL
)
166 panic("hammer_start_transaction: Ran out of TIDs!");
167 if (hammer_debug_tid
)
168 kprintf("alloc_tid %016llx\n", (long long)tid
);
173 * Allocate an object id.
175 * We use the upper OBJID_CACHE_BITS bits of the namekey to try to match
176 * the low bits of the objid we allocate.
179 hammer_alloc_objid(hammer_mount_t hmp
, hammer_inode_t dip
, int64_t namekey
)
181 hammer_objid_cache_t ocp
;
186 while ((ocp
= dip
->objid_cache
) == NULL
) {
187 if (hmp
->objid_cache_count
< OBJID_CACHE_SIZE
) {
188 ocp
= kmalloc(sizeof(*ocp
), hmp
->m_misc
,
190 ocp
->base_tid
= hammer_alloc_tid(hmp
,
191 OBJID_CACHE_BULK
* 2);
192 ocp
->base_tid
+= OBJID_CACHE_BULK_MASK64
;
193 ocp
->base_tid
&= ~OBJID_CACHE_BULK_MASK64
;
194 TAILQ_INSERT_HEAD(&hmp
->objid_cache_list
, ocp
, entry
);
195 ++hmp
->objid_cache_count
;
196 /* may have blocked, recheck */
197 if (dip
->objid_cache
== NULL
) {
198 dip
->objid_cache
= ocp
;
203 * Steal one from another directory?
205 * Throw away ocp's that are more then half full, they
206 * aren't worth stealing.
208 ocp
= TAILQ_FIRST(&hmp
->objid_cache_list
);
210 ocp
->dip
->objid_cache
= NULL
;
211 if (ocp
->count
>= OBJID_CACHE_BULK
/ 2) {
212 --hmp
->objid_cache_count
;
213 kfree(ocp
, hmp
->m_misc
);
215 dip
->objid_cache
= ocp
;
220 TAILQ_REMOVE(&hmp
->objid_cache_list
, ocp
, entry
);
223 * Allocate a bit based on our namekey for the low bits of our
226 incluster
= (hmp
->master_id
>= 0);
227 n
= (namekey
>> (63 - OBJID_CACHE_BULK_BITS
)) & OBJID_CACHE_BULK_MASK
;
228 n
= ocp_allocbit(ocp
, n
);
229 tid
= ocp
->base_tid
+ n
;
233 * The TID is incremented by 1 or by 16 depending what mode the
234 * mount is operating in.
236 ocp
->next_tid
+= (hmp
->master_id
< 0) ? 1 : HAMMER_MAX_MASTERS
;
238 if (ocp
->count
>= OBJID_CACHE_BULK
/ 2) {
239 dip
->objid_cache
= NULL
;
240 --hmp
->objid_cache_count
;
242 kfree(ocp
, hmp
->m_misc
);
244 TAILQ_INSERT_TAIL(&hmp
->objid_cache_list
, ocp
, entry
);
250 * Allocate a bit starting with bit n. Wrap if necessary.
252 * This routine is only ever called if a bit is available somewhere
256 ocp_allocbit(hammer_objid_cache_t ocp
, u_int32_t n
)
263 while (ocp
->bm1
[n0
] & (1 << n
)) {
264 if (ocp
->bm0
& (1 << n0
)) {
267 } else if (++n
== 32) {
273 ocp
->bm1
[n0
] |= 1 << n
;
274 if (ocp
->bm1
[n0
] == 0xFFFFFFFFU
)
276 return((n0
<< 5) + n
);
280 hammer_clear_objid(hammer_inode_t dip
)
282 hammer_objid_cache_t ocp
;
284 if ((ocp
= dip
->objid_cache
) != NULL
) {
285 dip
->objid_cache
= NULL
;
287 TAILQ_REMOVE(&dip
->hmp
->objid_cache_list
, ocp
, entry
);
288 TAILQ_INSERT_HEAD(&dip
->hmp
->objid_cache_list
, ocp
, entry
);
293 hammer_destroy_objid_cache(hammer_mount_t hmp
)
295 hammer_objid_cache_t ocp
;
297 while ((ocp
= TAILQ_FIRST(&hmp
->objid_cache_list
)) != NULL
) {
298 TAILQ_REMOVE(&hmp
->objid_cache_list
, ocp
, entry
);
300 ocp
->dip
->objid_cache
= NULL
;
301 kfree(ocp
, hmp
->m_misc
);