Miscellanious performance adjustments to the kernel
[dragonfly.git] / sys / vfs / isofs / cd9660 / cd9660_lookup.c
blob01661ae2ee726995b17bac63c54bf1f369c70bdc
1 /*-
2 * Copyright (c) 1989, 1993, 1994
3 * The Regents of the University of California. All rights reserved.
5 * This code is derived from software contributed to Berkeley
6 * by Pace Willisson (pace@blitz.com). The Rock Ridge Extension
7 * Support code is derived from software contributed to Berkeley
8 * by Atsushi Murai (amurai@spec.co.jp).
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions
12 * are met:
13 * 1. Redistributions of source code must retain the above copyright
14 * notice, this list of conditions and the following disclaimer.
15 * 2. Redistributions in binary form must reproduce the above copyright
16 * notice, this list of conditions and the following disclaimer in the
17 * documentation and/or other materials provided with the distribution.
18 * 3. All advertising materials mentioning features or use of this software
19 * must display the following acknowledgement:
20 * This product includes software developed by the University of
21 * California, Berkeley and its contributors.
22 * 4. Neither the name of the University nor the names of its contributors
23 * may be used to endorse or promote products derived from this software
24 * without specific prior written permission.
26 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
27 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
28 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
29 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
30 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
31 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
32 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
33 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
34 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
35 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
36 * SUCH DAMAGE.
38 * from: @(#)ufs_lookup.c 7.33 (Berkeley) 5/19/91
40 * @(#)cd9660_lookup.c 8.2 (Berkeley) 1/23/94
41 * $FreeBSD: src/sys/isofs/cd9660/cd9660_lookup.c,v 1.23.2.2 2001/11/04 06:19:47 dillon Exp $
42 * $DragonFly: src/sys/vfs/isofs/cd9660/cd9660_lookup.c,v 1.25 2008/06/19 23:27:39 dillon Exp $
45 #include <sys/param.h>
46 #include <sys/systm.h>
47 #include <sys/proc.h>
48 #include <sys/namei.h>
49 #include <sys/buf.h>
50 #include <sys/vnode.h>
51 #include <sys/mount.h>
53 #include "iso.h"
54 #include "cd9660_node.h"
55 #include "iso_rrip.h"
58 * Convert a component of a pathname into a pointer to a locked inode.
59 * This is a very central and rather complicated routine.
60 * If the file system is not maintained in a strict tree hierarchy,
61 * this can result in a deadlock situation (see comments in code below).
63 * The flag argument is LOOKUP, CREATE, RENAME, or DELETE depending on
64 * whether the name is to be looked up, created, renamed, or deleted.
65 * When CREATE, RENAME, or DELETE is specified, information usable in
66 * creating, renaming, or deleting a directory entry may be calculated.
67 * If flag has LOCKPARENT or'ed into it and the target of the pathname
68 * exists, lookup returns both the target and its parent directory locked.
69 * When creating or renaming and LOCKPARENT is specified, the target may
70 * not be ".". When deleting and LOCKPARENT is specified, the target may
71 * be ".", but the caller must check to ensure it does a vrele and iput
72 * instead of two iputs.
74 * Overall outline of ufs_lookup:
76 * search for name in directory, to found or notfound
77 * notfound:
78 * if creating, return locked directory, leaving info on available slots
79 * else return error
80 * found:
81 * if at end of path and deleting, return information to allow delete
82 * if at end of path and rewriting (RENAME and LOCKPARENT), lock target
83 * inode and return info to allow rewrite
84 * if not at end, add name to cache; if at end and neither creating
85 * nor deleting, add name to cache
87 * NOTE: (LOOKUP | LOCKPARENT) currently returns the parent inode unlocked.
89 * cd9660_lookup(struct vnode *a_dvp, struct vnode **a_vpp,
90 * struct componentname *a_cnp)
/*
 * cd9660_lookup: search the directory vnode ap->a_dvp for the path
 * component described by ap->a_cnp and, on success, store the vnode that
 * was found in *ap->a_vpp.
 *
 * Returns 0 on success.  When no entry matches it returns EROFS if the
 * operation is NAMEI_CREATE or NAMEI_RENAME and ENOENT otherwise.  Errors
 * from cd9660_devblkatoff(), cd9660_vget_internal() and vn_lock() are
 * passed back unchanged.
 *
 * Side effects visible in this body: dp->i_offset and dp->i_ino are
 * updated while scanning, dp->i_diroff remembers the hit position for
 * NAMEI_LOOKUP, CNP_PDIRUNLOCK in cnp->cn_flags reports whether the parent
 * was left unlocked, and the gd_nchstats two-pass counters are bumped.
 *
 * NOTE(review): this listing carries a viewer line number at the start of
 * every line, and lines that held only a brace or a comment delimiter
 * appear to be missing.  The text below is kept exactly as found - restore
 * it from the repository before compiling.
 */
92 int
93 cd9660_lookup(struct vop_old_lookup_args *ap)
95 struct vnode *vdp; /* vnode for directory being searched */
96 globaldata_t gd = mycpu;
97 struct iso_node *dp; /* inode for directory being searched */
98 struct iso_mnt *imp; /* file system that directory is in */
99 struct buf *bp; /* a buffer of directory entries */
100 struct iso_directory_record *ep = 0;/* the current directory entry */
101 int entryoffsetinblock; /* offset of ep in bp's buffer */
102 int saveoffset = 0; /* offset of last directory entry in dir */
103 int numdirpasses; /* strategy for directory search */
104 doff_t endsearch; /* offset to end directory search */
105 struct vnode *pdp; /* saved dp during symlink work */
106 struct vnode *tdp; /* returned by cd9660_vget_internal */
107 u_long bmask; /* block offset mask */
108 int lockparent; /* 1 => lockparent flag is set */
109 int wantparent; /* 1 => wantparent or lockparent flag */
110 int error;
111 ino_t ino = 0;
112 int reclen;
113 u_short namelen;
114 int isoflags;
115 char altname[NAME_MAX];
116 int res;
117 int assoc, len;
118 char *name;
119 struct vnode **vpp = ap->a_vpp;
120 struct componentname *cnp = ap->a_cnp;
121 int flags = cnp->cn_flags;
122 int nameiop = cnp->cn_nameiop;
/* No directory buffer is held yet, and the result stays NULL until a vnode is found. */
124 bp = NULL;
125 *vpp = NULL;
126 vdp = ap->a_dvp;
127 dp = VTOI(vdp);
128 imp = dp->i_mnt;
/*
 * Both values keep the masked flag bits, so they are nonzero (not
 * necessarily 1) when set.  wantparent is not read again in this body.
 */
129 lockparent = flags & CNP_LOCKPARENT;
130 wantparent = flags & (CNP_LOCKPARENT | CNP_WANTPARENT);
/* Start with CNP_PDIRUNLOCK clear; the found paths below set it again when the parent ends up unlocked. */
131 cnp->cn_flags &= ~CNP_PDIRUNLOCK;
134 * We now have a segment name to search for, and a directory to search.
137 len = cnp->cn_namelen;
138 name = cnp->cn_nameptr;
140 * A leading `=' means, we are looking for an associated file
142 if ((assoc = (imp->iso_ftype != ISO_FTYPE_RRIP && *name == ASSOCCHAR)))
144 len--;
145 name++;
149 * If there is cached information on a previous search of
150 * this directory, pick up where we last left off.
151 * We cache only lookups as these are the most common
152 * and have the greatest payoff. Caching CREATE has little
153 * benefit as it usually must search the entire directory
154 * to determine that the entry does not exist. Caching the
155 * location of the last DELETE or RENAME has not reduced
156 * profiling time and hence has been removed in the interest
157 * of simplicity.
159 bmask = imp->im_bmask;
160 if (nameiop != NAMEI_LOOKUP || dp->i_diroff == 0 ||
161 dp->i_diroff > dp->i_size) {
162 entryoffsetinblock = 0;
163 dp->i_offset = 0;
164 numdirpasses = 1;
165 } else {
166 dp->i_offset = dp->i_diroff;
167 if ((entryoffsetinblock = dp->i_offset & bmask) &&
168 (error = cd9660_devblkatoff(vdp, (off_t)dp->i_offset, NULL, &bp)))
169 return (error);
170 numdirpasses = 2;
171 gd->gd_nchstats->ncs_2passes++;
173 endsearch = dp->i_size;
175 searchloop:
176 while (dp->i_offset < endsearch) {
178 * If offset is on a block boundary,
179 * read the next directory block.
180 * Release previous if it exists.
182 if ((dp->i_offset & bmask) == 0) {
183 if (bp != NULL)
184 brelse(bp);
185 if ((error =
186 cd9660_devblkatoff(vdp, (off_t)dp->i_offset, NULL, &bp)) != 0)
187 return (error);
188 entryoffsetinblock = 0;
191 * Get pointer to next entry.
193 ep = (struct iso_directory_record *)
194 ((char *)bp->b_data + entryoffsetinblock);
196 reclen = isonum_711(ep->length);
197 if (reclen == 0) {
198 /* skip to next block, if any */
199 dp->i_offset =
200 (dp->i_offset & ~bmask) + imp->logical_block_size;
201 continue;
204 if (reclen < ISO_DIRECTORY_RECORD_SIZE)
205 /* illegal entry, stop */
206 break;
208 if (entryoffsetinblock + reclen > imp->logical_block_size)
209 /* entries are not allowed to cross boundaries */
210 break;
212 namelen = isonum_711(ep->name_len);
213 isoflags = isonum_711(imp->iso_ftype == ISO_FTYPE_HIGH_SIERRA?
214 &ep->date[6]: ep->flags);
216 if (reclen < ISO_DIRECTORY_RECORD_SIZE + namelen)
217 /* illegal entry, stop */
218 break;
221 * Check for a name match.
223 switch (imp->iso_ftype) {
224 default:
225 if (!(isoflags & 4) == !assoc) {
226 if ((len == 1
227 && *name == '.')
228 || (flags & CNP_ISDOTDOT)) {
229 if (namelen == 1
230 && ep->name[0] == ((flags & CNP_ISDOTDOT) ? 1 : 0)) {
232 * Save directory entry's inode number and
233 * release directory buffer.
235 dp->i_ino = isodirino(ep, imp);
236 goto found;
238 if (namelen != 1
239 || ep->name[0] != 0)
240 goto notfound;
241 } else if (!(res = isofncmp(name, len, ep->name, namelen, imp->joliet_level))) {
242 if (isoflags & 2)
243 ino = isodirino(ep, imp);
244 else
245 ino = bp->b_bio1.bio_offset +
246 entryoffsetinblock;
247 saveoffset = dp->i_offset;
248 } else if (ino)
249 goto foundino;
250 #ifdef NOSORTBUG /* On some CDs directory entries are not sorted correctly */
251 else if (res < 0)
252 goto notfound;
253 else if (res > 0 && numdirpasses == 2)
254 numdirpasses++;
255 #endif
257 break;
258 case ISO_FTYPE_RRIP:
259 if (isonum_711(ep->flags)&2)
260 ino = isodirino(ep, imp);
261 else
262 ino = bp->b_bio1.bio_offset +
263 entryoffsetinblock;
264 dp->i_ino = ino;
265 cd9660_rrip_getname(ep,altname,&namelen,&dp->i_ino,imp);
266 if (namelen == cnp->cn_namelen
267 && !bcmp(name,altname,namelen))
268 goto found;
269 ino = 0;
270 break;
272 dp->i_offset += reclen;
273 entryoffsetinblock += reclen;
275 if (ino) {
276 foundino:
277 dp->i_ino = ino;
278 if (saveoffset != dp->i_offset) {
279 if (lblkno(imp, dp->i_offset) !=
280 lblkno(imp, saveoffset)) {
281 if (bp != NULL)
282 brelse(bp);
283 if ((error = cd9660_devblkatoff(vdp,
284 (off_t)saveoffset, NULL, &bp)) != 0)
285 return (error);
287 entryoffsetinblock = saveoffset & bmask;
288 ep = (struct iso_directory_record *)
289 ((char *)bp->b_data + entryoffsetinblock);
290 dp->i_offset = saveoffset;
292 goto found;
294 notfound:
296 * If we started in the middle of the directory and failed
297 * to find our target, we must check the beginning as well.
299 if (numdirpasses == 2) {
300 numdirpasses--;
301 dp->i_offset = 0;
302 endsearch = dp->i_diroff;
303 goto searchloop;
305 if (bp != NULL)
306 brelse(bp);
308 if (nameiop == NAMEI_CREATE || nameiop == NAMEI_RENAME)
309 return (EROFS);
310 return (ENOENT);
312 found:
313 if (numdirpasses == 2)
314 gd->gd_nchstats->ncs_pass2++;
317 * Found component in pathname.
318 * If the final component of path name, save information
319 * in the cache as to where the entry was found.
321 if (nameiop == NAMEI_LOOKUP)
322 dp->i_diroff = dp->i_offset;
325 * Step through the translation in the name. We do not `iput' the
326 * directory because we may need it again if a symbolic link
327 * is relative to the current directory. Instead we save it
328 * unlocked as "pdp". We must get the target inode before unlocking
329 * the directory to insure that the inode will not be removed
330 * before we get it. We prevent deadlock by always fetching
331 * inodes from the root, moving down the directory tree. Thus
332 * when following backward pointers ".." we must unlock the
333 * parent directory before getting the requested directory.
334 * There is a potential race condition here if both the current
335 * and parent directories are removed before the `iget' for the
336 * inode associated with ".." returns. We hope that this occurs
337 * infrequently since we cannot avoid this race condition without
338 * implementing a sophisticated deadlock detection algorithm.
339 * Note also that this simple deadlock detection scheme will not
340 * work if the file system has any hard links other than ".."
341 * that point backwards in the directory structure.
343 pdp = vdp;
345 * If ino is different from dp->i_ino,
346 * it's a relocated directory.
/*
 * Dot-dot lookup: the directory is unlocked before the target vnode is
 * fetched.  On a fetch error it is relocked and the error returned.  On
 * success it is relocked only when LOCKPARENT was requested; otherwise
 * CNP_PDIRUNLOCK tells the caller it was left unlocked.
 */
348 if (flags & CNP_ISDOTDOT) {
349 vn_unlock(pdp); /* race to get the inode */
350 error = cd9660_vget_internal(vdp->v_mount, dp->i_ino, &tdp,
351 dp->i_ino != ino, ep);
/* ep points into bp, so the buffer is released only after the vget call has used it. */
352 brelse(bp);
353 if (error) {
354 vn_lock(pdp, LK_EXCLUSIVE | LK_RETRY);
355 return (error);
357 if (lockparent) {
358 if ((error = vn_lock(pdp, LK_EXCLUSIVE)) != 0) {
359 cnp->cn_flags |= CNP_PDIRUNLOCK;
360 vput(tdp);
361 return (error);
363 } else
364 cnp->cn_flags |= CNP_PDIRUNLOCK;
365 *vpp = tdp;
/* The entry refers to the directory being searched: return an extra reference to vdp itself. */
366 } else if (dp->i_number == dp->i_ino) {
367 brelse(bp);
368 vref(vdp); /* we want ourself, ie "." */
369 *vpp = vdp;
/* Any other entry: fetch its vnode, then unlock the parent unless LOCKPARENT was requested. */
370 } else {
371 error = cd9660_vget_internal(vdp->v_mount, dp->i_ino, &tdp,
372 dp->i_ino != ino, ep);
373 brelse(bp);
374 if (error)
375 return (error);
376 if (!lockparent) {
377 cnp->cn_flags |= CNP_PDIRUNLOCK;
378 vn_unlock(pdp);
380 *vpp = tdp;
382 return (0);
386 * Return a buffer with the contents of block "offset" from the beginning of
387 * directory "ip". If "res" is non-zero, fill it in with a pointer to the
388 * remaining space in the directory.
391 cd9660_blkatoff(struct vnode *vp, off_t offset, char **res, struct buf **bpp)
393 struct iso_node *ip;
394 struct iso_mnt *imp;
395 struct buf *bp;
396 daddr_t lbn;
397 int bsize, error;
399 ip = VTOI(vp);
400 imp = ip->i_mnt;
401 lbn = lblkno(imp, offset);
402 bsize = blksize(imp, ip, lbn);
404 if ((error = bread(vp, lblktooff(imp, lbn), bsize, &bp)) != 0) {
405 brelse(bp);
406 *bpp = NULL;
407 return (error);
411 * We must BMAP the buffer because the directory code may use
412 * bio_offset to calculate the inode for certain types of directory
413 * entries. We could get away with not doing it before we
414 * VMIO-backed the directories because the buffers would get freed
415 * atomically with the invalidation of their data. But with
416 * VMIO-backed buffers the buffers may be freed and then later
417 * reconstituted - and the reconstituted buffer will have no
418 * knowledge of bio_offset.
420 if (bp->b_bio2.bio_offset == NOOFFSET) {
421 error = VOP_BMAP(vp, bp->b_bio1.bio_offset,
422 &bp->b_bio2.bio_offset, NULL, NULL,
423 BUF_CMD_READ);
424 if (error) {
425 bp->b_error = error;
426 bp->b_flags |= B_ERROR;
427 brelse(bp);
428 *bpp = NULL;
429 return (error);
433 if (res)
434 *res = (char *)bp->b_data + blkoff(imp, offset);
435 *bpp = bp;
436 return (0);
441 * Return a buffer with the contents of block "offset" from the beginning of
442 * directory "ip". If "res" is non-zero, fill it in with a pointer to the
443 * remaining space in the directory.
445 * Use the underlying device vnode rather then the passed vnode for the
446 * buffer cache operation. This allows us to access meta-data conveniently
447 * without having to instantiate a VM object for the vnode.
449 * WARNING! Callers of this routine need to be careful when accessing
450 * the bio_offset. Since this is a device buffer, the device offset will
451 * be in bio1.bio_offset, not bio2.bio_offset.
454 cd9660_devblkatoff(struct vnode *vp, off_t offset, char **res, struct buf **bpp)
456 struct iso_node *ip;
457 struct iso_mnt *imp;
458 struct buf *bp;
459 daddr_t lbn;
460 off_t doffset;
461 int bsize, error;
463 ip = VTOI(vp);
464 imp = ip->i_mnt;
465 lbn = lblkno(imp, offset);
466 bsize = blksize(imp, ip, lbn);
468 error = VOP_BMAP(vp, lblktooff(imp, lbn), &doffset, NULL, NULL,
469 BUF_CMD_READ);
470 if (error)
471 return (error);
473 if ((error = bread(imp->im_devvp, doffset, bsize, &bp)) != 0) {
474 brelse(bp);
475 *bpp = NULL;
476 return (error);
478 if (res)
479 *res = (char *)bp->b_data + blkoff(imp, offset);
480 *bpp = bp;
481 return (0);