1 /* Traverse a file hierarchy.
3 Copyright (C) 2004-2020 Free Software Foundation, Inc.
5 This program is free software: you can redistribute it and/or modify
6 it under the terms of the GNU General Public License as published by
7 the Free Software Foundation; either version 3 of the License, or
8 (at your option) any later version.
10 This program is distributed in the hope that it will be useful,
11 but WITHOUT ANY WARRANTY; without even the implied warranty of
12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 GNU General Public License for more details.
15 You should have received a copy of the GNU General Public License
16 along with this program. If not, see <https://www.gnu.org/licenses/>. */
19 * Copyright (c) 1990, 1993, 1994
20 * The Regents of the University of California. All rights reserved.
22 * Redistribution and use in source and binary forms, with or without
23 * modification, are permitted provided that the following conditions
25 * 1. Redistributions of source code must retain the above copyright
26 * notice, this list of conditions and the following disclaimer.
27 * 2. Redistributions in binary form must reproduce the above copyright
28 * notice, this list of conditions and the following disclaimer in the
29 * documentation and/or other materials provided with the distribution.
30 * 4. Neither the name of the University nor the names of its contributors
31 * may be used to endorse or promote products derived from this software
32 * without specific prior written permission.
34 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS" AND
35 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
36 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
37 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
38 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
39 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
40 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
41 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
42 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
43 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
49 #if defined LIBC_SCCS && !defined GCC_LINT && !defined lint
50 static char sccsid
[] = "@(#)fts.c 8.6 (Berkeley) 8/14/94";
55 #if HAVE_SYS_PARAM_H || defined _LIBC
56 # include <sys/param.h>
59 # include <include/sys/stat.h>
61 # include <sys/stat.h>
73 # include "attribute.h"
75 # include "flexmember.h"
77 # include "opendirat.h"
78 # include "same-inode.h"
82 #ifndef _D_EXACT_NAMLEN
83 # define _D_EXACT_NAMLEN(dirent) strlen ((dirent)->d_name)
86 #if HAVE_STRUCT_DIRENT_D_TYPE
87 /* True if the type of the directory entry D is known. */
88 # define DT_IS_KNOWN(d) ((d)->d_type != DT_UNKNOWN)
89 /* True if the type of the directory entry D must be T. */
90 # define DT_MUST_BE(d, t) ((d)->d_type == (t))
91 # define D_TYPE(d) ((d)->d_type)
93 # define DT_IS_KNOWN(d) false
94 # define DT_MUST_BE(d, t) false
95 # define D_TYPE(d) DT_UNKNOWN
100 /* Any nonzero values will do here, so long as they're distinct.
101 Undefine any existing macros to get them out of the way. */
127 NOT_AN_INODE_NUMBER
= 0
130 #ifdef D_INO_IN_DIRENT
131 # define D_INO(dp) (dp)->d_ino
133 /* Some systems don't have inodes, so fake them to avoid lots of ifdefs. */
134 # define D_INO(dp) NOT_AN_INODE_NUMBER
137 /* If possible (see max_entries, below), read no more than this many directory
138 entries at a time. Without this limit (i.e., when using non-NULL
139 fts_compar), processing a directory with 4,000,000 entries requires ~1GiB
140 of memory, and handling 64M entries would require 16GiB of memory. */
141 #ifndef FTS_MAX_READDIR_ENTRIES
142 # define FTS_MAX_READDIR_ENTRIES 100000
145 /* If there are more than this many entries in a directory,
146 and the conditions mentioned below are satisfied, then sort
147 the entries on inode number before any further processing. */
148 #ifndef FTS_INODE_SORT_DIR_ENTRIES_THRESHOLD
149 # define FTS_INODE_SORT_DIR_ENTRIES_THRESHOLD 10000
154 _FTS_INODE_SORT_DIR_ENTRIES_THRESHOLD
= FTS_INODE_SORT_DIR_ENTRIES_THRESHOLD
159 FTS_NO_STAT_REQUIRED
= 1,
160 FTS_STAT_REQUIRED
= 2
165 # define close __close
167 # define closedir __closedir
169 # define fchdir __fchdir
173 # define readdir __readdir
175 # undef internal_function
176 # define internal_function /* empty */
/* Assign VAL to errno.  The whole expansion is parenthesized so that it
   remains a single expression when used inside a larger one, e.g. as an
   operand or as the left side of a comma expression.  */
# define __set_errno(Val) (errno = (Val))
183 /* If this host provides the openat function, then we can avoid
184 attempting to open "." in some initialization code below. */
186 # define HAVE_OPENAT_SUPPORT 1
188 # define HAVE_OPENAT_SUPPORT 0
192 # define fts_assert(expr) ((void) (0 && (expr)))
194 # define fts_assert(expr) \
204 # if (__GNUC__ >= 7) || (__clang_major__ >= 10)
205 # define FALLTHROUGH __attribute__ ((__fallthrough__))
207 # define FALLTHROUGH ((void) 0)
211 static FTSENT
*fts_alloc (FTS
*, const char *, size_t) internal_function
;
212 static FTSENT
*fts_build (FTS
*, int) internal_function
;
213 static void fts_lfree (FTSENT
*) internal_function
;
214 static void fts_load (FTS
*, FTSENT
*) internal_function
;
215 static size_t fts_maxarglen (char * const *) internal_function
;
216 static void fts_padjust (FTS
*, FTSENT
*) internal_function
;
217 static bool fts_palloc (FTS
*, size_t) internal_function
;
218 static FTSENT
*fts_sort (FTS
*, FTSENT
*, size_t) internal_function
;
219 static unsigned short int fts_stat (FTS
*, FTSENT
*, bool) internal_function
;
220 static int fts_safe_changedir (FTS
*, FTSENT
*, int, const char *)
223 #include "fts-cycle.c"
226 # define MAX(a,b) ((a) > (b) ? (a) : (b))
230 # define SIZE_MAX ((size_t) -1)
/* Nonzero if the string A is exactly "." or "..".
   A is evaluated more than once, so it must not have side effects.
   Each use of the parameter is parenthesized so that an argument such as
   `name + 1' indexes the intended pointer.  */
#define ISDOT(a) ((a)[0] == '.' && (!(a)[1] || ((a)[1] == '.' && !(a)[2])))
234 #define STREQ(a, b) (strcmp (a, b) == 0)
/* Option-bit helpers.  Each one expands to an expression on
   sp->fts_options, so a variable named `sp' must be in scope wherever
   they are used: CLR clears the bits in OPT, ISSET yields the bits of OPT
   that are currently set (nonzero if any), and SET turns the bits on.  */
236 #define CLR(opt) (sp->fts_options &= ~(opt))
237 #define ISSET(opt) (sp->fts_options & (opt))
238 #define SET(opt) (sp->fts_options |= (opt))
240 /* FIXME: FTS_NOCHDIR is now misnamed.
241 Call it FTS_USE_FULL_RELATIVE_FILE_NAMES instead. */
242 #define FCHDIR(sp, fd) \
243 (!ISSET(FTS_NOCHDIR) && (ISSET(FTS_CWDFD) \
244 ? (cwd_advance_fd ((sp), (fd), true), 0) \
/* fts_build flags: they tell fts_build on whose behalf it is building
   the list of entries.  The numeric values are unchanged from the
   former macro definitions.  */
enum
  {
    BCHILD = 1,  /* fts_children */
    BNAMES = 2,  /* fts_children, names only */
    BREAD = 3    /* fts_read */
  };
255 # include <inttypes.h>
258 # include "getcwdat.h"
259 bool fts_debug
= false;
260 # define Dprintf(x) do { if (fts_debug) printf x; } while (false)
263 # define fd_ring_check(x)
264 # define fd_ring_print(a, b, c)
267 #define LEAVE_DIR(Fts, Ent, Tag) \
270 Dprintf ((" %s-leaving: %s\n", Tag, (Ent)->fts_path)); \
271 leave_dir (Fts, Ent); \
272 fd_ring_check (Fts); \
277 fd_ring_clear (I_ring
*fd_ring
)
279 while ( ! i_ring_empty (fd_ring
))
281 int fd
= i_ring_pop (fd_ring
);
287 /* Overload the fts_statp->st_size member (otherwise unused, when
288 fts_info is FTS_NSOK) to indicate whether fts_read should stat
289 this entry or not. */
291 fts_set_stat_required (FTSENT
*p
, bool required
)
293 fts_assert (p
->fts_info
== FTS_NSOK
);
294 p
->fts_statp
->st_size
= (required
296 : FTS_NO_STAT_REQUIRED
);
299 /* Virtual fchdir. Advance SP's working directory file descriptor,
300 SP->fts_cwd_fd, to FD, and push the previous value onto the fd_ring.
301 CHDIR_DOWN_ONE is true if FD corresponds to an entry in the directory
302 open on sp->fts_cwd_fd; i.e., to move the working directory one level
306 cwd_advance_fd (FTS
*sp
, int fd
, bool chdir_down_one
)
308 int old
= sp
->fts_cwd_fd
;
309 fts_assert (old
!= fd
|| old
== AT_FDCWD
);
313 /* Push "old" onto the ring.
314 If the displaced file descriptor is non-negative, close it. */
315 int prev_fd_in_slot
= i_ring_push (&sp
->fts_fd_ring
, old
);
316 fd_ring_print (sp
, stderr
, "post-push");
317 if (0 <= prev_fd_in_slot
)
318 close (prev_fd_in_slot
); /* ignore any close failure */
320 else if ( ! ISSET (FTS_NOCHDIR
))
323 close (old
); /* ignore any close failure */
329 /* Restore the initial, pre-traversal, "working directory".
330 In FTS_CWDFD mode, we merely call cwd_advance_fd, otherwise,
331 we may actually change the working directory.
332 Return 0 upon success. Upon failure, set errno and return nonzero. */
334 restore_initial_cwd (FTS
*sp
)
336 int fail
= FCHDIR (sp
, ISSET (FTS_CWDFD
) ? AT_FDCWD
: sp
->fts_rfd
);
337 fd_ring_clear (&(sp
->fts_fd_ring
));
341 /* Open the directory DIR if possible, and return a file
342 descriptor. Return -1 and set errno on failure. It doesn't matter
343 whether the file descriptor has read or write access. */
347 diropen (FTS
const *sp
, char const *dir
)
349 int open_flags
= (O_SEARCH
| O_CLOEXEC
| O_DIRECTORY
| O_NOCTTY
| O_NONBLOCK
350 | (ISSET (FTS_PHYSICAL
) ? O_NOFOLLOW
: 0));
352 int fd
= (ISSET (FTS_CWDFD
)
353 ? openat (sp
->fts_cwd_fd
, dir
, open_flags
)
354 : open (dir
, open_flags
));
359 fts_open (char * const *argv
,
360 register int options
,
361 int (*compar
) (FTSENT
const **, FTSENT
const **))
364 register FTSENT
*p
, *root
;
365 register size_t nitems
;
366 FTSENT
*parent
= NULL
;
367 FTSENT
*tmp
= NULL
; /* pacify gcc */
371 if (options
& ~FTS_OPTIONMASK
) {
372 __set_errno (EINVAL
);
375 if ((options
& FTS_NOCHDIR
) && (options
& FTS_CWDFD
)) {
376 __set_errno (EINVAL
);
379 if ( ! (options
& (FTS_LOGICAL
| FTS_PHYSICAL
))) {
380 __set_errno (EINVAL
);
384 /* Allocate/initialize the stream */
385 sp
= calloc (1, sizeof *sp
);
388 sp
->fts_compar
= compar
;
389 sp
->fts_options
= options
;
391 /* Logical walks turn on NOCHDIR; symbolic links are too hard. */
392 if (ISSET(FTS_LOGICAL
)) {
397 /* Initialize fts_cwd_fd. */
398 sp
->fts_cwd_fd
= AT_FDCWD
;
399 if ( ISSET(FTS_CWDFD
) && ! HAVE_OPENAT_SUPPORT
)
401 /* While it isn't technically necessary to open "." this
402 early, doing it here saves us the trouble of ensuring
403 later (where it'd be messier) that "." can in fact
404 be opened. If not, revert to FTS_NOCHDIR mode. */
405 int fd
= open (".", O_SEARCH
| O_CLOEXEC
);
408 /* Even if "." is unreadable, don't revert to FTS_NOCHDIR mode
409 on systems like Linux+PROC_FS, where our openat emulation
410 is good enough. Note: on a system that emulates
411 openat via /proc, this technique can still fail, but
412 only in extreme conditions, e.g., when the working
413 directory cannot be saved (i.e. save_cwd fails) --
414 and that happens on Linux only when "." is unreadable
415 and the CWD would be longer than PATH_MAX.
416 FIXME: once Linux kernel openat support is well established,
417 replace the above open call and this entire if/else block
418 with the body of the if-block below. */
419 if ( openat_needs_fchdir ())
432 * Start out with 1K of file name space, and enough, in any case,
433 * to hold the user's file names.
436 # define MAXPATHLEN 1024
439 size_t maxarglen
= fts_maxarglen(argv
);
440 if (! fts_palloc(sp
, MAX(maxarglen
, MAXPATHLEN
)))
444 /* Allocate/initialize root's parent. */
446 if ((parent
= fts_alloc(sp
, "", 0)) == NULL
)
448 parent
->fts_level
= FTS_ROOTPARENTLEVEL
;
451 /* The classic fts implementation would call fts_stat with
452 a new entry for each iteration of the loop below.
453 If the comparison function is not specified or if the
454 FTS_DEFER_STAT option is in effect, don't stat any entry
455 in this loop. This is an attempt to minimize the interval
456 between the initial stat/lstat/fstatat and the point at which
457 a directory argument is first opened. This matters for any
458 directory command line argument that resides on a file system
459 without genuine i-nodes. If you specify FTS_DEFER_STAT along
460 with a comparison function, that function must not access any
461 data via the fts_statp pointer. */
462 defer_stat
= (compar
== NULL
|| ISSET(FTS_DEFER_STAT
));
464 /* Allocate/initialize root(s). */
465 for (root
= NULL
, nitems
= 0; *argv
!= NULL
; ++argv
, ++nitems
) {
466 /* *Do* allow zero-length file names. */
467 size_t len
= strlen(*argv
);
469 if ( ! (options
& FTS_VERBATIM
))
471 /* If there are two or more trailing slashes, trim all but one,
472 but don't change "//" to "/", and do map "///" to "/". */
473 char const *v
= *argv
;
474 if (2 < len
&& v
[len
- 1] == '/')
475 while (1 < len
&& v
[len
- 2] == '/')
479 if ((p
= fts_alloc(sp
, *argv
, len
)) == NULL
)
481 p
->fts_level
= FTS_ROOTLEVEL
;
482 p
->fts_parent
= parent
;
483 p
->fts_accpath
= p
->fts_name
;
484 /* Even when defer_stat is true, be sure to stat the first
485 command line argument, since fts_read (at least with
486 FTS_XDEV) requires that. */
487 if (defer_stat
&& root
!= NULL
) {
488 p
->fts_info
= FTS_NSOK
;
489 fts_set_stat_required(p
, true);
491 p
->fts_info
= fts_stat(sp
, p
, false);
495 * If comparison routine supplied, traverse in sorted
496 * order; otherwise traverse in the order specified.
511 if (compar
&& nitems
> 1)
512 root
= fts_sort(sp
, root
, nitems
);
515 * Allocate a dummy pointer and make fts_read think that we've just
516 * finished the node before the root(s); set p->fts_info to FTS_INIT
517 * so that everything about the "current" node is ignored.
519 if ((sp
->fts_cur
= fts_alloc(sp
, "", 0)) == NULL
)
521 sp
->fts_cur
->fts_link
= root
;
522 sp
->fts_cur
->fts_info
= FTS_INIT
;
523 sp
->fts_cur
->fts_level
= 1;
524 if (! setup_dir (sp
))
528 * If using chdir(2), grab a file descriptor pointing to dot to ensure
529 * that we can get back here; this could be avoided for some file names,
530 * but almost certainly not worth the effort. Slashes, symbolic links,
531 * and ".." are all fairly nasty problems. Note, if we can't get the
532 * descriptor we run anyway, just more slowly.
534 if (!ISSET(FTS_NOCHDIR
) && !ISSET(FTS_CWDFD
)
535 && (sp
->fts_rfd
= diropen (sp
, ".")) < 0)
538 i_ring_init (&sp
->fts_fd_ring
, -1);
541 mem3
: fts_lfree(root
);
543 mem2
: free(sp
->fts_path
);
550 fts_load (FTS
*sp
, register FTSENT
*p
)
556 * Load the stream structure for the next traversal. Since we don't
557 * actually enter the directory until after the preorder visit, set
558 * the fts_accpath field specially so the chdir gets done to the right
559 * place and the user can access the first node. From fts_open it's
560 * known that the file name will fit.
562 len
= p
->fts_pathlen
= p
->fts_namelen
;
563 memmove(sp
->fts_path
, p
->fts_name
, len
+ 1);
564 if ((cp
= strrchr(p
->fts_name
, '/')) && (cp
!= p
->fts_name
|| cp
[1])) {
566 memmove(p
->fts_name
, cp
, len
+ 1);
567 p
->fts_namelen
= len
;
569 p
->fts_accpath
= p
->fts_path
= sp
->fts_path
;
575 register FTSENT
*freep
, *p
;
579 * This still works if we haven't read anything -- the dummy structure
580 * points to the root list, so we step through to the end of the root
581 * list which has a valid parent pointer.
584 for (p
= sp
->fts_cur
; p
->fts_level
>= FTS_ROOTLEVEL
;) {
586 p
= p
->fts_link
!= NULL
? p
->fts_link
: p
->fts_parent
;
592 /* Free up child linked list, sort array, file name buffer. */
594 fts_lfree(sp
->fts_child
);
598 if (ISSET(FTS_CWDFD
))
600 if (0 <= sp
->fts_cwd_fd
)
601 if (close (sp
->fts_cwd_fd
))
604 else if (!ISSET(FTS_NOCHDIR
))
606 /* Return to original directory, save errno if necessary. */
607 if (fchdir(sp
->fts_rfd
))
610 /* If close fails, record errno only if saved_errno is zero,
611 so that we report the probably-more-meaningful fchdir errno. */
612 if (close (sp
->fts_rfd
))
613 if (saved_errno
== 0)
617 fd_ring_clear (&sp
->fts_fd_ring
);
619 if (sp
->fts_leaf_optimization_works_ht
)
620 hash_free (sp
->fts_leaf_optimization_works_ht
);
624 /* Free up the stream pointer. */
627 /* Set errno and return. */
629 __set_errno (saved_errno
);
636 /* Minimum link count of a traditional Unix directory. When leaf
637 optimization is OK and a directory's st_nlink == MIN_DIR_NLINK,
638 then the directory has no subdirectories. */
639 enum { MIN_DIR_NLINK
= 2 };
641 /* Whether leaf optimization is OK for a directory. */
642 enum leaf_optimization
644 /* st_nlink is not reliable for this directory's subdirectories. */
645 NO_LEAF_OPTIMIZATION
,
647 /* st_nlink == 2 means the directory lacks subdirectories. */
651 #if (defined __linux__ || defined __ANDROID__) \
652 && HAVE_SYS_VFS_H && HAVE_FSTATFS && HAVE_STRUCT_STATFS_F_TYPE
654 # include <sys/vfs.h>
656 /* Linux-specific constants from coreutils' src/fs.h */
657 # define S_MAGIC_AFS 0x5346414F
658 # define S_MAGIC_CIFS 0xFF534D42
659 # define S_MAGIC_NFS 0x6969
660 # define S_MAGIC_PROC 0x9FA0
661 # define S_MAGIC_TMPFS 0x1021994
663 # ifdef HAVE___FSWORD_T
664 typedef __fsword_t fsword
;
666 typedef long int fsword
;
669 /* Map a stat.st_dev number to a file system type number f_type. */
676 /* Use a tiny initial size. If a traversal encounters more than
677 a few devices, the cost of growing/rehashing this table will be
678 rendered negligible by the number of inodes processed. */
679 enum { DEV_TYPE_HT_INITIAL_SIZE
= 13 };
/* Hash callback for the table created in filesystem_type.  X points to
   a struct dev_type; the result is that entry's st_dev, converted to
   uintmax_t and reduced modulo TABLE_SIZE.  */
682 dev_type_hash (void const *x
, size_t table_size
)
684 struct dev_type
const *ax
= x
;
685 uintmax_t dev
= ax
->st_dev
;
686 return dev
% table_size
;
/* Comparison callback for the table created in filesystem_type.  X and Y
   each point to a struct dev_type; the result is nonzero exactly when
   their st_dev members are equal (f_type is not compared).  */
690 dev_type_compare (void const *x
, void const *y
)
692 struct dev_type
const *ax
= x
;
693 struct dev_type
const *ay
= y
;
694 return ax
->st_dev
== ay
->st_dev
;
697 /* Return the file system type of P with file descriptor FD, or 0 if not known.
698 If FD is negative, P's file descriptor is unavailable.
699 Try to cache known values. */
702 filesystem_type (FTSENT
const *p
, int fd
)
704 FTS
*sp
= p
->fts_fts
;
705 Hash_table
*h
= sp
->fts_leaf_optimization_works_ht
;
706 struct dev_type
*ent
;
707 struct statfs fs_buf
;
709 /* If we're not in CWDFD mode, don't bother with this optimization,
710 since the caller is not serious about performance. */
711 if (!ISSET (FTS_CWDFD
))
715 h
= sp
->fts_leaf_optimization_works_ht
716 = hash_initialize (DEV_TYPE_HT_INITIAL_SIZE
, NULL
, dev_type_hash
,
717 dev_type_compare
, free
);
721 tmp
.st_dev
= p
->fts_statp
->st_dev
;
722 ent
= hash_lookup (h
, &tmp
);
727 /* Look-up failed. Query directly and cache the result. */
728 if (fd
< 0 || fstatfs (fd
, &fs_buf
) != 0)
733 struct dev_type
*t2
= malloc (sizeof *t2
);
736 t2
->st_dev
= p
->fts_statp
->st_dev
;
737 t2
->f_type
= fs_buf
.f_type
;
739 ent
= hash_insert (h
, t2
);
741 fts_assert (ent
== t2
);
747 return fs_buf
.f_type
;
750 /* Return true if sorting dirents on inode numbers is known to improve
751 traversal performance for the directory P with descriptor DIR_FD.
752 Return false otherwise. When in doubt, return true.
753 DIR_FD is negative if unavailable. */
755 dirent_inode_sort_may_be_useful (FTSENT
const *p
, int dir_fd
)
757 /* Skip the sort only if we can determine efficiently
758 that skipping it is the right thing to do.
759 The cost of performing an unnecessary sort is negligible,
760 while the cost of *not* performing it can be O(N^2) with
761 a very large constant. */
763 switch (filesystem_type (p
, dir_fd
))
768 /* On a file system of any of these types, sorting
769 is unnecessary, and hence wasteful. */
777 /* Given an FTS entry P for a directory with descriptor DIR_FD,
778 return whether it is valid to apply leaf optimization.
779 The optimization is valid if a directory's st_nlink value equal
780 to MIN_DIR_NLINK means the directory has no subdirectories.
781 DIR_FD is negative if unavailable. */
782 static enum leaf_optimization
783 leaf_optimization (FTSENT
const *p
, int dir_fd
)
785 switch (filesystem_type (p
, dir_fd
))
788 /* Leaf optimization is unsafe if the file system type is unknown. */
791 /* Although AFS mount points are not counted in st_nlink, they
792 act like directories. See <https://bugs.debian.org/143111>. */
795 /* Leaf optimization causes 'find' to abort. See
796 <https://lists.gnu.org/r/bug-gnulib/2018-04/msg00015.html>. */
799 /* NFS provides usable dirent.d_type but not necessarily for all entries
800 of large directories, so as per <https://bugzilla.redhat.com/1252549>
801 NFS should return true. However st_nlink values are not accurate on
802 all implementations as per <https://bugzilla.redhat.com/1299169>. */
805 /* Per <https://bugs.debian.org/cgi-bin/bugreport.cgi?bug=143111> /proc
806 may have bogus stat.st_nlink values. */
807 return NO_LEAF_OPTIMIZATION
;
810 return OK_LEAF_OPTIMIZATION
;
816 dirent_inode_sort_may_be_useful (FTSENT
const *p _GL_UNUSED
,
817 int dir_fd _GL_UNUSED
)
821 static enum leaf_optimization
822 leaf_optimization (FTSENT
const *p _GL_UNUSED
, int dir_fd _GL_UNUSED
)
824 return NO_LEAF_OPTIMIZATION
;
829 * Special case of "/" at the end of the file name so that slashes aren't
830 * appended which would cause file names to be written as "....//foo".
833 (p->fts_path[p->fts_pathlen - 1] == '/' \
834 ? p->fts_pathlen - 1 : p->fts_pathlen)
837 fts_read (register FTS
*sp
)
839 register FTSENT
*p
, *tmp
;
840 register unsigned short int instr
;
843 /* If finished or unrecoverable error, return NULL. */
844 if (sp
->fts_cur
== NULL
|| ISSET(FTS_STOP
))
847 /* Set current node pointer. */
850 /* Save and zero out user instructions. */
851 instr
= p
->fts_instr
;
852 p
->fts_instr
= FTS_NOINSTR
;
854 /* Any type of file may be re-visited; re-stat and re-turn. */
855 if (instr
== FTS_AGAIN
) {
856 p
->fts_info
= fts_stat(sp
, p
, false);
859 Dprintf (("fts_read: p=%s\n",
860 p
->fts_info
== FTS_INIT
? "" : p
->fts_path
));
863 * Following a symlink -- SLNONE test allows application to see
864 * SLNONE and recover. If indirecting through a symlink, we have to
865 * keep a pointer to the current location. If unable to get that
866 * pointer, the follow fails.
868 if (instr
== FTS_FOLLOW
&&
869 (p
->fts_info
== FTS_SL
|| p
->fts_info
== FTS_SLNONE
)) {
870 p
->fts_info
= fts_stat(sp
, p
, true);
871 if (p
->fts_info
== FTS_D
&& !ISSET(FTS_NOCHDIR
)) {
872 if ((p
->fts_symfd
= diropen (sp
, ".")) < 0) {
873 p
->fts_errno
= errno
;
874 p
->fts_info
= FTS_ERR
;
876 p
->fts_flags
|= FTS_SYMFOLLOW
;
881 /* Directory in pre-order. */
882 if (p
->fts_info
== FTS_D
) {
883 /* If skipped or crossed mount point, do post-order visit. */
884 if (instr
== FTS_SKIP
||
885 (ISSET(FTS_XDEV
) && p
->fts_statp
->st_dev
!= sp
->fts_dev
)) {
886 if (p
->fts_flags
& FTS_SYMFOLLOW
)
887 (void)close(p
->fts_symfd
);
889 fts_lfree(sp
->fts_child
);
890 sp
->fts_child
= NULL
;
892 p
->fts_info
= FTS_DP
;
893 LEAVE_DIR (sp
, p
, "1");
897 /* Rebuild if only read the names and now traversing. */
898 if (sp
->fts_child
!= NULL
&& ISSET(FTS_NAMEONLY
)) {
900 fts_lfree(sp
->fts_child
);
901 sp
->fts_child
= NULL
;
905 * Cd to the subdirectory.
907 * If we have already read and now fail to chdir, whack the list
908 * to make the names come out right, and set the parent errno
909 * so the application will eventually get an error condition.
910 * Set the FTS_DONTCHDIR flag so that when we logically change
911 * directories back to the parent we don't do a chdir.
913 * If we haven't read yet, do so. If the read fails, fts_build sets
914 * FTS_STOP or the fts_info field of the node.
916 if (sp
->fts_child
!= NULL
) {
917 if (fts_safe_changedir(sp
, p
, -1, p
->fts_accpath
)) {
918 p
->fts_errno
= errno
;
919 p
->fts_flags
|= FTS_DONTCHDIR
;
920 for (p
= sp
->fts_child
; p
!= NULL
;
923 p
->fts_parent
->fts_accpath
;
925 } else if ((sp
->fts_child
= fts_build(sp
, BREAD
)) == NULL
) {
928 /* If fts_build's call to fts_safe_changedir failed
929 because it was not able to fchdir into a
930 subdirectory, tell the caller. */
931 if (p
->fts_errno
&& p
->fts_info
!= FTS_DNR
)
932 p
->fts_info
= FTS_ERR
;
933 LEAVE_DIR (sp
, p
, "2");
937 sp
->fts_child
= NULL
;
941 /* Move to the next node on this level. */
944 /* If we have so many directory entries that we're reading them
945 in batches, and we've reached the end of the current batch,
946 read in a new batch. */
947 if (p
->fts_link
== NULL
&& p
->fts_parent
->fts_dirp
)
951 sp
->fts_path
[p
->fts_pathlen
] = '\0';
953 if ((p
= fts_build (sp
, BREAD
)) == NULL
)
964 if ((p
= p
->fts_link
) != NULL
) {
969 * If reached the top, return to the original directory (or
970 * the root of the tree), and load the file names for the next
973 if (p
->fts_level
== FTS_ROOTLEVEL
) {
974 if (restore_initial_cwd(sp
)) {
985 * User may have called fts_set on the node. If skipped,
986 * ignore. If followed, get a file descriptor so we can
987 * get back if necessary.
989 if (p
->fts_instr
== FTS_SKIP
)
991 if (p
->fts_instr
== FTS_FOLLOW
) {
992 p
->fts_info
= fts_stat(sp
, p
, true);
993 if (p
->fts_info
== FTS_D
&& !ISSET(FTS_NOCHDIR
)) {
994 if ((p
->fts_symfd
= diropen (sp
, ".")) < 0) {
995 p
->fts_errno
= errno
;
996 p
->fts_info
= FTS_ERR
;
998 p
->fts_flags
|= FTS_SYMFOLLOW
;
1000 p
->fts_instr
= FTS_NOINSTR
;
1003 name
: t
= sp
->fts_path
+ NAPPEND(p
->fts_parent
);
1005 memmove(t
, p
->fts_name
, p
->fts_namelen
+ 1);
1008 if (p
->fts_info
== FTS_NSOK
)
1010 if (p
->fts_statp
->st_size
== FTS_STAT_REQUIRED
)
1011 p
->fts_info
= fts_stat(sp
, p
, false);
1013 fts_assert (p
->fts_statp
->st_size
== FTS_NO_STAT_REQUIRED
);
1016 if (p
->fts_info
== FTS_D
)
1018 /* Now that P->fts_statp is guaranteed to be valid,
1019 if this is a command-line directory, record its
1020 device number, to be used for FTS_XDEV. */
1021 if (p
->fts_level
== FTS_ROOTLEVEL
)
1022 sp
->fts_dev
= p
->fts_statp
->st_dev
;
1023 Dprintf ((" entering: %s\n", p
->fts_path
));
1024 if (! enter_dir (sp
, p
))
1026 __set_errno (ENOMEM
);
1034 /* Move up to the parent node. */
1035 p
= tmp
->fts_parent
;
1039 if (p
->fts_level
== FTS_ROOTPARENTLEVEL
) {
1041 * Done; free everything up and set errno to 0 so the user
1042 * can distinguish between error and EOF.
1046 return (sp
->fts_cur
= NULL
);
1049 fts_assert (p
->fts_info
!= FTS_NSOK
);
1051 /* NUL terminate the file name. */
1052 sp
->fts_path
[p
->fts_pathlen
] = '\0';
1055 * Return to the parent directory. If at a root node, restore
1056 * the initial working directory. If we came through a symlink,
1057 * go back through the file descriptor. Otherwise, move up
1058 * one level, via "..".
1060 if (p
->fts_level
== FTS_ROOTLEVEL
) {
1061 if (restore_initial_cwd(sp
)) {
1062 p
->fts_errno
= errno
;
1065 } else if (p
->fts_flags
& FTS_SYMFOLLOW
) {
1066 if (FCHDIR(sp
, p
->fts_symfd
)) {
1067 p
->fts_errno
= errno
;
1070 (void)close(p
->fts_symfd
);
1071 } else if (!(p
->fts_flags
& FTS_DONTCHDIR
) &&
1072 fts_safe_changedir(sp
, p
->fts_parent
, -1, "..")) {
1073 p
->fts_errno
= errno
;
1077 /* If the directory causes a cycle, preserve the FTS_DC flag and keep
1078 the corresponding dev/ino pair in the hash table. It is going to be
1079 removed when leaving the original directory. */
1080 if (p
->fts_info
!= FTS_DC
) {
1081 p
->fts_info
= p
->fts_errno
? FTS_ERR
: FTS_DP
;
1082 if (p
->fts_errno
== 0)
1083 LEAVE_DIR (sp
, p
, "3");
1085 return ISSET(FTS_STOP
) ? NULL
: p
;
1089 * Fts_set takes the stream as an argument although it's not used in this
1090 * implementation; it would be necessary if anyone wanted to add global
1091 * semantics to fts using fts_set. An error return is allowed for similar
1096 fts_set(FTS
*sp _GL_UNUSED
, FTSENT
*p
, int instr
)
1098 if (instr
!= 0 && instr
!= FTS_AGAIN
&& instr
!= FTS_FOLLOW
&&
1099 instr
!= FTS_NOINSTR
&& instr
!= FTS_SKIP
) {
1100 __set_errno (EINVAL
);
1103 p
->fts_instr
= instr
;
1108 fts_children (register FTS
*sp
, int instr
)
1113 if (instr
!= 0 && instr
!= FTS_NAMEONLY
) {
1114 __set_errno (EINVAL
);
1118 /* Set current node pointer. */
1122 * Errno set to 0 so user can distinguish empty directory from
1127 /* Fatal errors stop here. */
1128 if (ISSET(FTS_STOP
))
1131 /* Return logical hierarchy of user's arguments. */
1132 if (p
->fts_info
== FTS_INIT
)
1133 return (p
->fts_link
);
1136 * If not a directory being visited in pre-order, stop here. Could
1137 * allow FTS_DNR, assuming the user has fixed the problem, but the
1138 * same effect is available with FTS_AGAIN.
1140 if (p
->fts_info
!= FTS_D
/* && p->fts_info != FTS_DNR */)
1143 /* Free up any previous child list. */
1144 if (sp
->fts_child
!= NULL
)
1145 fts_lfree(sp
->fts_child
);
1147 if (instr
== FTS_NAMEONLY
) {
1154 * If using chdir on a relative file name and called BEFORE fts_read
1155 * does its chdir to the root of a traversal, we can lose -- we need to
1156 * chdir into the subdirectory, and we don't know where the current
1157 * directory is, so we can't get back so that the upcoming chdir by
1158 * fts_read will work.
1160 if (p
->fts_level
!= FTS_ROOTLEVEL
|| p
->fts_accpath
[0] == '/' ||
1162 return (sp
->fts_child
= fts_build(sp
, instr
));
1164 if ((fd
= diropen (sp
, ".")) < 0)
1165 return (sp
->fts_child
= NULL
);
1166 sp
->fts_child
= fts_build(sp
, instr
);
1167 if (ISSET(FTS_CWDFD
))
1169 cwd_advance_fd (sp
, fd
, true);
1175 int saved_errno
= errno
;
1177 __set_errno (saved_errno
);
1182 return (sp
->fts_child
);
1185 /* A comparison function to sort on increasing inode number.
1186 For some file system types, sorting either way makes a huge
1187 performance difference for a directory with very many entries,
1188 but sorting on increasing values is slightly better than sorting
1189 on decreasing values. The difference is in the 5% range. */
1191 fts_compare_ino (struct _ftsent
const **a
, struct _ftsent
const **b
)
1193 return _GL_CMP (a
[0]->fts_statp
->st_ino
, b
[0]->fts_statp
->st_ino
);
1196 /* Map the dirent.d_type value, DTYPE, to the corresponding stat.st_mode
1197 S_IF* bit and set ST.st_mode, thus clearing all other bits in that field. */
1199 set_stat_type (struct stat
*st
, unsigned int dtype
)
1231 #define closedir_and_clear(dirp) \
1239 #define fts_opendir(file, Pdir_fd) \
1240 opendirat((! ISSET(FTS_NOCHDIR) && ISSET(FTS_CWDFD) \
1241 ? sp->fts_cwd_fd : AT_FDCWD), \
1243 (((ISSET(FTS_PHYSICAL) \
1244 && ! (ISSET(FTS_COMFOLLOW) \
1245 && cur->fts_level == FTS_ROOTLEVEL)) \
1246 ? O_NOFOLLOW : 0)), \
1250 * This is the tricky part -- do not casually change *anything* in here. The
1251 * idea is to build the linked list of entries that are used by fts_children
1252 * and fts_read. There are lots of special cases.
1254 * The real slowdown in walking the tree is the stat calls. If FTS_NOSTAT is
1255 * set and it's a physical walk (so that symbolic links can't be directories),
1256 * we can do things quickly. First, if it's a 4.4BSD file system, the type
1257 * of the file is in the directory entry. Otherwise, we assume that the number
1258 * of subdirectories in a node is equal to the number of links to the parent.
1259 * The former skips all stat calls. The latter skips stat calls in any leaf
1260 * directories and for any files after the subdirectories in the directory have
1261 * been found, cutting the stat calls by about 2/3.
1265 fts_build (register FTS
*sp
, int type
)
1267 register FTSENT
*p
, *head
;
1268 register size_t nitems
;
1275 size_t len
, maxlen
, new_len
;
1278 FTSENT
*cur
= sp
->fts_cur
;
1279 bool continue_readdir
= !!cur
->fts_dirp
;
1280 bool sort_by_inode
= false;
1283 /* When cur->fts_dirp is non-NULL, that means we should
1284 continue calling readdir on that existing DIR* pointer
1285 rather than opening a new one. */
1286 if (continue_readdir
)
1288 DIR *dp
= cur
->fts_dirp
;
1289 dir_fd
= dirfd (dp
);
1292 closedir_and_clear (cur
->fts_dirp
);
1295 cur
->fts_info
= FTS_DNR
;
1296 cur
->fts_errno
= errno
;
1303 /* Open the directory for reading. If this fails, we're done.
1304 If being called from fts_read, set the fts_info field. */
1305 if ((cur
->fts_dirp
= fts_opendir(cur
->fts_accpath
, &dir_fd
)) == NULL
)
1309 cur
->fts_info
= FTS_DNR
;
1310 cur
->fts_errno
= errno
;
1314 /* Rather than calling fts_stat for each and every entry encountered
1315 in the readdir loop (below), stat each directory only right after
1317 if (cur
->fts_info
== FTS_NSOK
)
1318 cur
->fts_info
= fts_stat(sp
, cur
, false);
1319 else if (sp
->fts_options
& FTS_TIGHT_CYCLE_CHECK
)
1321 /* Now read the stat info again after opening a directory to
1322 reveal eventual changes caused by a submount triggered by
1323 the traversal. But do it only for utilities which use
1324 FTS_TIGHT_CYCLE_CHECK. Therefore, only find and du
1325 benefit/suffer from this feature for now. */
1326 LEAVE_DIR (sp
, cur
, "4");
1327 fts_stat (sp
, cur
, false);
1328 if (! enter_dir (sp
, cur
))
1330 __set_errno (ENOMEM
);
1336 /* Maximum number of readdir entries to read at one time. This
1337 limitation is to avoid reading millions of entries into memory
1338 at once. When an fts_compar function is specified, we have no
1339 choice: we must read all entries into memory before calling that
1340 function. But when no such function is specified, we can read
1341 entries in batches that are large enough to help us with inode-
1342 sorting, yet not so large that we risk exhausting memory. */
1343 max_entries
= sp
->fts_compar
? SIZE_MAX
: FTS_MAX_READDIR_ENTRIES
;
1346 * If we're going to need to stat anything or we want to descend
1347 * and stay in the directory, chdir. If this fails we keep going,
1348 * but set a flag so we don't chdir after the post-order visit.
1349 * We won't be able to stat anything, but we can still return the
1350 * names themselves. Note, that since fts_read won't be able to
1351 * chdir into the directory, it will have to return different file
1352 * names than before, i.e. "a/b" instead of "b". Since the node
1353 * has already been visited in pre-order, have to wait until the
1354 * post-order visit to return the error. There is a special case
1355 * here, if there was nothing to stat then it's not an error to
1356 * not be able to stat. This is all fairly nasty. If a program
1357 * needed sorted entries or stat information, they had better be
1358 * checking FTS_NS on the returned nodes.
1360 if (continue_readdir
)
1362 /* When resuming a short readdir run, we already have
1363 the required dirp and dir_fd. */
1368 /* Try to descend unless it is a names-only fts_children,
1369 or the directory is known to lack subdirectories. */
1370 descend
= (type
!= BNAMES
1371 && ! (ISSET (FTS_NOSTAT
) && ISSET (FTS_PHYSICAL
)
1372 && ! ISSET (FTS_SEEDOT
)
1373 && cur
->fts_statp
->st_nlink
== MIN_DIR_NLINK
1374 && (leaf_optimization (cur
, dir_fd
)
1375 != NO_LEAF_OPTIMIZATION
)));
1376 if (descend
|| type
== BREAD
)
1378 if (ISSET(FTS_CWDFD
))
1379 dir_fd
= fcntl (dir_fd
, F_DUPFD_CLOEXEC
, STDERR_FILENO
+ 1);
1380 if (dir_fd
< 0 || fts_safe_changedir(sp
, cur
, dir_fd
, NULL
)) {
1381 if (descend
&& type
== BREAD
)
1382 cur
->fts_errno
= errno
;
1383 cur
->fts_flags
|= FTS_DONTCHDIR
;
1385 closedir_and_clear(cur
->fts_dirp
);
1386 if (ISSET(FTS_CWDFD
) && 0 <= dir_fd
)
1388 cur
->fts_dirp
= NULL
;
1395 * Figure out the max file name length that can be stored in the
1396 * current buffer -- the inner loop allocates more space as necessary.
1397 * We really wouldn't have to do the maxlen calculations here, we
1398 * could do them in fts_read before returning the name, but it's a
1399 * lot easier here since the length is part of the dirent structure.
1401 * If not changing directories, set a pointer so that we can just append
1402 * each new component to the file name.
1405 if (ISSET(FTS_NOCHDIR
)) {
1406 cp
= sp
->fts_path
+ len
;
1409 /* GCC, you're too verbose. */
1413 maxlen
= sp
->fts_pathlen
- len
;
1415 level
= cur
->fts_level
+ 1;
1417 /* Read the directory, attaching each entry to the "link" pointer. */
1422 while (cur
->fts_dirp
) {
1425 struct dirent
*dp
= readdir(cur
->fts_dirp
);
1428 cur
->fts_errno
= errno
;
1429 /* If we've not read any items yet, treat
1430 the error as if we can't access the dir. */
1431 cur
->fts_info
= (continue_readdir
|| nitems
)
1432 ? FTS_ERR
: FTS_DNR
;
1436 if (!ISSET(FTS_SEEDOT
) && ISDOT(dp
->d_name
))
1439 d_namelen
= _D_EXACT_NAMLEN (dp
);
1440 p
= fts_alloc (sp
, dp
->d_name
, d_namelen
);
1443 if (d_namelen
>= maxlen
) {
1444 /* include space for NUL */
1445 oldaddr
= sp
->fts_path
;
1446 if (! fts_palloc(sp
, d_namelen
+ len
+ 1)) {
1448 * No more memory. Save
1449 * errno, free up the current structure and the
1450 * structures already allocated.
1452 mem1
: saved_errno
= errno
;
1455 closedir_and_clear(cur
->fts_dirp
);
1456 cur
->fts_info
= FTS_ERR
;
1458 __set_errno (saved_errno
);
1461 /* Did realloc() change the pointer? */
1462 if (oldaddr
!= sp
->fts_path
) {
1464 if (ISSET(FTS_NOCHDIR
))
1465 cp
= sp
->fts_path
+ len
;
1467 maxlen
= sp
->fts_pathlen
- len
;
1470 new_len
= len
+ d_namelen
;
1471 if (new_len
< len
) {
1473 * In the unlikely event that we would end up
1474 * with a file name longer than SIZE_MAX, free up
1475 * the current structure and the structures already
1476 * allocated, then error out with ENAMETOOLONG.
1480 closedir_and_clear(cur
->fts_dirp
);
1481 cur
->fts_info
= FTS_ERR
;
1483 __set_errno (ENAMETOOLONG
);
1486 p
->fts_level
= level
;
1487 p
->fts_parent
= sp
->fts_cur
;
1488 p
->fts_pathlen
= new_len
;
1490 /* Store dirent.d_ino, in case we need to sort
1491 entries before processing them. */
1492 p
->fts_statp
->st_ino
= D_INO (dp
);
1494 /* Build a file name for fts_stat to stat. */
1495 if (ISSET(FTS_NOCHDIR
)) {
1496 p
->fts_accpath
= p
->fts_path
;
1497 memmove(cp
, p
->fts_name
, p
->fts_namelen
+ 1);
1499 p
->fts_accpath
= p
->fts_name
;
1501 if (sp
->fts_compar
== NULL
|| ISSET(FTS_DEFER_STAT
)) {
1502 /* Record what fts_read will have to do with this
1503 entry. In many cases, it will simply fts_stat it,
1504 but we can take advantage of any d_type information
1505 to optimize away the unnecessary stat calls. I.e.,
1506 if FTS_NOSTAT is in effect and we're not following
1507 symlinks (FTS_PHYSICAL) and d_type indicates this
1508 is *not* a directory, then we won't have to stat it
1509 at all. If it *is* a directory, then (currently)
1510 we stat it regardless, in order to get device and
1511 inode numbers. Some day we might optimize that
1512 away, too, for directories where d_ino is known to
1514 bool skip_stat
= (ISSET(FTS_NOSTAT
)
1516 && ! DT_MUST_BE(dp
, DT_DIR
)
1517 && (ISSET(FTS_PHYSICAL
)
1518 || ! DT_MUST_BE(dp
, DT_LNK
)));
1519 p
->fts_info
= FTS_NSOK
;
1520 /* Propagate dirent.d_type information back
1521 to caller, when possible. */
1522 set_stat_type (p
->fts_statp
, D_TYPE (dp
));
1523 fts_set_stat_required(p
, !skip_stat
);
1525 p
->fts_info
= fts_stat(sp
, p
, false);
1528 /* We walk in directory order so "ls -f" doesn't get upset. */
1537 /* If there are many entries, no sorting function has been
1538 specified, and this file system is of a type that may be
1539 slow with a large number of entries, arrange to sort the
1540 directory entries on increasing inode numbers.
1542 The NITEMS comparison uses ==, not >, because the test
1543 needs to be tried at most once, and NITEMS will exceed
1544 the threshold after it is incremented below. */
1545 if (nitems
== _FTS_INODE_SORT_DIR_ENTRIES_THRESHOLD
1547 sort_by_inode
= dirent_inode_sort_may_be_useful (cur
, dir_fd
);
1550 if (max_entries
<= nitems
) {
1551 /* When there are too many dir entries, leave
1552 fts_dirp open, so that a subsequent fts_read
1553 can take up where we leave off. */
1554 goto break_without_closedir
;
1559 closedir_and_clear(cur
->fts_dirp
);
1561 break_without_closedir
:
1564 * If realloc() changed the address of the file name, adjust the
1565 * addresses for the rest of the tree and the dir list.
1568 fts_padjust(sp
, head
);
1571 * If not changing directories, reset the file name back to original
1574 if (ISSET(FTS_NOCHDIR
)) {
1575 if (len
== sp
->fts_pathlen
|| nitems
== 0)
1581 * If we descended after being called from fts_children, or after being called
1582 * from fts_read and nothing was found, get back. At the root level we use
1583 * the saved fd; if one of fts_open()'s arguments is a relative name
1584 * to an empty directory, we wind up here with no other way back. If
1585 * we can't get back, we're done.
1587 if (!continue_readdir
&& descend
&& (type
== BCHILD
|| !nitems
) &&
1588 (cur
->fts_level
== FTS_ROOTLEVEL
1589 ? restore_initial_cwd(sp
)
1590 : fts_safe_changedir(sp
, cur
->fts_parent
, -1, ".."))) {
1591 cur
->fts_info
= FTS_ERR
;
1597 /* If didn't find anything, return NULL. */
1600 && cur
->fts_info
!= FTS_DNR
&& cur
->fts_info
!= FTS_ERR
)
1601 cur
->fts_info
= FTS_DP
;
1606 if (sort_by_inode
) {
1607 sp
->fts_compar
= fts_compare_ino
;
1608 head
= fts_sort (sp
, head
, nitems
);
1609 sp
->fts_compar
= NULL
;
1612 /* Sort the entries. */
1613 if (sp
->fts_compar
&& nitems
> 1)
1614 head
= fts_sort(sp
, head
, nitems
);
1620 /* Walk ->fts_parent links starting at E_CURR, until the root of the
1621 current hierarchy. There should be a directory with dev/inode
1622 matching those of AD. If not, print a lot of diagnostics. */
1624 find_matching_ancestor (FTSENT
const *e_curr
, struct Active_dir
const *ad
)
1627 for (ent
= e_curr
; ent
->fts_level
>= FTS_ROOTLEVEL
; ent
= ent
->fts_parent
)
1629 if (ad
->ino
== ent
->fts_statp
->st_ino
1630 && ad
->dev
== ent
->fts_statp
->st_dev
)
1633 printf ("ERROR: tree dir, %s, not active\n", ad
->fts_ent
->fts_accpath
);
1634 printf ("active dirs:\n");
1636 ent
->fts_level
>= FTS_ROOTLEVEL
; ent
= ent
->fts_parent
)
1637 printf (" %s(%"PRIuMAX
"/%"PRIuMAX
") to %s(%"PRIuMAX
"/%"PRIuMAX
")...\n",
1638 ad
->fts_ent
->fts_accpath
,
1639 (uintmax_t) ad
->dev
,
1640 (uintmax_t) ad
->ino
,
1642 (uintmax_t) ent
->fts_statp
->st_dev
,
1643 (uintmax_t) ent
->fts_statp
->st_ino
);
1647 fts_cross_check (FTS
const *sp
)
1649 FTSENT
const *ent
= sp
->fts_cur
;
1651 if ( ! ISSET (FTS_TIGHT_CYCLE_CHECK
))
1654 Dprintf (("fts-cross-check cur=%s\n", ent
->fts_path
));
1655 /* Make sure every parent dir is in the tree. */
1656 for (t
= ent
->fts_parent
; t
->fts_level
>= FTS_ROOTLEVEL
; t
= t
->fts_parent
)
1658 struct Active_dir ad
;
1659 ad
.ino
= t
->fts_statp
->st_ino
;
1660 ad
.dev
= t
->fts_statp
->st_dev
;
1661 if ( ! hash_lookup (sp
->fts_cycle
.ht
, &ad
))
1662 printf ("ERROR: active dir, %s, not in tree\n", t
->fts_path
);
1665 /* Make sure every dir in the tree is an active dir.
1666 But ENT is not necessarily a directory. If so, just skip this part. */
1667 if (ent
->fts_parent
->fts_level
>= FTS_ROOTLEVEL
1668 && (ent
->fts_info
== FTS_DP
1669 || ent
->fts_info
== FTS_D
))
1671 struct Active_dir
*ad
;
1672 for (ad
= hash_get_first (sp
->fts_cycle
.ht
); ad
!= NULL
;
1673 ad
= hash_get_next (sp
->fts_cycle
.ht
, ad
))
1675 find_matching_ancestor (ent
, ad
);
1681 same_fd (int fd1
, int fd2
)
1683 struct stat sb1
, sb2
;
1684 return (fstat (fd1
, &sb1
) == 0
1685 && fstat (fd2
, &sb2
) == 0
1686 && SAME_INODE (sb1
, sb2
));
1690 fd_ring_print (FTS
const *sp
, FILE *stream
, char const *msg
)
1692 I_ring
const *fd_ring
= &sp
->fts_fd_ring
;
1693 unsigned int i
= fd_ring
->fts_front
;
1694 char *cwd
= getcwdat (sp
->fts_cwd_fd
, NULL
, 0);
1695 fprintf (stream
, "=== %s ========== %s\n", msg
, cwd
);
1697 if (i_ring_empty (fd_ring
))
1702 int fd
= fd_ring
->fts_fd_ring
[i
];
1704 fprintf (stream
, "%d: %d:\n", i
, fd
);
1707 char *wd
= getcwdat (fd
, NULL
, 0);
1708 fprintf (stream
, "%d: %d: %s\n", i
, fd
, wd
);
1711 if (i
== fd_ring
->fts_back
)
1713 i
= (i
+ I_RING_SIZE
- 1) % I_RING_SIZE
;
1717 /* Ensure that each file descriptor on the fd_ring matches a
1718 parent, grandparent, etc. of the current working directory. */
1720 fd_ring_check (FTS
const *sp
)
1725 /* Make a writable copy. */
1726 I_ring fd_w
= sp
->fts_fd_ring
;
1728 int cwd_fd
= sp
->fts_cwd_fd
;
1729 cwd_fd
= fcntl (cwd_fd
, F_DUPFD_CLOEXEC
, STDERR_FILENO
+ 1);
1730 char *dot
= getcwdat (cwd_fd
, NULL
, 0);
1731 error (0, 0, "===== check ===== cwd: %s", dot
);
1733 while ( ! i_ring_empty (&fd_w
))
1735 int fd
= i_ring_pop (&fd_w
);
1738 int open_flags
= O_SEARCH
| O_CLOEXEC
;
1739 int parent_fd
= openat (cwd_fd
, "..", open_flags
);
1745 if (!same_fd (fd
, parent_fd
))
1747 char *cwd
= getcwdat (fd
, NULL
, 0);
1748 error (0, errno
, "ring : %s", cwd
);
1749 char *c2
= getcwdat (parent_fd
, NULL
, 0);
1750 error (0, errno
, "parent: %s", c2
);
1763 static unsigned short int
1765 fts_stat(FTS
*sp
, register FTSENT
*p
, bool follow
)
1767 struct stat
*sbp
= p
->fts_statp
;
1769 if (p
->fts_level
== FTS_ROOTLEVEL
&& ISSET(FTS_COMFOLLOW
))
1773 * If doing a logical walk, or application requested FTS_FOLLOW, do
1774 * a stat(2). If that fails, check for a non-existent symlink. If
1775 * fail, set the errno from the stat call.
1777 if (ISSET(FTS_LOGICAL
) || follow
) {
1778 if (stat(p
->fts_accpath
, sbp
)) {
1780 && lstat(p
->fts_accpath
, sbp
) == 0) {
1782 return (FTS_SLNONE
);
1784 p
->fts_errno
= errno
;
1787 } else if (fstatat(sp
->fts_cwd_fd
, p
->fts_accpath
, sbp
,
1788 AT_SYMLINK_NOFOLLOW
)) {
1789 p
->fts_errno
= errno
;
1790 err
: memset(sbp
, 0, sizeof(struct stat
));
1794 if (S_ISDIR(sbp
->st_mode
)) {
1795 if (ISDOT(p
->fts_name
)) {
1796 /* Command-line "." and ".." are real directories. */
1797 return (p
->fts_level
== FTS_ROOTLEVEL
? FTS_D
: FTS_DOT
);
1802 if (S_ISLNK(sbp
->st_mode
))
1804 if (S_ISREG(sbp
->st_mode
))
1806 return (FTS_DEFAULT
);
1810 fts_compar (void const *a
, void const *b
)
1812 /* Convert A and B to the correct types, to pacify the compiler, and
1813 for portability to bizarre hosts where "void const *" and "FTSENT
1814 const **" differ in runtime representation. The comparison
1815 function cannot modify *a and *b, but there is no compile-time
1817 FTSENT
const **pa
= (FTSENT
const **) a
;
1818 FTSENT
const **pb
= (FTSENT
const **) b
;
1819 return pa
[0]->fts_fts
->fts_compar (pa
, pb
);
1824 fts_sort (FTS
*sp
, FTSENT
*head
, register size_t nitems
)
1826 register FTSENT
**ap
, *p
;
1828 /* On most modern hosts, void * and FTSENT ** have the same
1829 run-time representation, and one can convert sp->fts_compar to
1830 the type qsort expects without problem. Use the heuristic that
1831 this is OK if the two pointer types are the same size, and if
1832 converting FTSENT ** to long int is the same as converting
1833 FTSENT ** to void * and then to long int. This heuristic isn't
1834 valid in general but we don't know of any counterexamples. */
1836 int (*compare
) (void const *, void const *) =
1837 ((sizeof &dummy
== sizeof (void *)
1838 && (long int) &dummy
== (long int) (void *) &dummy
)
1839 ? (int (*) (void const *, void const *)) sp
->fts_compar
1843 * Construct an array of pointers to the structures and call qsort(3).
1844 * Reassemble the array in the order returned by qsort. If unable to
1845 * sort for memory reasons, return the directory entries in their
1846 * current order. Allocate enough space for the current needs plus
1847 * 40 so we don't realloc one entry at a time.
1849 if (nitems
> sp
->fts_nitems
) {
1852 sp
->fts_nitems
= nitems
+ 40;
1853 if (SIZE_MAX
/ sizeof *a
< sp
->fts_nitems
1854 || ! (a
= realloc (sp
->fts_array
,
1855 sp
->fts_nitems
* sizeof *a
))) {
1856 free(sp
->fts_array
);
1857 sp
->fts_array
= NULL
;
1863 for (ap
= sp
->fts_array
, p
= head
; p
; p
= p
->fts_link
)
1865 qsort((void *)sp
->fts_array
, nitems
, sizeof(FTSENT
*), compare
);
1866 for (head
= *(ap
= sp
->fts_array
); --nitems
; ++ap
)
1867 ap
[0]->fts_link
= ap
[1];
1868 ap
[0]->fts_link
= NULL
;
1874 fts_alloc (FTS
*sp
, const char *name
, register size_t namelen
)
1880 * The file name is a variable length array. Allocate the FTSENT
1881 * structure and the file name in one chunk.
1883 len
= FLEXSIZEOF(FTSENT
, fts_name
, namelen
+ 1);
1884 if ((p
= malloc(len
)) == NULL
)
1887 /* Copy the name and guarantee NUL termination. */
1888 memcpy(p
->fts_name
, name
, namelen
);
1889 p
->fts_name
[namelen
] = '\0';
1891 p
->fts_namelen
= namelen
;
1893 p
->fts_path
= sp
->fts_path
;
1897 p
->fts_instr
= FTS_NOINSTR
;
1899 p
->fts_pointer
= NULL
;
1905 fts_lfree (register FTSENT
*head
)
1909 /* Free a linked list of structures. */
1910 while ((p
= head
)) {
1911 head
= head
->fts_link
;
1913 closedir (p
->fts_dirp
);
1919 * Allow essentially unlimited file name lengths; find, rm, ls should
1920 * all work on any tree. Most systems will allow creation of file
1921 * names much longer than MAXPATHLEN, even though the kernel won't
1922 * resolve them. Add the size (not just what's needed) plus 256 bytes
1923 * so we don't realloc the file name 2 bytes at a time.
1927 fts_palloc (FTS
*sp
, size_t more
)
1930 size_t new_len
= sp
->fts_pathlen
+ more
+ 256;
1933 * See if fts_pathlen would overflow.
1935 if (new_len
< sp
->fts_pathlen
) {
1937 sp
->fts_path
= NULL
;
1938 __set_errno (ENAMETOOLONG
);
1941 sp
->fts_pathlen
= new_len
;
1942 p
= realloc(sp
->fts_path
, sp
->fts_pathlen
);
1945 sp
->fts_path
= NULL
;
1953 * When the file name is realloc'd, have to fix all of the pointers in
1954 * structures already returned.
1958 fts_padjust (FTS
*sp
, FTSENT
*head
)
1961 char *addr
= sp
->fts_path
;
1963 #define ADJUST(p) do { \
1964 if ((p)->fts_accpath != (p)->fts_name) { \
1965 (p)->fts_accpath = \
1966 (char *)addr + ((p)->fts_accpath - (p)->fts_path); \
1968 (p)->fts_path = addr; \
1970 /* Adjust the current set of children. */
1971 for (p
= sp
->fts_child
; p
; p
= p
->fts_link
)
1974 /* Adjust the rest of the tree, including the current level. */
1975 for (p
= head
; p
->fts_level
>= FTS_ROOTLEVEL
;) {
1977 p
= p
->fts_link
? p
->fts_link
: p
->fts_parent
;
1982 internal_function _GL_ATTRIBUTE_PURE
1983 fts_maxarglen (char * const *argv
)
1987 for (max
= 0; *argv
; ++argv
)
1988 if ((len
= strlen(*argv
)) > max
)
1994 * Change to dir specified by fd or file name without getting
1995 * tricked by someone changing the world out from underneath us.
1996 * Assumes p->fts_statp->st_dev and p->fts_statp->st_ino are filled in.
1997 * If FD is non-negative, expect it to be used after this function returns,
1998 * and to be closed eventually. So don't pass e.g., 'dirfd(dirp)' and then
1999 * do closedir(dirp), because that would invalidate the saved FD.
2000 * Upon failure, close FD immediately and return nonzero.
2004 fts_safe_changedir (FTS
*sp
, FTSENT
*p
, int fd
, char const *dir
)
2007 bool is_dotdot
= dir
&& STREQ (dir
, "..");
2010 /* This clause handles the unusual case in which FTS_NOCHDIR
2011 is specified, along with FTS_CWDFD. In that case, there is
2012 no need to change even the virtual cwd file descriptor.
2013 However, if FD is non-negative, we do close it here. */
2014 if (ISSET (FTS_NOCHDIR
))
2016 if (ISSET (FTS_CWDFD
) && 0 <= fd
)
2021 if (fd
< 0 && is_dotdot
&& ISSET (FTS_CWDFD
))
2023 /* When possible, skip the diropen and subsequent fstat+dev/ino
2024 comparison. I.e., when changing to parent directory
2025 (chdir ("..")), use a file descriptor from the ring and
2026 save the overhead of diropen+fstat, as well as avoiding
2027 failure when we lack "x" access to the virtual cwd. */
2028 if ( ! i_ring_empty (&sp
->fts_fd_ring
))
2031 fd_ring_print (sp
, stderr
, "pre-pop");
2032 parent_fd
= i_ring_pop (&sp
->fts_fd_ring
);
2042 if (fd
< 0 && (newfd
= diropen (sp
, dir
)) < 0)
2045 /* The following dev/inode check is necessary if we're doing a
2046 "logical" traversal (through symlinks, a la chown -L), if the
2047 system lacks O_NOFOLLOW support, or if we're changing to ".."
2048 (but not via a popped file descriptor). When changing to the
2049 name "..", O_NOFOLLOW can't help. In general, when the target is
2050 not "..", diropen's use of O_NOFOLLOW ensures we don't mistakenly
2051 follow a symlink, so we can avoid the expense of this fstat. */
2052 if (ISSET(FTS_LOGICAL
) || ! HAVE_WORKING_O_NOFOLLOW
2053 || (dir
&& STREQ (dir
, "..")))
2056 if (fstat(newfd
, &sb
))
2061 if (p
->fts_statp
->st_dev
!= sb
.st_dev
2062 || p
->fts_statp
->st_ino
!= sb
.st_ino
)
2064 __set_errno (ENOENT
); /* disinformation */
2070 if (ISSET(FTS_CWDFD
))
2072 cwd_advance_fd (sp
, newfd
, ! is_dotdot
);
2076 ret
= fchdir(newfd
);
2082 __set_errno (oerrno
);