tests: fix false failure with spaces in $PWD
[coreutils.git] / src / du.c
blobcef8dacaf0ddac28f5d2fd45b2830596dbf81e5d
1 /* du -- summarize disk usage
2 Copyright (C) 1988-2016 Free Software Foundation, Inc.
4 This program is free software: you can redistribute it and/or modify
5 it under the terms of the GNU General Public License as published by
6 the Free Software Foundation, either version 3 of the License, or
7 (at your option) any later version.
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
14 You should have received a copy of the GNU General Public License
15 along with this program. If not, see <http://www.gnu.org/licenses/>. */
17 /* Differences from the Unix du:
18 * Doesn't simply ignore the names of regular files given as arguments
19 when -a is given.
21 By tege@sics.se, Torbjorn Granlund,
22 and djm@ai.mit.edu, David MacKenzie.
23 Variable blocks added by lm@sgi.com and eggert@twinsun.com.
24 Rewritten to use nftw, then to use fts by Jim Meyering. */
26 #include <config.h>
27 #include <getopt.h>
28 #include <sys/types.h>
29 #include <assert.h>
30 #include "system.h"
31 #include "argmatch.h"
32 #include "argv-iter.h"
33 #include "di-set.h"
34 #include "die.h"
35 #include "error.h"
36 #include "exclude.h"
37 #include "fprintftime.h"
38 #include "human.h"
39 #include "mountlist.h"
40 #include "quote.h"
41 #include "stat-size.h"
42 #include "stat-time.h"
43 #include "stdio--.h"
44 #include "xfts.h"
45 #include "xstrtol.h"
/* Defined outside this file; main sets it for the FTS_DEBUG option,
   which is only compiled in when DU_DEBUG is enabled.  */
extern bool fts_debug;

/* The official name of this program (e.g., no 'g' prefix).  */
#define PROGRAM_NAME "du"

#define AUTHORS \
  proper_name ("Torbjorn Granlund"), \
  proper_name ("David MacKenzie"), \
  proper_name ("Paul Eggert"), \
  proper_name ("Jim Meyering")

/* FTS_CROSS_CHECK (Fts) calls fts_cross_check in DU_DEBUG builds and
   expands to nothing otherwise.  */
#if !DU_DEBUG
# define FTS_CROSS_CHECK(Fts)
#else
# define FTS_CROSS_CHECK(Fts) fts_cross_check (Fts)
#endif

/* Set of dev/ino pairs used to recognize files and directories
   whose sizes have already been counted.  */
static struct di_set *di_files;

/* Set holding one dev/ino pair per local mount point directory.  */
static struct di_set *di_mnt;

/* The "level" (depth in the hierarchy) seen by the preceding call of
   process_file, carried over to the next call.  */
static size_t prev_level;
/* Totals collected for one directory (or one file).  */
struct duinfo
{
  /* Size of files in directory.  */
  uintmax_t size;

  /* Number of inodes in directory.  */
  uintmax_t inodes;

  /* Latest time stamp found.  The pair
     tmax.tv_sec == TYPE_MINIMUM (time_t) && tmax.tv_nsec < 0
     means that no time stamp has been found.  */
  struct timespec tmax;
};
89 /* Initialize directory data. */
90 static inline void
91 duinfo_init (struct duinfo *a)
93 a->size = 0;
94 a->inodes = 0;
95 a->tmax.tv_sec = TYPE_MINIMUM (time_t);
96 a->tmax.tv_nsec = -1;
99 /* Set directory data. */
100 static inline void
101 duinfo_set (struct duinfo *a, uintmax_t size, struct timespec tmax)
103 a->size = size;
104 a->inodes = 1;
105 a->tmax = tmax;
108 /* Accumulate directory data. */
109 static inline void
110 duinfo_add (struct duinfo *a, struct duinfo const *b)
112 uintmax_t sum = a->size + b->size;
113 a->size = a->size <= sum ? sum : UINTMAX_MAX;
114 a->inodes = a->inodes + b->inodes;
115 if (timespec_cmp (a->tmax, b->tmax) < 0)
116 a->tmax = b->tmax;
119 /* A structure for per-directory level information. */
120 struct dulevel
122 /* Entries in this directory. */
123 struct duinfo ent;
125 /* Total for subdirectories. */
126 struct duinfo subdir;
129 /* If true, display counts for all files, not just directories. */
130 static bool opt_all = false;
132 /* If true, rather than using the disk usage of each file,
133 use the apparent size (a la stat.st_size). */
134 static bool apparent_size = false;
136 /* If true, count each hard link of files with multiple links. */
137 static bool opt_count_all = false;
139 /* If true, hash all files to look for hard links. */
140 static bool hash_all;
142 /* If true, output the NUL byte instead of a newline at the end of each line. */
143 static bool opt_nul_terminate_output = false;
145 /* If true, print a grand total at the end. */
146 static bool print_grand_total = false;
148 /* If nonzero, do not add sizes of subdirectories. */
149 static bool opt_separate_dirs = false;
151 /* Show the total for each directory (and file if --all) that is at
152 most MAX_DEPTH levels down from the root of the hierarchy. The root
153 is at level 0, so 'du --max-depth=0' is equivalent to 'du -s'. */
154 static size_t max_depth = SIZE_MAX;
156 /* Only output entries with at least this SIZE if positive,
157 or at most if negative. See --threshold option. */
158 static intmax_t opt_threshold = 0;
160 /* Human-readable options for output. */
161 static int human_output_opts;
163 /* Output inodes count instead of blocks used. */
164 static bool opt_inodes = false;
166 /* If true, print most recently modified date, using the specified format. */
167 static bool opt_time = false;
169 /* Type of time to display. controlled by --time. */
171 enum time_type
173 time_mtime, /* default */
174 time_ctime,
175 time_atime
178 static enum time_type time_type = time_mtime;
180 /* User specified date / time style */
181 static char const *time_style = NULL;
183 /* Format used to display date / time. Controlled by --time-style */
184 static char const *time_format = NULL;
186 /* The local time zone rules, as per the TZ environment variable. */
187 static timezone_t localtz;
189 /* The units to use when printing sizes. */
190 static uintmax_t output_block_size;
192 /* File name patterns to exclude. */
193 static struct exclude *exclude;
195 /* Grand total size of all args, in bytes. Also latest modified date. */
196 static struct duinfo tot_dui;
/* True if the fts info value TYPE is FTS_DP or FTS_DNR.  */
#define IS_DIR_TYPE(Type) ((Type) == FTS_DP || (Type) == FTS_DNR)
/* Long options without a short equivalent are identified by
   pseudo short options: non-character values that start at
   CHAR_MAX + 1 so they cannot collide with a real option letter.  */
enum
{
  APPARENT_SIZE_OPTION = CHAR_MAX + 1,
  EXCLUDE_OPTION,
  FILES0_FROM_OPTION,
  HUMAN_SI_OPTION,
  FTS_DEBUG,
  TIME_OPTION,
  TIME_STYLE_OPTION,
  INODES_OPTION
};
216 static struct option const long_options[] =
218 {"all", no_argument, NULL, 'a'},
219 {"apparent-size", no_argument, NULL, APPARENT_SIZE_OPTION},
220 {"block-size", required_argument, NULL, 'B'},
221 {"bytes", no_argument, NULL, 'b'},
222 {"count-links", no_argument, NULL, 'l'},
223 /* {"-debug", no_argument, NULL, FTS_DEBUG}, */
224 {"dereference", no_argument, NULL, 'L'},
225 {"dereference-args", no_argument, NULL, 'D'},
226 {"exclude", required_argument, NULL, EXCLUDE_OPTION},
227 {"exclude-from", required_argument, NULL, 'X'},
228 {"files0-from", required_argument, NULL, FILES0_FROM_OPTION},
229 {"human-readable", no_argument, NULL, 'h'},
230 {"inodes", no_argument, NULL, INODES_OPTION},
231 {"si", no_argument, NULL, HUMAN_SI_OPTION},
232 {"max-depth", required_argument, NULL, 'd'},
233 {"null", no_argument, NULL, '0'},
234 {"no-dereference", no_argument, NULL, 'P'},
235 {"one-file-system", no_argument, NULL, 'x'},
236 {"separate-dirs", no_argument, NULL, 'S'},
237 {"summarize", no_argument, NULL, 's'},
238 {"total", no_argument, NULL, 'c'},
239 {"threshold", required_argument, NULL, 't'},
240 {"time", optional_argument, NULL, TIME_OPTION},
241 {"time-style", required_argument, NULL, TIME_STYLE_OPTION},
242 {GETOPT_HELP_OPTION_DECL},
243 {GETOPT_VERSION_OPTION_DECL},
244 {NULL, 0, NULL, 0}
247 static char const *const time_args[] =
249 "atime", "access", "use", "ctime", "status", NULL
251 static enum time_type const time_types[] =
253 time_atime, time_atime, time_atime, time_ctime, time_ctime
255 ARGMATCH_VERIFY (time_args, time_types);
257 /* 'full-iso' uses full ISO-style dates and times. 'long-iso' uses longer
258 ISO-style time stamps, though shorter than 'full-iso'. 'iso' uses shorter
259 ISO-style time stamps. */
260 enum time_style
262 full_iso_time_style, /* --time-style=full-iso */
263 long_iso_time_style, /* --time-style=long-iso */
264 iso_time_style /* --time-style=iso */
267 static char const *const time_style_args[] =
269 "full-iso", "long-iso", "iso", NULL
271 static enum time_style const time_style_types[] =
273 full_iso_time_style, long_iso_time_style, iso_time_style
275 ARGMATCH_VERIFY (time_style_args, time_style_types);
/* Print usage information and call exit (STATUS).
   When STATUS is not EXIT_SUCCESS only emit_try_help () is called.
   Otherwise the synopsis and the option descriptions are written to
   stdout with printf/fputs, followed by the output of the emit_*
   helper calls.
   NOTE(review): the line numbers embedded in this listing skip 298 and
   322 inside the help strings, and the column alignment inside the
   string literals looks collapsed -- presumably artifacts of how the
   listing was extracted.  Confirm the exact help text against the
   upstream file before relying on it.  */
277 void
278 usage (int status)
280 if (status != EXIT_SUCCESS)
281 emit_try_help ();
282 else
284 printf (_("\
285 Usage: %s [OPTION]... [FILE]...\n\
286 or: %s [OPTION]... --files0-from=F\n\
287 "), program_name, program_name);
288 fputs (_("\
289 Summarize disk usage of the set of FILEs, recursively for directories.\n\
290 "), stdout);
292 emit_mandatory_arg_note ();
294 fputs (_("\
295 -0, --null end each output line with NUL, not newline\n\
296 -a, --all write counts for all files, not just directories\n\
297 --apparent-size print apparent sizes, rather than disk usage; although\
299 the apparent size is usually smaller, it may be\n\
300 larger due to holes in ('sparse') files, internal\n\
301 fragmentation, indirect blocks, and the like\n\
302 "), stdout);
303 fputs (_("\
304 -B, --block-size=SIZE scale sizes by SIZE before printing them; e.g.,\n\
305 '-BM' prints sizes in units of 1,048,576 bytes;\n\
306 see SIZE format below\n\
307 -b, --bytes equivalent to '--apparent-size --block-size=1'\n\
308 -c, --total produce a grand total\n\
309 -D, --dereference-args dereference only symlinks that are listed on the\n\
310 command line\n\
311 -d, --max-depth=N print the total for a directory (or file, with --all)\n\
312 only if it is N or fewer levels below the command\n\
313 line argument; --max-depth=0 is the same as\n\
314 --summarize\n\
315 "), stdout);
316 fputs (_("\
317 --files0-from=F summarize disk usage of the\n\
318 NUL-terminated file names specified in file F;\n\
319 if F is -, then read names from standard input\n\
320 -H equivalent to --dereference-args (-D)\n\
321 -h, --human-readable print sizes in human readable format (e.g., 1K 234M 2G)\
323 --inodes list inode usage information instead of block usage\n\
324 "), stdout);
325 fputs (_("\
326 -k like --block-size=1K\n\
327 -L, --dereference dereference all symbolic links\n\
328 -l, --count-links count sizes many times if hard linked\n\
329 -m like --block-size=1M\n\
330 "), stdout);
331 fputs (_("\
332 -P, --no-dereference don't follow any symbolic links (this is the default)\n\
333 -S, --separate-dirs for directories do not include size of subdirectories\n\
334 --si like -h, but use powers of 1000 not 1024\n\
335 -s, --summarize display only a total for each argument\n\
336 "), stdout);
337 fputs (_("\
338 -t, --threshold=SIZE exclude entries smaller than SIZE if positive,\n\
339 or entries greater than SIZE if negative\n\
340 --time show time of the last modification of any file in the\n\
341 directory, or any of its subdirectories\n\
342 --time=WORD show time as WORD instead of modification time:\n\
343 atime, access, use, ctime or status\n\
344 --time-style=STYLE show times using STYLE, which can be:\n\
345 full-iso, long-iso, iso, or +FORMAT;\n\
346 FORMAT is interpreted like in 'date'\n\
347 "), stdout);
348 fputs (_("\
349 -X, --exclude-from=FILE exclude files that match any pattern in FILE\n\
350 --exclude=PATTERN exclude files that match PATTERN\n\
351 -x, --one-file-system skip directories on different file systems\n\
352 "), stdout);
353 fputs (HELP_OPTION_DESCRIPTION, stdout);
354 fputs (VERSION_OPTION_DESCRIPTION, stdout);
355 emit_blocksize_note ("DU");
356 emit_size_note ();
357 emit_ancillary_info (PROGRAM_NAME);
359 exit (status);
/* Try to insert the INO/DEV pair into DI_SET.
   Return true if the pair was newly inserted and false if it was
   already present.  A negative result from di_set_insert is treated
   as memory exhaustion and handled by xalloc_die.  */
static bool
hash_ins (struct di_set *di_set, ino_t ino, dev_t dev)
{
  int rc = di_set_insert (di_set, dev, ino);

  if (rc < 0)
    xalloc_die ();

  return rc != 0;
}
374 /* FIXME: this code is nearly identical to code in date.c */
375 /* Display the date and time in WHEN according to the format specified
376 in FORMAT. */
378 static void
379 show_date (const char *format, struct timespec when, timezone_t tz)
381 struct tm tm;
382 if (localtime_rz (tz, &when.tv_sec, &tm))
383 fprintftime (stdout, format, &tm, tz, when.tv_nsec);
384 else
386 char buf[INT_BUFSIZE_BOUND (intmax_t)];
387 char *when_str = timetostr (when.tv_sec, buf);
388 error (0, 0, _("time %s is out of range"), quote (when_str));
389 fputs (when_str, stdout);
393 /* Print N_BYTES. Convert it to a readable value before printing. */
395 static void
396 print_only_size (uintmax_t n_bytes)
398 char buf[LONGEST_HUMAN_READABLE + 1];
399 fputs ((n_bytes == UINTMAX_MAX
400 ? _("Infinity")
401 : human_readable (n_bytes, buf, human_output_opts,
402 1, output_block_size)),
403 stdout);
406 /* Print size (and optionally time) indicated by *PDUI, followed by STRING. */
408 static void
409 print_size (const struct duinfo *pdui, const char *string)
411 print_only_size (opt_inodes
412 ? pdui->inodes
413 : pdui->size);
415 if (opt_time)
417 putchar ('\t');
418 show_date (time_format, pdui->tmax, localtz);
420 printf ("\t%s%c", string, opt_nul_terminate_output ? '\0' : '\n');
421 fflush (stdout);
424 /* Fill the di_mnt set with local mount point dev/ino pairs. */
426 static void
427 fill_mount_table (void)
429 struct mount_entry *mnt_ent = read_file_system_list (false);
430 while (mnt_ent)
432 struct mount_entry *mnt_free;
433 if (!mnt_ent->me_remote && !mnt_ent->me_dummy)
435 struct stat buf;
436 if (!stat (mnt_ent->me_mountdir, &buf))
437 hash_ins (di_mnt, buf.st_ino, buf.st_dev);
438 else
440 /* Ignore stat failure. False positives are too common.
441 E.g., "Permission denied" on /run/user/<name>/gvfs. */
445 mnt_free = mnt_ent;
446 mnt_ent = mnt_ent->me_next;
447 free_mount_entry (mnt_free);
451 /* This function checks whether any of the directories in the cycle that
452 fts detected is a mount point. */
454 static bool
455 mount_point_in_fts_cycle (FTSENT const *ent)
457 FTSENT const *cycle_ent = ent->fts_cycle;
459 if (!di_mnt)
461 /* Initialize the set of dev,inode pairs. */
462 di_mnt = di_set_alloc ();
463 if (!di_mnt)
464 xalloc_die ();
466 fill_mount_table ();
469 while (ent && ent != cycle_ent)
471 if (di_set_lookup (di_mnt, ent->fts_statp->st_dev,
472 ent->fts_statp->st_ino) > 0)
474 return true;
476 ent = ent->fts_parent;
479 return false;
482 /* This function is called once for every file system object that fts
483 encounters. fts does a depth-first traversal. This function knows
484 that and accumulates per-directory totals based on changes in
485 the depth of the current entry. It returns true on success. */
487 static bool
488 process_file (FTS *fts, FTSENT *ent)
490 bool ok = true;
491 struct duinfo dui;
492 struct duinfo dui_to_print;
493 size_t level;
494 static size_t n_alloc;
495 /* First element of the structure contains:
496 The sum of the st_size values of all entries in the single directory
497 at the corresponding level. Although this does include the st_size
498 corresponding to each subdirectory, it does not include the size of
499 any file in a subdirectory. Also corresponding last modified date.
500 Second element of the structure contains:
501 The sum of the sizes of all entries in the hierarchy at or below the
502 directory at the specified level. */
503 static struct dulevel *dulvl;
505 const char *file = ent->fts_path;
506 const struct stat *sb = ent->fts_statp;
507 int info = ent->fts_info;
509 if (info == FTS_DNR)
511 /* An error occurred, but the size is known, so count it. */
512 error (0, ent->fts_errno, _("cannot read directory %s"), quoteaf (file));
513 ok = false;
515 else if (info != FTS_DP)
517 bool excluded = excluded_file_name (exclude, file);
518 if (! excluded)
520 /* Make the stat buffer *SB valid, or fail noisily. */
522 if (info == FTS_NSOK)
524 fts_set (fts, ent, FTS_AGAIN);
525 FTSENT const *e = fts_read (fts);
526 assert (e == ent);
527 info = ent->fts_info;
530 if (info == FTS_NS || info == FTS_SLNONE)
532 error (0, ent->fts_errno, _("cannot access %s"), quoteaf (file));
533 return false;
536 /* The --one-file-system (-x) option cannot exclude anything
537 specified on the command-line. By definition, it can exclude
538 a file or directory only when its device number is different
539 from that of its just-processed parent directory, and du does
540 not process the parent of a command-line argument. */
541 if (fts->fts_options & FTS_XDEV
542 && FTS_ROOTLEVEL < ent->fts_level
543 && fts->fts_dev != sb->st_dev)
544 excluded = true;
547 if (excluded
548 || (! opt_count_all
549 && (hash_all || (! S_ISDIR (sb->st_mode) && 1 < sb->st_nlink))
550 && ! hash_ins (di_files, sb->st_ino, sb->st_dev)))
552 /* If ignoring a directory in preorder, skip its children.
553 Ignore the next fts_read output too, as it's a postorder
554 visit to the same directory. */
555 if (info == FTS_D)
557 fts_set (fts, ent, FTS_SKIP);
558 FTSENT const *e = fts_read (fts);
559 assert (e == ent);
562 return true;
565 switch (info)
567 case FTS_D:
568 return true;
570 case FTS_ERR:
571 /* An error occurred, but the size is known, so count it. */
572 error (0, ent->fts_errno, "%s", quotef (file));
573 ok = false;
574 break;
576 case FTS_DC:
577 /* If not following symlinks and not a (bind) mount point. */
578 if (cycle_warning_required (fts, ent)
579 && ! mount_point_in_fts_cycle (ent))
581 emit_cycle_warning (file);
582 return false;
584 return true;
588 duinfo_set (&dui,
589 (apparent_size
590 ? MAX (0, sb->st_size)
591 : (uintmax_t) ST_NBLOCKS (*sb) * ST_NBLOCKSIZE),
592 (time_type == time_mtime ? get_stat_mtime (sb)
593 : time_type == time_atime ? get_stat_atime (sb)
594 : get_stat_ctime (sb)));
596 level = ent->fts_level;
597 dui_to_print = dui;
599 if (n_alloc == 0)
601 n_alloc = level + 10;
602 dulvl = xcalloc (n_alloc, sizeof *dulvl);
604 else
606 if (level == prev_level)
608 /* This is usually the most common case. Do nothing. */
610 else if (level > prev_level)
612 /* Descending the hierarchy.
613 Clear the accumulators for *all* levels between prev_level
614 and the current one. The depth may change dramatically,
615 e.g., from 1 to 10. */
616 size_t i;
618 if (n_alloc <= level)
620 dulvl = xnrealloc (dulvl, level, 2 * sizeof *dulvl);
621 n_alloc = level * 2;
624 for (i = prev_level + 1; i <= level; i++)
626 duinfo_init (&dulvl[i].ent);
627 duinfo_init (&dulvl[i].subdir);
630 else /* level < prev_level */
632 /* Ascending the hierarchy.
633 Process a directory only after all entries in that
634 directory have been processed. When the depth decreases,
635 propagate sums from the children (prev_level) to the parent.
636 Here, the current level is always one smaller than the
637 previous one. */
638 assert (level == prev_level - 1);
639 duinfo_add (&dui_to_print, &dulvl[prev_level].ent);
640 if (!opt_separate_dirs)
641 duinfo_add (&dui_to_print, &dulvl[prev_level].subdir);
642 duinfo_add (&dulvl[level].subdir, &dulvl[prev_level].ent);
643 duinfo_add (&dulvl[level].subdir, &dulvl[prev_level].subdir);
647 prev_level = level;
649 /* Let the size of a directory entry contribute to the total for the
650 containing directory, unless --separate-dirs (-S) is specified. */
651 if (! (opt_separate_dirs && IS_DIR_TYPE (info)))
652 duinfo_add (&dulvl[level].ent, &dui);
654 /* Even if this directory is unreadable or we can't chdir into it,
655 do let its size contribute to the total. */
656 duinfo_add (&tot_dui, &dui);
658 if ((IS_DIR_TYPE (info) && level <= max_depth)
659 || (opt_all && level <= max_depth)
660 || level == 0)
662 /* Print or elide this entry according to the --threshold option. */
663 uintmax_t v = opt_inodes ? dui_to_print.inodes : dui_to_print.size;
664 if (opt_threshold < 0
665 ? v <= -opt_threshold
666 : v >= opt_threshold)
667 print_size (&dui_to_print, file);
670 return ok;
673 /* Recursively print the sizes of the directories (and, if selected, files)
674 named in FILES, the last entry of which is NULL.
675 BIT_FLAGS controls how fts works.
676 Return true if successful. */
678 static bool
679 du_files (char **files, int bit_flags)
681 bool ok = true;
683 if (*files)
685 FTS *fts = xfts_open (files, bit_flags, NULL);
687 while (1)
689 FTSENT *ent;
691 ent = fts_read (fts);
692 if (ent == NULL)
694 if (errno != 0)
696 error (0, errno, _("fts_read failed: %s"),
697 quotef (fts->fts_path));
698 ok = false;
701 /* When exiting this loop early, be careful to reset the
702 global, prev_level, used in process_file. Otherwise, its
703 (level == prev_level - 1) assertion could fail. */
704 prev_level = 0;
705 break;
707 FTS_CROSS_CHECK (fts);
709 ok &= process_file (fts, ent);
712 if (fts_close (fts) != 0)
714 error (0, errno, _("fts_close failed"));
715 ok = false;
719 return ok;
723 main (int argc, char **argv)
725 char *cwd_only[2];
726 bool max_depth_specified = false;
727 bool ok = true;
728 char *files_from = NULL;
730 /* Bit flags that control how fts works. */
731 int bit_flags = FTS_NOSTAT;
733 /* Select one of the three FTS_ options that control if/when
734 to follow a symlink. */
735 int symlink_deref_bits = FTS_PHYSICAL;
737 /* If true, display only a total for each argument. */
738 bool opt_summarize_only = false;
740 cwd_only[0] = bad_cast (".");
741 cwd_only[1] = NULL;
743 initialize_main (&argc, &argv);
744 set_program_name (argv[0]);
745 setlocale (LC_ALL, "");
746 bindtextdomain (PACKAGE, LOCALEDIR);
747 textdomain (PACKAGE);
749 atexit (close_stdout);
751 exclude = new_exclude ();
753 human_options (getenv ("DU_BLOCK_SIZE"),
754 &human_output_opts, &output_block_size);
756 while (true)
758 int oi = -1;
759 int c = getopt_long (argc, argv, "0abd:chHklmst:xB:DLPSX:",
760 long_options, &oi);
761 if (c == -1)
762 break;
764 switch (c)
766 #if DU_DEBUG
767 case FTS_DEBUG:
768 fts_debug = true;
769 break;
770 #endif
772 case '0':
773 opt_nul_terminate_output = true;
774 break;
776 case 'a':
777 opt_all = true;
778 break;
780 case APPARENT_SIZE_OPTION:
781 apparent_size = true;
782 break;
784 case 'b':
785 apparent_size = true;
786 human_output_opts = 0;
787 output_block_size = 1;
788 break;
790 case 'c':
791 print_grand_total = true;
792 break;
794 case 'h':
795 human_output_opts = human_autoscale | human_SI | human_base_1024;
796 output_block_size = 1;
797 break;
799 case HUMAN_SI_OPTION:
800 human_output_opts = human_autoscale | human_SI;
801 output_block_size = 1;
802 break;
804 case 'k':
805 human_output_opts = 0;
806 output_block_size = 1024;
807 break;
809 case 'd': /* --max-depth=N */
811 unsigned long int tmp_ulong;
812 if (xstrtoul (optarg, NULL, 0, &tmp_ulong, NULL) == LONGINT_OK
813 && tmp_ulong <= SIZE_MAX)
815 max_depth_specified = true;
816 max_depth = tmp_ulong;
818 else
820 error (0, 0, _("invalid maximum depth %s"),
821 quote (optarg));
822 ok = false;
825 break;
827 case 'm':
828 human_output_opts = 0;
829 output_block_size = 1024 * 1024;
830 break;
832 case 'l':
833 opt_count_all = true;
834 break;
836 case 's':
837 opt_summarize_only = true;
838 break;
840 case 't':
842 enum strtol_error e;
843 e = xstrtoimax (optarg, NULL, 0, &opt_threshold, "kKmMGTPEZY0");
844 if (e != LONGINT_OK)
845 xstrtol_fatal (e, oi, c, long_options, optarg);
846 if (opt_threshold == 0 && *optarg == '-')
848 /* Do not allow -0, as this wouldn't make sense anyway. */
849 die (EXIT_FAILURE, 0, _("invalid --threshold argument '-0'"));
852 break;
854 case 'x':
855 bit_flags |= FTS_XDEV;
856 break;
858 case 'B':
860 enum strtol_error e = human_options (optarg, &human_output_opts,
861 &output_block_size);
862 if (e != LONGINT_OK)
863 xstrtol_fatal (e, oi, c, long_options, optarg);
865 break;
867 case 'H': /* NOTE: before 2008-12, -H was equivalent to --si. */
868 case 'D':
869 symlink_deref_bits = FTS_COMFOLLOW | FTS_PHYSICAL;
870 break;
872 case 'L': /* --dereference */
873 symlink_deref_bits = FTS_LOGICAL;
874 break;
876 case 'P': /* --no-dereference */
877 symlink_deref_bits = FTS_PHYSICAL;
878 break;
880 case 'S':
881 opt_separate_dirs = true;
882 break;
884 case 'X':
885 if (add_exclude_file (add_exclude, exclude, optarg,
886 EXCLUDE_WILDCARDS, '\n'))
888 error (0, errno, "%s", quotef (optarg));
889 ok = false;
891 break;
893 case FILES0_FROM_OPTION:
894 files_from = optarg;
895 break;
897 case EXCLUDE_OPTION:
898 add_exclude (exclude, optarg, EXCLUDE_WILDCARDS);
899 break;
901 case INODES_OPTION:
902 opt_inodes = true;
903 break;
905 case TIME_OPTION:
906 opt_time = true;
907 time_type =
908 (optarg
909 ? XARGMATCH ("--time", optarg, time_args, time_types)
910 : time_mtime);
911 localtz = tzalloc (getenv ("TZ"));
912 break;
914 case TIME_STYLE_OPTION:
915 time_style = optarg;
916 break;
918 case_GETOPT_HELP_CHAR;
920 case_GETOPT_VERSION_CHAR (PROGRAM_NAME, AUTHORS);
922 default:
923 ok = false;
927 if (!ok)
928 usage (EXIT_FAILURE);
930 if (opt_all && opt_summarize_only)
932 error (0, 0, _("cannot both summarize and show all entries"));
933 usage (EXIT_FAILURE);
936 if (opt_summarize_only && max_depth_specified && max_depth == 0)
938 error (0, 0,
939 _("warning: summarizing is the same as using --max-depth=0"));
942 if (opt_summarize_only && max_depth_specified && max_depth != 0)
944 unsigned long int d = max_depth;
945 error (0, 0, _("warning: summarizing conflicts with --max-depth=%lu"), d);
946 usage (EXIT_FAILURE);
949 if (opt_summarize_only)
950 max_depth = 0;
952 if (opt_inodes)
954 if (apparent_size)
956 error (0, 0, _("warning: options --apparent-size and -b are "
957 "ineffective with --inodes"));
959 output_block_size = 1;
962 /* Process time style if printing last times. */
963 if (opt_time)
965 if (! time_style)
967 time_style = getenv ("TIME_STYLE");
969 /* Ignore TIMESTYLE="locale", for compatibility with ls. */
970 if (! time_style || STREQ (time_style, "locale"))
971 time_style = "long-iso";
972 else if (*time_style == '+')
974 /* Ignore anything after a newline, for compatibility
975 with ls. */
976 char *p = strchr (time_style, '\n');
977 if (p)
978 *p = '\0';
980 else
982 /* Ignore "posix-" prefix, for compatibility with ls. */
983 static char const posix_prefix[] = "posix-";
984 static const size_t prefix_len = sizeof posix_prefix - 1;
985 while (STREQ_LEN (time_style, posix_prefix, prefix_len))
986 time_style += prefix_len;
990 if (*time_style == '+')
991 time_format = time_style + 1;
992 else
994 switch (XARGMATCH ("time style", time_style,
995 time_style_args, time_style_types))
997 case full_iso_time_style:
998 time_format = "%Y-%m-%d %H:%M:%S.%N %z";
999 break;
1001 case long_iso_time_style:
1002 time_format = "%Y-%m-%d %H:%M";
1003 break;
1005 case iso_time_style:
1006 time_format = "%Y-%m-%d";
1007 break;
1012 struct argv_iterator *ai;
1013 if (files_from)
1015 /* When using --files0-from=F, you may not specify any files
1016 on the command-line. */
1017 if (optind < argc)
1019 error (0, 0, _("extra operand %s"), quote (argv[optind]));
1020 fprintf (stderr, "%s\n",
1021 _("file operands cannot be combined with --files0-from"));
1022 usage (EXIT_FAILURE);
1025 if (! (STREQ (files_from, "-") || freopen (files_from, "r", stdin)))
1026 die (EXIT_FAILURE, errno, _("cannot open %s for reading"),
1027 quoteaf (files_from));
1029 ai = argv_iter_init_stream (stdin);
1031 /* It's not easy here to count the arguments, so assume the
1032 worst. */
1033 hash_all = true;
1035 else
1037 char **files = (optind < argc ? argv + optind : cwd_only);
1038 ai = argv_iter_init_argv (files);
1040 /* Hash all dev,ino pairs if there are multiple arguments, or if
1041 following non-command-line symlinks, because in either case a
1042 file with just one hard link might be seen more than once. */
1043 hash_all = (optind + 1 < argc || symlink_deref_bits == FTS_LOGICAL);
1046 if (!ai)
1047 xalloc_die ();
1049 /* Initialize the set of dev,inode pairs. */
1050 di_files = di_set_alloc ();
1051 if (!di_files)
1052 xalloc_die ();
1054 /* If not hashing everything, process_file won't find cycles on its
1055 own, so ask fts_read to check for them accurately. */
1056 if (opt_count_all || ! hash_all)
1057 bit_flags |= FTS_TIGHT_CYCLE_CHECK;
1059 bit_flags |= symlink_deref_bits;
1060 static char *temp_argv[] = { NULL, NULL };
1062 while (true)
1064 bool skip_file = false;
1065 enum argv_iter_err ai_err;
1066 char *file_name = argv_iter (ai, &ai_err);
1067 if (!file_name)
1069 switch (ai_err)
1071 case AI_ERR_EOF:
1072 goto argv_iter_done;
1073 case AI_ERR_READ:
1074 error (0, errno, _("%s: read error"),
1075 quotef (files_from));
1076 ok = false;
1077 goto argv_iter_done;
1078 case AI_ERR_MEM:
1079 xalloc_die ();
1080 default:
1081 assert (!"unexpected error code from argv_iter");
1084 if (files_from && STREQ (files_from, "-") && STREQ (file_name, "-"))
1086 /* Give a better diagnostic in an unusual case:
1087 printf - | du --files0-from=- */
1088 error (0, 0, _("when reading file names from stdin, "
1089 "no file name of %s allowed"),
1090 quoteaf (file_name));
1091 skip_file = true;
1094 /* Report and skip any empty file names before invoking fts.
1095 This works around a glitch in fts, which fails immediately
1096 (without looking at the other file names) when given an empty
1097 file name. */
1098 if (!file_name[0])
1100 /* Diagnose a zero-length file name. When it's one
1101 among many, knowing the record number may help.
1102 FIXME: currently print the record number only with
1103 --files0-from=FILE. Maybe do it for argv, too? */
1104 if (files_from == NULL)
1105 error (0, 0, "%s", _("invalid zero-length file name"));
1106 else
1108 /* Using the standard 'filename:line-number:' prefix here is
1109 not totally appropriate, since NUL is the separator, not NL,
1110 but it might be better than nothing. */
1111 unsigned long int file_number = argv_iter_n_args (ai);
1112 error (0, 0, "%s:%lu: %s", quotef (files_from),
1113 file_number, _("invalid zero-length file name"));
1115 skip_file = true;
1118 if (skip_file)
1119 ok = false;
1120 else
1122 temp_argv[0] = file_name;
1123 ok &= du_files (temp_argv, bit_flags);
1126 argv_iter_done:
1128 argv_iter_free (ai);
1129 di_set_free (di_files);
1130 if (di_mnt)
1131 di_set_free (di_mnt);
1133 if (files_from && (ferror (stdin) || fclose (stdin) != 0) && ok)
1134 die (EXIT_FAILURE, 0, _("error reading %s"), quoteaf (files_from));
1136 if (print_grand_total)
1137 print_size (&tot_dui, _("total"));
1139 return ok ? EXIT_SUCCESS : EXIT_FAILURE;