1 /* locate -- search databases for filenames that match patterns
2 Copyright (C) 1994, 1996, 1998, 1999, 2000, 2003,
3 2004, 2005 Free Software Foundation, Inc.
5 This program is free software; you can redistribute it and/or modify
6 it under the terms of the GNU General Public License as published by
7 the Free Software Foundation; either version 2, or (at your option)
10 This program is distributed in the hope that it will be useful,
11 but WITHOUT ANY WARRANTY; without even the implied warranty of
12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 GNU General Public License for more details.
15 You should have received a copy of the GNU General Public License
16 along with this program; if not, write to the Free Software
17 Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301,
21 /* Usage: locate [options] pattern...
23 Scan a pathname list for the full pathname of a file, given only
24 a piece of the name (possibly containing shell globbing metacharacters).
25 The list has been processed with front-compression, which reduces
26 the list size by a factor of 4-5.
27 Recognizes two database formats, old and new. The old format is
28 bigram coded, which reduces space by a further 20-25% and uses the
29 following encoding of the database bytes:
31 0-28 likeliest differential counts + offset (14) to make nonnegative
32 30 escape code for out-of-range count to follow in next halfword
33 128-255 bigram codes (the 128 most common, as determined by `updatedb')
34 32-127 single character (printable) ASCII remainder
36 Earlier versions of GNU locate used to use a novel two-tiered
37 string search technique, which was described in Usenix ;login:, Vol
38 8, No 1, February/March, 1983, p. 8.
40 However, latterly code changes to provide additional functionality
41 became difficult to make with the existing reading scheme, and so
42 we no longer perform the matching as efficiently as we used to (that is,
43 we no longer use the same algorithm).
45 The old algorithm was:
47 First, match a metacharacter-free subpattern and a partial
48 pathname BACKWARDS to avoid full expansion of the pathname list.
49 The time savings is 40-50% over forward matching, which cannot
50 efficiently handle overlapped search patterns and compressed
53 Then, match the actual shell glob pattern (if in this form)
54 against the candidate pathnames using the slower shell filename
58 Written by James A. Woods <jwoods@adobe.com>.
59 Modified by David MacKenzie <djm@gnu.org>.
60 Additional work by James Youngman and Bas van Gompel.
67 #include <sys/types.h>
74 /* The presence of unistd.h is assumed by gnulib these days, so we
75 * might as well assume it too.
77 /* We need <unistd.h> for isatty(). */
88 #if defined(HAVE_STRING_H) || defined(STDC_HEADERS)
110 # include <libintl.h>
111 # define _(Text) gettext (Text)
113 # define _(Text) Text
114 #define textdomain(Domain)
115 #define bindtextdomain(Package, Directory)
118 # define N_(String) gettext_noop (String)
120 /* We used to use (String) instead of just String, but apparently ISO C
121 * doesn't allow this (at least, that's what HP said when someone reported
122 * this as a compiler bug). This is HP case number 1205608192. See
123 * also http://gcc.gnu.org/bugzilla/show_bug.cgi?id=11250 (which references
124 * ANSI 3.5.7p14-15). The Intel icc compiler also rejects constructs
125 * like: static const char buf[] = ("string");
127 # define N_(String) String
130 #include "locatedb.h"
132 #include "../gnulib/lib/xalloc.h"
133 #include "../gnulib/lib/error.h"
134 #include "../gnulib/lib/human.h"
136 #include "closeout.h"
137 #include "nextelem.h"
140 #include "quotearg.h"
141 #include "printquoted.h"
142 #include "regextype.h"
145 /* Note that this may evaluate Ch more than once. */
147 # define TOUPPER(Ch) toupper (Ch)
148 # define TOLOWER(Ch) tolower (Ch)
150 # define TOUPPER(Ch) (islower (Ch) ? toupper (Ch) : (Ch))
151 # define TOLOWER(Ch) (isupper (Ch) ? tolower (Ch) : (Ch))
154 /* typedef enum {false, true} boolean; */
156 /* Warn if a database is older than this. 8 days allows for a weekly
157 update that takes up to a day to perform. */
158 #define WARN_NUMBER_UNITS (8)
159 /* Printable name of units used in WARN_SECONDS */
160 static const char warn_name_units
[] = N_("days");
161 #define SECONDS_PER_UNIT (60 * 60 * 24)
163 #define WARN_SECONDS ((SECONDS_PER_UNIT) * (WARN_NUMBER_UNITS))
167 VISIT_CONTINUE
= 1, /* please call the next visitor */
168 VISIT_ACCEPTED
= 2, /* accepted, call no further callbacks for this file */
169 VISIT_REJECTED
= 4, /* rejected, process next file. */
170 VISIT_ABORT
= 8 /* rejected, process no more files. */
173 enum ExistenceCheckType
175 ACCEPT_EITHER
, /* Corresponds to lack of -E/-e option */
176 ACCEPT_EXISTING
, /* Corresponds to option -e */
177 ACCEPT_NON_EXISTING
/* Corresponds to option -E */
180 /* Check for existence of files before printing them out? */
181 enum ExistenceCheckType check_existence
= ACCEPT_EITHER
;
183 static int follow_symlinks
= 1;
185 /* What to separate the results with. */
186 static int separator
= '\n';
188 static struct quoting_options
* quote_opts
= NULL
;
189 static bool stdout_is_a_tty
;
190 static bool print_quoted_filename
;
193 static char* slocate_db_pathname
= "/var/lib/slocate/slocate.db";
195 static const char *selected_secure_db
= NULL
;
198 /* Read in a 16-bit int, high byte first (network byte order). */
206 x
= (signed char) fgetc (fp
) << 8;
207 x
|= (fgetc (fp
) & 0xff);
211 const char * const metacharacters
= "*?[]\\";
213 /* Return nonzero if S contains any shell glob characters.
216 contains_metacharacter(const char *s
)
218 if (NULL
== strpbrk(s
, metacharacters
))
226 * Read bytes from FP into the buffer at offset OFFSET in (*BUF),
227 * until we reach DELIMITER or end-of-file. We reallocate the buffer
228 * as necessary, altering (*BUF) and (*SIZ) as appropriate. No assumption
229 * is made regarding the content of the data (i.e. the implementation is
230 * 8-bit clean, the only delimiter is DELIMITER).
232 * Written Fri May 23 18:41:16 2003 by James Youngman, because getstr()
233 * has been removed from gnulib.
235 * We call the function locate_read_str() to avoid a name clash with the curses
239 locate_read_str(char **buf
, size_t *siz
, FILE *fp
, int delimiter
, int offs
)
246 nread
= getdelim(&p
, &sz
, delimiter
, fp
);
251 needed
= offs
+ nread
+ 1u;
254 char *pnew
= realloc(*buf
, needed
);
257 return -1; /* FAIL */
265 memcpy((*buf
)+offs
, p
, nread
);
273 lc_strcpy(char *dest
, const char *src
)
277 *dest
++ = TOLOWER(*src
);
286 uintmax_t items_accepted
;
288 static struct locate_limits limits
;
293 uintmax_t compressed_bytes
;
294 uintmax_t total_filename_count
;
295 uintmax_t total_filename_length
;
296 uintmax_t whitespace_count
;
297 uintmax_t newline_count
;
298 uintmax_t highbit_filename_count
;
300 static struct locate_stats statistics
;
309 static struct stringbuf casebuf
;
315 struct stringbuf
*pbuf
;
318 struct regular_expression
320 struct re_pattern_buffer regex
; /* for --regex */
326 int c
; /* An input byte. */
327 char itemcount
; /* Indicates we're at the beginning of an slocate db. */
328 int count
; /* The length of the prefix shared with the previous database entry. */
330 char *original_filename
; /* The current input database entry. */
331 size_t pathsize
; /* Amount allocated for it. */
332 char *munged_filename
; /* path or base_name(path) */
333 FILE *fp
; /* The pathname database. */
334 const char *dbfile
; /* Its name, or "<stdin>" */
335 int slocatedb_format
; /* Allows us to cope with slocate's format variant */
336 /* for the old database format,
337 the first and second characters of the most common bigrams. */
343 typedef int (*visitfunc
)(struct process_data
*procdata
,
350 struct visitor
*next
;
354 static struct visitor
*inspectors
= NULL
;
355 static struct visitor
*lastinspector
= NULL
;
356 static struct visitor
*past_pat_inspector
= NULL
;
358 /* 0 or 1 pattern(s) */
360 process_simple(struct process_data
*procdata
)
362 int result
= VISIT_CONTINUE
;
363 const struct visitor
*p
= inspectors
;
365 while ( ((VISIT_CONTINUE
| VISIT_ACCEPTED
) & result
) && (NULL
!= p
) )
367 result
= (p
->inspector
)(procdata
, p
->context
);
374 /* Accept if any pattern matches. */
376 process_or (struct process_data
*procdata
)
378 int result
= VISIT_CONTINUE
;
379 const struct visitor
*p
= inspectors
;
381 while ( ((VISIT_CONTINUE
| VISIT_REJECTED
) & result
) && (past_pat_inspector
!= p
) )
383 result
= (p
->inspector
)(procdata
, p
->context
);
387 if (result
== VISIT_CONTINUE
)
388 result
= VISIT_REJECTED
;
389 if (result
& (VISIT_ABORT
| VISIT_REJECTED
))
392 p
= past_pat_inspector
;
393 result
= VISIT_CONTINUE
;
395 while ( (VISIT_CONTINUE
== result
) && (NULL
!= p
) )
397 result
= (p
->inspector
)(procdata
, p
->context
);
401 if (VISIT_CONTINUE
== result
)
402 return VISIT_ACCEPTED
;
407 /* Accept if all patterns match. */
409 process_and (struct process_data
*procdata
)
411 int result
= VISIT_CONTINUE
;
412 const struct visitor
*p
= inspectors
;
414 while ( ((VISIT_CONTINUE
| VISIT_ACCEPTED
) & result
) && (past_pat_inspector
!= p
) )
416 result
= (p
->inspector
)(procdata
, p
->context
);
420 if (result
== VISIT_CONTINUE
)
421 result
= VISIT_REJECTED
;
422 if (result
& (VISIT_ABORT
| VISIT_REJECTED
))
425 p
= past_pat_inspector
;
426 result
= VISIT_CONTINUE
;
428 while ( (VISIT_CONTINUE
== result
) && (NULL
!= p
) )
430 result
= (p
->inspector
)(procdata
, p
->context
);
434 if (VISIT_CONTINUE
== result
)
435 return VISIT_ACCEPTED
;
440 typedef int (*processfunc
)(struct process_data
*procdata
);
442 static processfunc mainprocessor
= NULL
;
445 add_visitor(visitfunc fn
, void *context
)
447 struct visitor
*p
= xmalloc(sizeof(struct visitor
));
449 p
->context
= context
;
452 if (NULL
== lastinspector
)
454 lastinspector
= inspectors
= p
;
458 lastinspector
->next
= p
;
466 visit_justprint_quoted(struct process_data
*procdata
, void *context
)
469 print_quoted (stdout
, quote_opts
, stdout_is_a_tty
,
471 procdata
->original_filename
);
473 return VISIT_CONTINUE
;
477 visit_justprint_unquoted(struct process_data
*procdata
, void *context
)
480 fputs(procdata
->original_filename
, stdout
);
482 return VISIT_CONTINUE
;
486 visit_old_format(struct process_data
*procdata
, void *context
)
491 /* Get the offset in the path where this path info starts. */
492 if (procdata
->c
== LOCATEDB_OLD_ESCAPE
)
493 procdata
->count
+= getw (procdata
->fp
) - LOCATEDB_OLD_OFFSET
;
495 procdata
->count
+= procdata
->c
- LOCATEDB_OLD_OFFSET
;
497 /* Overlay the old path with the remainder of the new. */
498 for (s
= procdata
->original_filename
+ procdata
->count
;
499 (procdata
->c
= getc (procdata
->fp
)) > LOCATEDB_OLD_ESCAPE
;)
500 if (procdata
->c
< 0200)
501 *s
++ = procdata
->c
; /* An ordinary character. */
504 /* Bigram markers have the high bit set. */
506 *s
++ = procdata
->bigram1
[procdata
->c
];
507 *s
++ = procdata
->bigram2
[procdata
->c
];
511 procdata
->munged_filename
= procdata
->original_filename
;
513 return VISIT_CONTINUE
;
518 visit_locate02_format(struct process_data
*procdata
, void *context
)
524 if (procdata
->slocatedb_format
)
526 if (procdata
->itemcount
== 0)
528 ungetc(procdata
->c
, procdata
->fp
);
532 else if (procdata
->itemcount
== 1)
534 procdata
->count
= procdata
->len
-1;
538 if (procdata
->c
== LOCATEDB_ESCAPE
)
539 procdata
->count
+= (short)get_short (procdata
->fp
);
540 else if (procdata
->c
> 127)
541 procdata
->count
+= procdata
->c
- 256;
543 procdata
->count
+= procdata
->c
;
548 if (procdata
->c
== LOCATEDB_ESCAPE
)
549 procdata
->count
+= (short)get_short (procdata
->fp
);
550 else if (procdata
->c
> 127)
551 procdata
->count
+= procdata
->c
- 256;
553 procdata
->count
+= procdata
->c
;
556 if (procdata
->count
> procdata
->len
|| procdata
->count
< 0)
558 /* This should not happen generally, but since we're
559 * reading in data which is outside our control, we
562 error(1, 0, _("locate database `%s' is corrupt or invalid"), procdata
->dbfile
);
565 /* Overlay the old path with the remainder of the new. */
566 nread
= locate_read_str (&procdata
->original_filename
, &procdata
->pathsize
,
567 procdata
->fp
, 0, procdata
->count
);
570 procdata
->c
= getc (procdata
->fp
);
571 procdata
->len
= procdata
->count
+ nread
;
572 s
= procdata
->original_filename
+ procdata
->len
- 1; /* Move to the last char in path. */
573 assert (s
[0] != '\0');
574 assert (s
[1] == '\0'); /* Our terminator. */
575 assert (s
[2] == '\0'); /* Added by locate_read_str. */
577 procdata
->munged_filename
= procdata
->original_filename
;
579 if (procdata
->slocatedb_format
)
581 /* Don't increment indefinitely, it might overflow. */
582 if (procdata
->itemcount
< 6)
584 ++(procdata
->itemcount
);
589 return VISIT_CONTINUE
;
593 visit_basename(struct process_data
*procdata
, void *context
)
596 procdata
->munged_filename
= base_name(procdata
->original_filename
);
598 return VISIT_CONTINUE
;
603 visit_casefold(struct process_data
*procdata
, void *context
)
605 struct stringbuf
*b
= context
;
607 if (*b
->preqlen
+1 > b
->buffersize
)
609 b
->buffer
= xrealloc(b
->buffer
, *b
->preqlen
+1); /* XXX: consider using extendbuf(). */
610 b
->buffersize
= *b
->preqlen
+1;
612 lc_strcpy(b
->buffer
, procdata
->munged_filename
);
614 return VISIT_CONTINUE
;
617 /* visit_existing_follow implements -L -e */
619 visit_existing_follow(struct process_data
*procdata
, void *context
)
624 /* munged_filename has been converted in some way (to lower case,
625 * or is just the base name of the file), and original_filename has not.
626 * Hence only original_filename is still actually the name of the file
627 * whose existence we would need to check.
629 if (stat(procdata
->original_filename
, &st
) != 0)
631 return VISIT_REJECTED
;
635 return VISIT_CONTINUE
;
639 /* visit_non_existing_follow implements -L -E */
641 visit_non_existing_follow(struct process_data
*procdata
, void *context
)
646 /* munged_filename has been converted in some way (to lower case,
647 * or is just the base name of the file), and original_filename has not.
648 * Hence only original_filename is still actually the name of the file
649 * whose existence we would need to check.
651 if (stat(procdata
->original_filename
, &st
) == 0)
653 return VISIT_REJECTED
;
657 return VISIT_CONTINUE
;
661 /* visit_existing_nofollow implements -P -e */
663 visit_existing_nofollow(struct process_data
*procdata
, void *context
)
668 /* munged_filename has been converted in some way (to lower case,
669 * or is just the base name of the file), and original_filename has not.
670 * Hence only original_filename is still actually the name of the file
671 * whose existence we would need to check.
673 if (lstat(procdata
->original_filename
, &st
) != 0)
675 return VISIT_REJECTED
;
679 return VISIT_CONTINUE
;
683 /* visit_non_existing_nofollow implements -P -E */
685 visit_non_existing_nofollow(struct process_data
*procdata
, void *context
)
690 /* munged_filename has been converted in some way (to lower case,
691 * or is just the base name of the file), and original_filename has not.
692 * Hence only original_filename is still actually the name of the file
693 * whose existence we would need to check.
695 if (lstat(procdata
->original_filename
, &st
) == 0)
697 return VISIT_REJECTED
;
701 return VISIT_CONTINUE
;
706 visit_substring_match_nocasefold(struct process_data
*procdata
, void *context
)
708 const char *pattern
= context
;
710 if (NULL
!= strstr(procdata
->munged_filename
, pattern
))
711 return VISIT_ACCEPTED
;
713 return VISIT_REJECTED
;
717 visit_substring_match_casefold(struct process_data
*procdata
, void *context
)
719 const struct casefolder
* p
= context
;
720 const struct stringbuf
* b
= p
->pbuf
;
723 if (NULL
!= strstr(b
->buffer
, p
->pattern
))
724 return VISIT_ACCEPTED
;
726 return VISIT_REJECTED
;
731 visit_globmatch_nofold(struct process_data
*procdata
, void *context
)
733 const char *glob
= context
;
734 if (fnmatch(glob
, procdata
->munged_filename
, 0) != 0)
735 return VISIT_REJECTED
;
737 return VISIT_ACCEPTED
;
742 visit_globmatch_casefold(struct process_data
*procdata
, void *context
)
744 const char *glob
= context
;
745 if (fnmatch(glob
, procdata
->munged_filename
, FNM_CASEFOLD
) != 0)
746 return VISIT_REJECTED
;
748 return VISIT_ACCEPTED
;
753 visit_regex(struct process_data
*procdata
, void *context
)
755 struct regular_expression
*p
= context
;
756 const size_t len
= strlen(procdata
->munged_filename
);
758 int rv
= re_search (&p
->regex
, procdata
->munged_filename
,
760 (struct re_registers
*) NULL
);
763 return VISIT_REJECTED
; /* no match (-1), or internal error (-2) */
767 return VISIT_ACCEPTED
; /* match */
773 visit_stats(struct process_data
*procdata
, void *context
)
775 struct locate_stats
*p
= context
;
776 size_t len
= strlen(procdata
->original_filename
);
778 int highbit
, whitespace
, newline
;
780 ++(p
->total_filename_count
);
781 p
->total_filename_length
+= len
;
783 highbit
= whitespace
= newline
= 0;
784 for (s
=procdata
->original_filename
; *s
; ++s
)
786 if ( (int)(*s
) & 128 )
790 newline
= whitespace
= 1;
792 else if (isspace((unsigned char)*s
))
799 ++(p
->highbit_filename_count
);
801 ++(p
->whitespace_count
);
803 ++(p
->newline_count
);
805 return VISIT_CONTINUE
;
810 visit_limit(struct process_data
*procdata
, void *context
)
812 struct locate_limits
*p
= context
;
816 if (++p
->items_accepted
>= p
->limit
)
819 return VISIT_CONTINUE
;
823 visit_count(struct process_data
*procdata
, void *context
)
825 struct locate_limits
*p
= context
;
830 return VISIT_CONTINUE
;
833 /* Emit the statistics.
836 print_stats(int argc
, size_t database_file_size
)
838 char hbuf
[LONGEST_HUMAN_READABLE
+ 1];
840 printf(_("Locate database size: %s bytes\n"),
841 human_readable ((uintmax_t) database_file_size
,
842 hbuf
, human_ceiling
, 1, 1));
844 printf(_("Filenames: %s "),
845 human_readable (statistics
.total_filename_count
,
846 hbuf
, human_ceiling
, 1, 1));
847 printf(_("with a cumulative length of %s bytes"),
848 human_readable (statistics
.total_filename_length
,
849 hbuf
, human_ceiling
, 1, 1));
851 printf(_("\n\tof which %s contain whitespace, "),
852 human_readable (statistics
.whitespace_count
,
853 hbuf
, human_ceiling
, 1, 1));
854 printf(_("\n\t%s contain newline characters, "),
855 human_readable (statistics
.newline_count
,
856 hbuf
, human_ceiling
, 1, 1));
857 printf(_("\n\tand %s contain characters with the high bit set.\n"),
858 human_readable (statistics
.highbit_filename_count
,
859 hbuf
, human_ceiling
, 1, 1));
862 printf(_("Compression ratio %4.2f%%\n"),
863 100.0 * ((double)statistics
.total_filename_length
864 - (double) database_file_size
)
865 / (double) statistics
.total_filename_length
);
870 * Return nonzero if the data we read in indicates that we are
871 * looking at a LOCATE02 locate database.
874 looking_at_gnu_locatedb (const char *data
, size_t len
)
876 if (len
< sizeof (LOCATEDB_MAGIC
))
878 else if (0 == memcmp (data
, LOCATEDB_MAGIC
, sizeof (LOCATEDB_MAGIC
)))
879 return 1; /* We saw the magic byte sequence */
885 * Return nonzero if the data we read in indicates that we are
886 * looking at an slocate database.
889 looking_at_slocate_locatedb (const char *filename
,
894 char slocate_magic
[] = "1";
895 size_t lenwanted
= sizeof(slocate_magic
);
904 /* Check that the magic number is a one-byte string */
907 if (isdigit((unsigned char)data
[0]))
909 /* looks promising. */
910 *seclevel
= (data
[0] - '0');
914 /* Hmm, well it's probably an slocate database
915 * of some awesomely huge security level, like 2.
916 * We don't know how to handle those.
919 _("locate database `%s' looks like an slocate "
920 "database but it seems to have security level %c, "
921 "which GNU findutils does not currently support"),
933 /* Definitely not slocate. */
939 /* Print or count the entries in DBFILE that match shell globbing patterns in
940 ARGV. Return the number of entries matched. */
943 search_one_database (int argc
,
952 struct locate_limits
*plimit
,
958 char *pathpart
; /* A pattern to consider. */
959 int argn
; /* Index to current pattern in argv. */
960 int need_fold
; /* Set when folding and any pattern is non-glob. */
961 int nread
; /* number of bytes read from an entry. */
962 struct process_data procdata
; /* Storage for data shared with visitors. */
963 int slocate_seclevel
;
964 struct visitor
* pvis
; /* temp for determining past_pat_inspector. */
965 const char *format_name
;
968 regex_options
|= RE_ICASE
;
970 procdata
.len
= procdata
.count
= 0;
971 procdata
.slocatedb_format
= 0;
972 procdata
.itemcount
= 0;
974 procdata
.dbfile
= dbfile
;
977 /* Set up the inspection regime */
979 lastinspector
= NULL
;
980 past_pat_inspector
= NULL
;
982 procdata
.pathsize
= 1026; /* Increased as necessary by locate_read_str. */
983 procdata
.original_filename
= xmalloc (procdata
.pathsize
);
986 nread
= fread (procdata
.original_filename
, 1, SLOCATE_DB_MAGIC_LEN
,
988 if (looking_at_slocate_locatedb(procdata
.dbfile
,
989 procdata
.original_filename
,
994 _("`%s' is an slocate database. "
995 "Support for these is new, expect problems for now "
996 "(you are, after all, using the CVS code)."),
999 /* slocate also uses frcode, but with a different header.
1000 * We handle the header here and then work with the data
1001 * in the normal way.
1003 if (slocate_seclevel
> 1)
1005 /* We don't know what those security levels mean,
1006 * so do nothing further
1010 else if (slocate_seclevel
> 0)
1012 /* Don't show the filenames to the user if they don't exist.
1013 * Showing stats is safe since filenames are only counted
1014 * after the existence check
1016 if (ACCEPT_EXISTING
!= check_existence
)
1021 _("`%s' is an slocate database. "
1022 "Turning on the '-e' option."),
1025 check_existence
= ACCEPT_EXISTING
;
1028 add_visitor(visit_locate02_format
, NULL
);
1029 format_name
= "slocate";
1030 procdata
.slocatedb_format
= 1;
1036 procdata
.slocatedb_format
= 0;
1037 nread2
= fread (procdata
.original_filename
+nread
, 1, sizeof (LOCATEDB_MAGIC
)-nread
,
1039 if (looking_at_gnu_locatedb(procdata
.original_filename
, nread
+nread2
))
1041 add_visitor(visit_locate02_format
, NULL
);
1042 format_name
= "GNU LOCATE02";
1044 else /* Use the old format */
1049 /* Read the list of the most common bigrams in the database. */
1052 int more_read
= fread (procdata
.original_filename
+ nread
, 1,
1053 256 - nread
, procdata
.fp
);
1054 /* XXX: check more_read+nread! */
1057 for (i
= 0; i
< 128; i
++)
1059 procdata
.bigram1
[i
] = procdata
.original_filename
[i
<< 1];
1060 procdata
.bigram2
[i
] = procdata
.original_filename
[(i
<< 1) + 1];
1062 format_name
= "old";
1063 add_visitor(visit_old_format
, NULL
);
1068 add_visitor(visit_basename
, NULL
);
1070 /* See if we need fold. */
1071 if (ignore_case
&& !regex
)
1072 for ( argn
= 0; argn
< argc
; argn
++ )
1074 pathpart
= argv
[argn
];
1075 if (!contains_metacharacter(pathpart
))
1084 add_visitor(visit_casefold
, &casebuf
);
1085 casebuf
.preqlen
= &procdata
.pathsize
;
1088 /* Add an inspector for each pattern we're looking for. */
1089 for ( argn
= 0; argn
< argc
; argn
++ )
1091 pathpart
= argv
[argn
];
1094 struct regular_expression
*p
= xmalloc(sizeof(*p
));
1095 const char *error_message
= NULL
;
1097 memset (&p
->regex
, 0, sizeof (p
->regex
));
1099 re_set_syntax(regex_options
);
1100 p
->regex
.allocated
= 100;
1101 p
->regex
.buffer
= (unsigned char *) xmalloc (p
->regex
.allocated
);
1102 p
->regex
.fastmap
= NULL
;
1103 p
->regex
.syntax
= regex_options
;
1104 p
->regex
.translate
= NULL
;
1106 error_message
= re_compile_pattern (pathpart
, strlen (pathpart
),
1110 error (1, 0, "%s", error_message
);
1114 add_visitor(visit_regex
, p
);
1117 else if (contains_metacharacter(pathpart
))
1120 add_visitor(visit_globmatch_casefold
, pathpart
);
1122 add_visitor(visit_globmatch_nofold
, pathpart
);
1126 /* No glob characters used. Hence we match on
1127 * _any part_ of the filename, not just the
1128 * basename. This seems odd to me, but it is the
1129 * traditional behaviour.
1130 * James Youngman <jay@gnu.org>
1134 struct casefolder
* cf
= xmalloc(sizeof(*cf
));
1135 cf
->pattern
= pathpart
;
1136 cf
->pbuf
= &casebuf
;
1137 add_visitor(visit_substring_match_casefold
, cf
);
1138 /* If we ignore case, convert it to lower now so we don't have to
1141 lc_strcpy(pathpart
, pathpart
);
1145 add_visitor(visit_substring_match_nocasefold
, pathpart
);
1150 pvis
= lastinspector
;
1152 /* We add visit_existing_*() as late as possible to reduce the
1153 * number of stat() calls.
1155 switch (check_existence
)
1157 case ACCEPT_EXISTING
:
1158 if (follow_symlinks
) /* -L, default */
1159 add_visitor(visit_existing_follow
, NULL
);
1161 add_visitor(visit_existing_nofollow
, NULL
);
1164 case ACCEPT_NON_EXISTING
:
1165 if (follow_symlinks
) /* -L, default */
1166 add_visitor(visit_non_existing_follow
, NULL
);
1168 add_visitor(visit_non_existing_nofollow
, NULL
);
1171 case ACCEPT_EITHER
: /* Default, neither -E nor -e */
1172 /* do nothing; no extra processing. */
1176 /* Security issue: The stats visitor must be added after the
1177 * existence checker because otherwise the -S option would leak
1178 * information about files that the caller cannot see.
1181 add_visitor(visit_stats
, &statistics
);
1185 if (print_quoted_filename
)
1186 add_visitor(visit_justprint_quoted
, NULL
);
1188 add_visitor(visit_justprint_unquoted
, NULL
);
1193 add_visitor(visit_limit
, plimit
);
1195 add_visitor(visit_count
, plimit
);
1200 past_pat_inspector
= pvis
->next
;
1202 mainprocessor
= process_and
;
1204 mainprocessor
= process_or
;
1207 mainprocessor
= process_simple
;
1211 printf(_("Database %s is in the %s format.\n"),
1217 procdata
.c
= getc (procdata
.fp
);
1218 /* If we are searching for filename patterns, the inspector list
1219 * will contain an entry for each pattern for which we are searching.
1221 while ( (procdata
.c
!= EOF
) &&
1222 (VISIT_ABORT
!= (mainprocessor
)(&procdata
)) )
1224 /* Do nothing; all the work is done in the visitor functions. */
1230 print_stats(argc
, filesize
);
1233 if (ferror (procdata
.fp
))
1235 error (0, errno
, "%s", procdata
.dbfile
);
1238 return plimit
->items_accepted
;
1244 extern char *version_string
;
1246 /* The name this program was run with. */
1250 usage (FILE *stream
)
1252 fprintf (stream
, _("\
1253 Usage: %s [-d path | --database=path] [-e | -E | --[non-]existing]\n\
1254 [-i | --ignore-case] [-w | --wholename] [-b | --basename] \n\
1255 [--limit=N | -l N] [-S | --statistics] [-0 | --null] [-c | --count]\n\
1256 [-P | -H | --nofollow] [-L | --follow] [-m | --mmap ] [ -s | --stdio ]\n\
1257 [-A | --all] [-p | --print] [-r | --regex ] [--regextype=TYPE]\n\
1258 [-version] [--help]\n\
1261 fputs (_("\nReport bugs to <bug-findutils@gnu.org>.\n"), stream
);
1265 REGEXTYPE_OPTION
= CHAR_MAX
+ 1
1269 static struct option
const longopts
[] =
1271 {"database", required_argument
, NULL
, 'd'},
1272 {"existing", no_argument
, NULL
, 'e'},
1273 {"non-existing", no_argument
, NULL
, 'E'},
1274 {"ignore-case", no_argument
, NULL
, 'i'},
1275 {"all", no_argument
, NULL
, 'A'},
1276 {"help", no_argument
, NULL
, 'h'},
1277 {"version", no_argument
, NULL
, 'v'},
1278 {"null", no_argument
, NULL
, '0'},
1279 {"count", no_argument
, NULL
, 'c'},
1280 {"wholename", no_argument
, NULL
, 'w'},
1281 {"wholepath", no_argument
, NULL
, 'w'}, /* Synonym. */
1282 {"basename", no_argument
, NULL
, 'b'},
1283 {"print", no_argument
, NULL
, 'p'},
1284 {"stdio", no_argument
, NULL
, 's'},
1285 {"mmap", no_argument
, NULL
, 'm'},
1286 {"limit", required_argument
, NULL
, 'l'},
1287 {"regex", no_argument
, NULL
, 'r'},
1288 {"regextype", required_argument
, NULL
, REGEXTYPE_OPTION
},
1289 {"statistics", no_argument
, NULL
, 'S'},
1290 {"follow", no_argument
, NULL
, 'L'},
1291 {"nofollow", no_argument
, NULL
, 'P'},
1292 {NULL
, no_argument
, NULL
, 0}
1299 const char * what
= "failed";
1300 uid_t orig_euid
= geteuid();
1302 /* Use of setgroups() is restricted to root only. */
1306 groups
[1] = getgid();
1307 if (0 != setgroups(1, groups
))
1309 what
= _("failed to drop group privileges");
1314 if (0 != setuid(getuid()))
1316 what
= _("failed to drop setuid privileges");
1320 /* Defend against the case where the attacker runs us with the
1321 * capability to call setuid() turned off, which on some systems
1322 * will cause the above attempt to drop privileges to fail (leaving us
1327 what
= _("Failed to drop privileges");
1335 error(1, errno
, "%s", what
);
1343 /* deliberate infinite loop */
1348 opendb(const char *name
)
1350 int fd
= open(name
, O_RDONLY
1351 #if defined O_LARGEFILE
1357 /* Make sure it won't survive an exec */
1358 if (0 != fcntl(fd
, F_SETFD
, FD_CLOEXEC
))
1368 dolocate (int argc
, char **argv
, int secure_db_fd
)
1371 unsigned long int found
= 0uL;
1373 int ignore_case
= 0;
1376 int basename_only
= 0;
1379 int regex_options
= RE_SYNTAX_EMACS
;
1384 int they_chose_db
= 0;
1385 bool did_stdin
= false; /* Set to prevent rereading stdin. */
1387 program_name
= argv
[0];
1389 #ifdef HAVE_SETLOCALE
1390 setlocale (LC_ALL
, "");
1392 bindtextdomain (PACKAGE
, LOCALEDIR
);
1393 textdomain (PACKAGE
);
1394 atexit (close_stdout
);
1397 limits
.items_accepted
= 0;
1399 quote_opts
= clone_quoting_options (NULL
);
1400 print_quoted_filename
= true;
1402 /* We cannot simultaneously trust $LOCATE_PATH and use the
1403 * setuid-access-controlled database, since that could cause a leak
1406 dbpath
= getenv ("LOCATE_PATH");
1412 check_existence
= ACCEPT_EITHER
;
1414 while ((optc
= getopt_long (argc
, argv
, "Abcd:eEil:prsm0SwHPL", longopts
, (int *) 0)) != -1)
1419 print_quoted_filename
= false; /* print filename 'raw'. */
1440 check_existence
= ACCEPT_EXISTING
;
1444 check_existence
= ACCEPT_NON_EXISTING
;
1460 printf (_("GNU locate version %s\n"), version_string
);
1471 case REGEXTYPE_OPTION
:
1472 regex_options
= get_regex_type(optarg
);
1480 follow_symlinks
= 1;
1483 /* In find, -P and -H differ in the way they handle paths
1484 * given on the command line. This is not relevant for
1485 * locate, but the -H option is supported because it is
1486 * probably more intuitive to do so.
1490 follow_symlinks
= 0;
1496 strtol_error err
= xstrtoumax(optarg
, &end
, 10, &limits
.limit
, NULL
);
1497 if (LONGINT_OK
!= err
)
1499 STRTOL_FATAL_ERROR(optarg
, _("argument to --limit"), err
);
1505 case 's': /* use stdio */
1506 case 'm': /* use mmap */
1507 /* These options are implemented simply for
1508 * compatibility with FreeBSD
1518 /* If the user gave the -d option or set LOCATE_PATH,
1519 * relinquish access to the secure database.
1523 if (secure_db_fd
>= 0)
1525 close(secure_db_fd
);
1530 if (!just_count
&& !stats
)
1540 if (!just_count
&& optind
== argc
)
1548 if (1 == isatty(STDOUT_FILENO
))
1549 stdout_is_a_tty
= true;
1551 stdout_is_a_tty
= false;
1554 next_element (dbpath
, 0); /* Initialize. */
1556 /* Bail out early if limit already reached. */
1557 while (!use_limit
|| limits
.limit
> limits
.items_accepted
)
1563 statistics
.compressed_bytes
=
1564 statistics
.total_filename_count
=
1565 statistics
.total_filename_length
=
1566 statistics
.whitespace_count
=
1567 statistics
.newline_count
=
1568 statistics
.highbit_filename_count
= 0u;
1572 /* Take the next element from the list of databases */
1573 e
= next_element ((char *) NULL
, 0);
1577 if (0 == strcmp (e
, "-"))
1582 _("warning: the locate database can only be read from stdin once."));
1594 if (0 == strlen(e
) || 0 == strcmp(e
, "."))
1599 /* open the database */
1603 error (0, errno
, "%s", e
);
1610 if (-1 == secure_db_fd
)
1612 /* Already searched the database, it's time to exit the loop */
1617 e
= selected_secure_db
;
1623 /* Check the database to see if it is old. */
1626 error (0, errno
, "%s", e
);
1627 /* continue anyway */
1628 filesize
= (off_t
)0;
1634 filesize
= st
.st_size
;
1636 if ((time_t)-1 == time(&now
))
1638 /* If we can't tell the time, we don't know how old the
1639 * database is. But since the message is just advisory,
1640 * we continue anyway.
1642 error (0, errno
, "time system call");
1646 if (now
- st
.st_mtime
> WARN_SECONDS
)
1649 warning: database `fred' is more than 8 days old */
1651 _("warning: database `%s' is more than %d %s old"),
1652 e
, WARN_NUMBER_UNITS
, _(warn_name_units
));
1657 fp
= fdopen(fd
, "r");
1660 error (0, errno
, "%s", e
);
1664 /* Search this database for all patterns simultaneously */
1665 found
= search_one_database (argc
- optind
, &argv
[optind
],
1667 ignore_case
, print
, basename_only
,
1668 use_limit
, &limits
, stats
,
1669 op_and
, regex
, regex_options
);
1671 /* Close the database (even if it is stdin) */
1672 if (fclose (fp
) == EOF
)
1674 error (0, errno
, "%s", e
);
1681 printf("%ld\n", found
);
1684 if (found
|| (use_limit
&& (limits
.limit
==0)) || stats
)
1690 #define ARRAYSIZE(a) (sizeof(a)/sizeof(a[0]))
1692 open_secure_db(void)
1696 const char * secure_db_list
[] =
1699 "/var/lib/slocate/slocate.db",
1702 for (i
=0; secure_db_list
[i
]; ++i
)
1704 fd
= opendb(secure_db_list
[i
]);
1707 selected_secure_db
= secure_db_list
[i
];
1715 main (int argc
, char **argv
)
1717 int dbfd
= open_secure_db();
1720 return dolocate(argc
, argv
, dbfd
);