1 /* strings -- print the strings of printable characters in files
2 Copyright 1993, 1994, 1995, 1996, 1997, 1998, 1999, 2000, 2001,
3 2002 Free Software Foundation, Inc.
5 This program is free software; you can redistribute it and/or modify
6 it under the terms of the GNU General Public License as published by
7 the Free Software Foundation; either version 2, or (at your option)
10 This program is distributed in the hope that it will be useful,
11 but WITHOUT ANY WARRANTY; without even the implied warranty of
12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 GNU General Public License for more details.
15 You should have received a copy of the GNU General Public License
16 along with this program; if not, write to the Free Software
17 Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA
/* Usage: strings [options] file...

   Options:
   --all
   -a
   -            Do not scan only the initialized data section of object files.

   --print-file-name
   -f           Print the name of the file before each string.

   --bytes=min-len
   -n min-len
   -min-len     Print graphic char sequences, MIN-LEN or more bytes long,
                that are followed by a NUL or a newline.  Default is 4.

   --radix={o,x,d}
   -t {o,x,d}   Print the offset within the file before each string,
                in octal/hex/decimal.

   -o           Like -to.  (Some other implementations have -o like -to,
                others like -td.  We chose one arbitrarily.)

   --encoding={s,b,l,B,L}
   -e {s,b,l,B,L}
                Select character encoding: single-byte, bigendian 16-bit,
                littleendian 16-bit, bigendian 32-bit, littleendian 32-bit

   --target=BFDNAME
                Specify a non-default object file format.

   --help
   -h           Print the usage message on the standard output.

   --version
   -v           Print the program version number.

   Written by Richard Stallman <rms@gnu.ai.mit.edu>
   and David MacKenzie <djm@gnu.ai.mit.edu>.  */
67 #include "libiberty.h"
68 #include "safe-ctype.h"
/* Some platforms need to put stdin into binary mode, to read
   binary files.  */
75 #define O_BINARY _O_BINARY
76 #define setmode _setmode
83 #define SET_BINARY(f) do { if (!isatty(f)) setmode(f,O_BINARY); } while (0)
87 #define isgraphic(c) (ISPRINT (c) || (c) == '\t')
93 /* The BFD section flags that identify an initialized data section. */
94 #define DATA_FLAGS (SEC_ALLOC | SEC_LOAD | SEC_HAS_CONTENTS)
97 typedef off64_t file_off
;
98 #define file_open(s,m) fopen64(s,m)
100 typedef off_t file_off
;
101 #define file_open(s,m) fopen(s,m)
104 /* Radix for printing addresses (must be 8, 10 or 16). */
105 static int address_radix
;
107 /* Minimum length of sequence of graphic chars to trigger output. */
108 static int string_min
;
110 /* true means print address within file for each string. */
111 static boolean print_addresses
;
113 /* true means print filename for each string. */
114 static boolean print_filenames
;
116 /* true means for object files scan only the data section. */
117 static boolean datasection_only
;
119 /* true if we found an initialized data section in the current file. */
120 static boolean got_a_section
;
122 /* The BFD object file format. */
/* The character encoding in use, held as its single selector letter
   (one of the --encoding values s, b, l, B, L).  */
static char encoding;

/* Number of input bytes get_char consumes to build one character.  */
static int encoding_bytes;
129 static struct option long_options
[] =
131 {"all", no_argument
, NULL
, 'a'},
132 {"print-file-name", no_argument
, NULL
, 'f'},
133 {"bytes", required_argument
, NULL
, 'n'},
134 {"radix", required_argument
, NULL
, 't'},
135 {"encoding", required_argument
, NULL
, 'e'},
136 {"target", required_argument
, NULL
, 'T'},
137 {"help", no_argument
, NULL
, 'h'},
138 {"version", no_argument
, NULL
, 'v'},
142 static void strings_a_section
PARAMS ((bfd
*, asection
*, PTR
));
143 static boolean strings_object_file
PARAMS ((const char *));
144 static boolean strings_file
PARAMS ((char *file
));
145 static int integer_arg
PARAMS ((char *s
));
146 static void print_strings
PARAMS ((const char *filename
, FILE *stream
,
147 file_off address
, int stop_point
,
148 int magiccount
, char *magic
));
149 static void usage
PARAMS ((FILE *stream
, int status
));
150 static long get_char
PARAMS ((FILE *stream
, file_off
*address
,
151 int *magiccount
, char **magic
));
153 int main
PARAMS ((int, char **));
162 boolean files_given
= false;
164 #if defined (HAVE_SETLOCALE)
165 setlocale (LC_ALL
, "");
167 bindtextdomain (PACKAGE
, LOCALEDIR
);
168 textdomain (PACKAGE
);
170 program_name
= argv
[0];
171 xmalloc_set_program_name (program_name
);
173 print_addresses
= false;
174 print_filenames
= false;
175 datasection_only
= true;
179 while ((optc
= getopt_long (argc
, argv
, "afhHn:ot:e:Vv0123456789",
180 long_options
, (int *) 0)) != EOF
)
185 datasection_only
= false;
189 print_filenames
= true;
197 string_min
= integer_arg (optarg
);
200 fatal (_("invalid number %s"), optarg
);
205 print_addresses
= true;
210 print_addresses
= true;
211 if (optarg
[1] != '\0')
237 if (optarg
[1] != '\0')
239 encoding
= optarg
[0];
244 print_version ("strings");
252 string_min
= optc
- '0';
254 string_min
= string_min
* 10 + optc
- '0';
280 set_default_bfd_target ();
284 datasection_only
= false;
286 SET_BINARY (fileno (stdin
));
288 print_strings ("{standard input}", stdin
, 0, 0, 0, (char *) NULL
);
293 for (; optind
< argc
; ++optind
)
295 if (strcmp (argv
[optind
], "-") == 0)
296 datasection_only
= false;
300 exit_status
|= (strings_file (argv
[optind
]) == false);
305 if (files_given
== false)
308 return (exit_status
);
311 /* Scan section SECT of the file ABFD, whose printable name is FILE.
312 If it contains initialized data,
313 set `got_a_section' and print the strings in it. */
316 strings_a_section (abfd
, sect
, filearg
)
321 const char *file
= (const char *) filearg
;
323 if ((sect
->flags
& DATA_FLAGS
) == DATA_FLAGS
)
325 bfd_size_type sz
= bfd_get_section_size_before_reloc (sect
);
326 PTR mem
= xmalloc (sz
);
327 if (bfd_get_section_contents (abfd
, sect
, mem
, (file_ptr
) 0, sz
))
329 got_a_section
= true;
330 print_strings (file
, (FILE *) NULL
, sect
->filepos
, 0, sz
, mem
);
336 /* Scan all of the sections in FILE, and print the strings
337 in the initialized data section(s).
339 Return true if successful,
340 false if not (such as if FILE is not an object file). */
343 strings_object_file (file
)
346 bfd
*abfd
= bfd_openr (file
, target
);
350 /* Treat the file as a non-object file. */
354 /* This call is mainly for its side effect of reading in the sections.
355 We follow the traditional behavior of `strings' in that we don't
356 complain if we don't recognize a file to be an object file. */
357 if (bfd_check_format (abfd
, bfd_object
) == false)
363 got_a_section
= false;
364 bfd_map_over_sections (abfd
, strings_a_section
, (PTR
) file
);
366 if (!bfd_close (abfd
))
372 return got_a_section
;
375 /* Print the strings in FILE. Return true if ok, false if an error occurs. */
/* If we weren't told to scan the whole file,
   try to open it as an object file and only look at
   initialized data sections.  If that fails, fall back to the
   whole file.  */
385 if (!datasection_only
|| !strings_object_file (file
))
389 stream
= file_open (file
, FOPEN_RB
);
392 fprintf (stderr
, "%s: ", program_name
);
397 print_strings (file
, stream
, (file_off
) 0, 0, 0, (char *) 0);
399 if (fclose (stream
) == EOF
)
401 fprintf (stderr
, "%s: ", program_name
);
410 /* Read the next character, return EOF if none available.
411 Assume that STREAM is positioned so that the next byte read
412 is at address ADDRESS in the file.
414 If STREAM is NULL, do not read from it.
415 The caller can supply a buffer of characters
416 to be processed before the data in STREAM.
417 MAGIC is the address of the buffer and
418 MAGICCOUNT is how many characters are in it. */
421 get_char (stream
, address
, magiccount
, magic
)
429 unsigned char buf
[4];
431 for (i
= 0; i
< encoding_bytes
; i
++)
442 #ifdef HAVE_GETC_UNLOCKED
443 c
= getc_unlocked (stream
);
461 r
= (buf
[0] << 8) | buf
[1];
464 r
= buf
[0] | (buf
[1] << 8);
467 r
= ((long) buf
[0] << 24) | ((long) buf
[1] << 16) |
468 ((long) buf
[2] << 8) | buf
[3];
471 r
= buf
[0] | ((long) buf
[1] << 8) | ((long) buf
[2] << 16) |
472 ((long) buf
[3] << 24);
482 /* Find the strings in file FILENAME, read from STREAM.
483 Assume that STREAM is positioned so that the next byte read
484 is at address ADDRESS in the file.
485 Stop reading at address STOP_POINT in the file, if nonzero.
487 If STREAM is NULL, do not read from it.
488 The caller can supply a buffer of characters
489 to be processed before the data in STREAM.
490 MAGIC is the address of the buffer and
491 MAGICCOUNT is how many characters are in it.
492 Those characters come at address ADDRESS and the data in STREAM follow. */
495 print_strings (filename
, stream
, address
, stop_point
, magiccount
, magic
)
496 const char *filename
;
503 char *buf
= (char *) xmalloc (sizeof (char) * (string_min
+ 1));
511 /* See if the next `string_min' chars are all graphic chars. */
513 if (stop_point
&& address
>= stop_point
)
516 for (i
= 0; i
< string_min
; i
++)
518 c
= get_char (stream
, &address
, &magiccount
, &magic
);
521 if (c
> 255 || c
< 0 || !isgraphic (c
))
522 /* Found a non-graphic. Try again starting with next char. */
527 /* We found a run of `string_min' graphic characters. Print up
528 to the next non-graphic character. */
531 printf ("%s: ", filename
);
533 switch (address_radix
)
536 #if __STDC_VERSION__ >= 199901L || (defined(__GNUC__) && __GNUC__ >= 2)
537 if (sizeof (start
) > sizeof (long))
538 printf ("%7Lo ", (unsigned long long) start
);
541 # if !BFD_HOST_64BIT_LONG
542 if (start
!= (unsigned long) start
)
543 printf ("++%7lo ", (unsigned long) start
);
547 printf ("%7lo ", (unsigned long) start
);
551 #if __STDC_VERSION__ >= 199901L || (defined(__GNUC__) && __GNUC__ >= 2)
552 if (sizeof (start
) > sizeof (long))
553 printf ("%7Ld ", (unsigned long long) start
);
556 # if !BFD_HOST_64BIT_LONG
557 if (start
!= (unsigned long) start
)
558 printf ("++%7ld ", (unsigned long) start
);
562 printf ("%7ld ", (long) start
);
566 #if __STDC_VERSION__ >= 199901L || (defined(__GNUC__) && __GNUC__ >= 2)
567 if (sizeof (start
) > sizeof (long))
568 printf ("%7Lx ", (unsigned long long) start
);
571 # if !BFD_HOST_64BIT_LONG
572 if (start
!= (unsigned long) start
)
573 printf ("%lx%8.8lx ", start
>> 32, start
& 0xffffffff);
577 printf ("%7lx ", (unsigned long) start
);
586 c
= get_char (stream
, &address
, &magiccount
, &magic
);
589 if (c
> 255 || c
< 0 || !isgraphic (c
))
598 /* Parse string S as an integer, using decimal radix by default,
599 but allowing octal and hex numbers as in C. */
612 else if (*++p
== 'x')
621 while (((c
= *p
++) >= '0' && c
<= '9')
622 || (radix
== 16 && (c
& ~40) >= 'A' && (c
& ~40) <= 'Z'))
625 if (c
>= '0' && c
<= '9')
628 value
+= (c
& ~40) - 'A';
640 fatal (_("invalid integer argument %s"), s
);
646 usage (stream
, status
)
650 fprintf (stream
, _("Usage: %s [option(s)] [file(s)]\n"), program_name
);
651 fprintf (stream
, _(" Display printable strings in [file(s)] (stdin by default)\n"));
652 fprintf (stream
, _(" The options are:\n\
653 -a - --all Scan the entire file, not just the data section\n\
654 -f --print-file-name Print the name of the file before each string\n\
655 -n --bytes=[number] Locate & print any NUL-terminated sequence of at\n\
656 -<number> least [number] characters (default 4).\n\
657 -t --radix={o,x,d} Print the location of the string in base 8, 10 or 16\n\
658 -o An alias for --radix=o\n\
659 -T --target=<BFDNAME> Specify the binary file format\n\
660 -e --encoding={s,b,l,B,L} Select character size and endianness:\n\
661 s = 8-bit, {b,l} = 16-bit, {B,L} = 32-bit\n\
662 -h --help Display this information\n\
663 -v --version Print the program's version number\n"));
664 list_supported_targets (program_name
, stream
);
666 fprintf (stream
, _("Report bugs to %s\n"), REPORT_BUGS_TO
);