1 /* strings -- print the strings of printable characters in files
2 Copyright (C) 1993-2017 Free Software Foundation, Inc.
4 This program is free software; you can redistribute it and/or modify
5 it under the terms of the GNU General Public License as published by
6 the Free Software Foundation; either version 3, or (at your option)
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
14 You should have received a copy of the GNU General Public License
15 along with this program; if not, write to the Free Software
16 Foundation, Inc., 51 Franklin Street - Fifth Floor, Boston, MA
19 /* Usage: strings [options] file...
24 - Scan each file in its entirety.
27 -d Scan only the initialized data section(s) of object files.
30 -f Print the name of the file before each string.
34 -min-len Print graphic char sequences, MIN-LEN or more bytes long,
35 that are followed by a NUL or a newline. Default is 4.
38 -t {o,x,d} Print the offset within the file before each string, in octal, hexadecimal or decimal.
41 --include-all-whitespace
42 -w By default tab and space are the only whitespace included in graphic
43 char sequences. This option considers all of isspace() valid.
45 -o Like -to. (Some other implementations have -o like -to,
46 others like -td. We chose one arbitrarily.)
48 --encoding={s,S,b,l,B,L}
50 Select character encoding: 7-bit-character, 8-bit-character,
51 bigendian 16-bit, littleendian 16-bit, bigendian 32-bit, littleendian 32-bit.
56 Specify a non-default object file format.
58 --output-separator=sep_string
59 -s sep_string String used to separate parsed strings in output.
63 -h Print the usage message on the standard output.
67 -v Print the program version number.
69 Written by Richard Stallman <rms@gnu.ai.mit.edu>
70 and David MacKenzie <djm@gnu.ai.mit.edu>. */
75 #include "libiberty.h"
76 #include "safe-ctype.h"
79 #define STRING_ISGRAPHIC(c) \
82 && ((c) == '\t' || ISPRINT (c) || (encoding == 'S' && (c) > 127) \
83 || (include_all_whitespace && ISSPACE (c))) \
90 /* The BFD section flags that identify an initialized data section. */
91 #define DATA_FLAGS (SEC_ALLOC | SEC_LOAD | SEC_HAS_CONTENTS)
93 /* Radix for printing addresses (must be 8, 10 or 16). */
94 static int address_radix
;
96 /* Minimum length of sequence of graphic chars to trigger output. */
97 static int string_min
;
99 /* Whether or not we include all whitespace as a graphic char. */
100 static bfd_boolean include_all_whitespace
;
102 /* TRUE means print address within file for each string. */
103 static bfd_boolean print_addresses
;
105 /* TRUE means print filename for each string. */
106 static bfd_boolean print_filenames
;
108 /* TRUE means for object files scan only the data section. */
109 static bfd_boolean datasection_only
;
111 /* The BFD object file format. */
114 /* The character encoding format. */
115 static char encoding
;
116 static int encoding_bytes
;
118 /* Output string used to separate parsed strings */
119 static char *output_separator
;
/* Long-option table passed to getopt_long ().  Every entry has a NULL
   flag pointer, so getopt_long () returns the entry's final field (the
   equivalent short-option character) when the long option is seen.
   The has_arg field of each entry must agree with the short-option
   string "adfhHn:wot:e:T:s:Vv0123456789" used in the same call.  */
static struct option long_options[] =
{
  {"all", no_argument, NULL, 'a'},
  {"data", no_argument, NULL, 'd'},
  {"print-file-name", no_argument, NULL, 'f'},
  {"bytes", required_argument, NULL, 'n'},
  {"radix", required_argument, NULL, 't'},
  /* -w is a plain flag: it has no ':' in the short-option string and
     nothing reads optarg for it.  Declaring it required_argument made
     --include-all-whitespace consume the following command-line word
     (usually a file name) as a bogus argument.  */
  {"include-all-whitespace", no_argument, NULL, 'w'},
  {"encoding", required_argument, NULL, 'e'},
  {"target", required_argument, NULL, 'T'},
  {"output-separator", required_argument, NULL, 's'},
  {"help", no_argument, NULL, 'h'},
  {"version", no_argument, NULL, 'v'},
  /* All-zero sentinel: getopt_long () needs it to find the end of the
     table.  */
  {NULL, 0, NULL, 0}
};
137 static bfd_boolean
strings_file (char *);
138 static void print_strings (const char *, FILE *, file_ptr
, int, int, char *);
139 static void usage (FILE *, int) ATTRIBUTE_NORETURN
;
141 int main (int, char **);
144 main (int argc
, char **argv
)
148 bfd_boolean files_given
= FALSE
;
152 #if defined (HAVE_SETLOCALE)
153 setlocale (LC_ALL
, "");
155 bindtextdomain (PACKAGE
, LOCALEDIR
);
156 textdomain (PACKAGE
);
158 program_name
= argv
[0];
159 xmalloc_set_program_name (program_name
);
160 bfd_set_error_program_name (program_name
);
162 expandargv (&argc
, &argv
);
165 include_all_whitespace
= FALSE
;
166 print_addresses
= FALSE
;
167 print_filenames
= FALSE
;
168 if (DEFAULT_STRINGS_ALL
)
169 datasection_only
= FALSE
;
171 datasection_only
= TRUE
;
174 output_separator
= NULL
;
176 while ((optc
= getopt_long (argc
, argv
, "adfhHn:wot:e:T:s:Vv0123456789",
177 long_options
, (int *) 0)) != EOF
)
182 datasection_only
= FALSE
;
186 datasection_only
= TRUE
;
190 print_filenames
= TRUE
;
198 string_min
= (int) strtoul (optarg
, &s
, 0);
199 if (s
!= NULL
&& *s
!= 0)
200 fatal (_("invalid integer argument %s"), optarg
);
204 include_all_whitespace
= TRUE
;
208 print_addresses
= TRUE
;
213 print_addresses
= TRUE
;
214 if (optarg
[1] != '\0')
240 if (optarg
[1] != '\0')
242 encoding
= optarg
[0];
246 output_separator
= optarg
;
251 print_version ("strings");
258 numeric_opt
= optind
;
263 if (numeric_opt
!= 0)
265 string_min
= (int) strtoul (argv
[numeric_opt
- 1] + 1, &s
, 0);
266 if (s
!= NULL
&& *s
!= 0)
267 fatal (_("invalid integer argument %s"), argv
[numeric_opt
- 1] + 1);
270 fatal (_("invalid minimum string length %d"), string_min
);
291 set_default_bfd_target ();
295 datasection_only
= FALSE
;
296 SET_BINARY (fileno (stdin
));
297 print_strings ("{standard input}", stdin
, 0, 0, 0, (char *) NULL
);
302 for (; optind
< argc
; ++optind
)
304 if (strcmp (argv
[optind
], "-") == 0)
305 datasection_only
= FALSE
;
309 exit_status
|= !strings_file (argv
[optind
]);
317 return (exit_status
);
320 /* Scan section SECT of the file ABFD, whose printable name is
321 FILENAME. If it contains initialized data set GOT_A_SECTION and
322 print the strings in it. */
325 strings_a_section (bfd
*abfd
, asection
*sect
, const char *filename
,
326 bfd_boolean
*got_a_section
)
328 bfd_size_type sectsize
;
331 if ((sect
->flags
& DATA_FLAGS
) != DATA_FLAGS
)
334 sectsize
= bfd_get_section_size (sect
);
338 if (!bfd_malloc_and_get_section (abfd
, sect
, &mem
))
340 non_fatal (_("%s: Reading section %s failed: %s"),
341 filename
, sect
->name
, bfd_errmsg (bfd_get_error ()));
345 *got_a_section
= TRUE
;
346 print_strings (filename
, NULL
, sect
->filepos
, 0, sectsize
, (char *) mem
);
350 /* Scan all of the sections in FILE, and print the strings
351 in the initialized data section(s).
353 Return TRUE if successful,
354 FALSE if not (such as if FILE is not an object file). */
357 strings_object_file (const char *file
)
361 bfd_boolean got_a_section
;
363 abfd
= bfd_openr (file
, target
);
366 /* Treat the file as a non-object file. */
369 /* This call is mainly for its side effect of reading in the sections.
370 We follow the traditional behavior of `strings' in that we don't
371 complain if we don't recognize a file to be an object file. */
372 if (!bfd_check_format (abfd
, bfd_object
))
378 got_a_section
= FALSE
;
379 for (s
= abfd
->sections
; s
!= NULL
; s
= s
->next
)
380 strings_a_section (abfd
, s
, file
, &got_a_section
);
382 if (!bfd_close (abfd
))
388 return got_a_section
;
391 /* Print the strings in FILE. Return TRUE if ok, FALSE if an error occurs. */
394 strings_file (char *file
)
398 /* get_file_size does not support non-S_ISREG files. */
400 if (stat (file
, &st
) < 0)
403 non_fatal (_("'%s': No such file"), file
);
405 non_fatal (_("Warning: could not locate '%s'. reason: %s"),
406 file
, strerror (errno
));
409 else if (S_ISDIR (st
.st_mode
))
411 non_fatal (_("Warning: '%s' is a directory"), file
);
415 /* If we weren't told to scan the whole file,
416 try to open it as an object file and only look at
417 initialized data sections. If that fails, fall back to scanning the whole file. */
419 if (!datasection_only
|| !strings_object_file (file
))
423 stream
= fopen (file
, FOPEN_RB
);
426 fprintf (stderr
, "%s: ", program_name
);
431 print_strings (file
, stream
, (file_ptr
) 0, 0, 0, (char *) 0);
433 if (fclose (stream
) == EOF
)
435 fprintf (stderr
, "%s: ", program_name
);
444 /* Read the next character, return EOF if none available.
445 Assume that STREAM is positioned so that the next byte read
446 is at address ADDRESS in the file.
448 If STREAM is NULL, do not read from it.
449 The caller can supply a buffer of characters
450 to be processed before the data in STREAM.
451 MAGIC is the address of the buffer and
452 MAGICCOUNT is how many characters are in it. */
455 get_char (FILE *stream
, file_ptr
*address
, int *magiccount
, char **magic
)
460 for (i
= 0; i
< encoding_bytes
; i
++)
472 /* Only use getc_unlocked if we found a declaration for it.
473 Otherwise, libc is not thread safe by default, and we
474 should not use it. */
476 #if defined(HAVE_GETC_UNLOCKED) && HAVE_DECL_GETC_UNLOCKED
477 c
= getc_unlocked (stream
);
486 r
= (r
<< 8) | (c
& 0xff);
494 r
= ((r
& 0xff) << 8) | ((r
& 0xff00) >> 8);
497 r
= (((r
& 0xff) << 24) | ((r
& 0xff00) << 8)
498 | ((r
& 0xff0000) >> 8) | ((r
& 0xff000000) >> 24));
505 /* Find the strings in file FILENAME, read from STREAM.
506 Assume that STREAM is positioned so that the next byte read
507 is at address ADDRESS in the file.
508 Stop reading at address STOP_POINT in the file, if nonzero.
510 If STREAM is NULL, do not read from it.
511 The caller can supply a buffer of characters
512 to be processed before the data in STREAM.
513 MAGIC is the address of the buffer and
514 MAGICCOUNT is how many characters are in it.
515 Those characters come at address ADDRESS and the data in STREAM follow. */
518 print_strings (const char *filename
, FILE *stream
, file_ptr address
,
519 int stop_point
, int magiccount
, char *magic
)
521 char *buf
= (char *) xmalloc (sizeof (char) * (string_min
+ 1));
529 /* See if the next `string_min' chars are all graphic chars. */
531 if (stop_point
&& address
>= stop_point
)
534 for (i
= 0; i
< string_min
; i
++)
536 c
= get_char (stream
, &address
, &magiccount
, &magic
);
542 if (! STRING_ISGRAPHIC (c
))
543 /* Found a non-graphic. Try again starting with next char. */
548 /* We found a run of `string_min' graphic characters. Print up
549 to the next non-graphic character. */
552 printf ("%s: ", filename
);
554 switch (address_radix
)
557 #ifdef HAVE_LONG_LONG
558 if (sizeof (start
) > sizeof (long))
561 printf ("%7llo ", (unsigned long long) start
);
563 printf ("%7I64o ", (unsigned long long) start
);
567 #elif !BFD_HOST_64BIT_LONG
568 if (start
!= (unsigned long) start
)
569 printf ("++%7lo ", (unsigned long) start
);
572 printf ("%7lo ", (unsigned long) start
);
576 #ifdef HAVE_LONG_LONG
577 if (sizeof (start
) > sizeof (long))
580 printf ("%7lld ", (unsigned long long) start
);
582 printf ("%7I64d ", (unsigned long long) start
);
586 #elif !BFD_HOST_64BIT_LONG
587 if (start
!= (unsigned long) start
)
588 printf ("++%7ld ", (unsigned long) start
);
591 printf ("%7ld ", (long) start
);
595 #ifdef HAVE_LONG_LONG
596 if (sizeof (start
) > sizeof (long))
599 printf ("%7llx ", (unsigned long long) start
);
601 printf ("%7I64x ", (unsigned long long) start
);
605 #elif !BFD_HOST_64BIT_LONG
606 if (start
!= (unsigned long) start
)
607 printf ("%lx%8.8lx ", (unsigned long) (start
>> 32),
608 (unsigned long) (start
& 0xffffffff));
611 printf ("%7lx ", (unsigned long) start
);
620 c
= get_char (stream
, &address
, &magiccount
, &magic
);
623 if (! STRING_ISGRAPHIC (c
))
628 if (output_separator
)
629 fputs (output_separator
, stdout
);
637 usage (FILE *stream
, int status
)
639 fprintf (stream
, _("Usage: %s [option(s)] [file(s)]\n"), program_name
);
640 fprintf (stream
, _(" Display printable strings in [file(s)] (stdin by default)\n"));
641 fprintf (stream
, _(" The options are:\n"));
643 if (DEFAULT_STRINGS_ALL
)
644 fprintf (stream
, _("\
645 -a - --all Scan the entire file, not just the data section [default]\n\
646 -d --data Only scan the data sections in the file\n"));
648 fprintf (stream
, _("\
649 -a - --all Scan the entire file, not just the data section\n\
650 -d --data Only scan the data sections in the file [default]\n"));
652 fprintf (stream
, _("\
653 -f --print-file-name Print the name of the file before each string\n\
654 -n --bytes=[number] Locate & print any NUL-terminated sequence of at\n\
655 -<number> least [number] characters (default 4).\n\
656 -t --radix={o,d,x} Print the location of the string in base 8, 10 or 16\n\
657 -w --include-all-whitespace Include all whitespace as valid string characters\n\
658 -o An alias for --radix=o\n\
659 -T --target=<BFDNAME> Specify the binary file format\n\
660 -e --encoding={s,S,b,l,B,L} Select character size and endianness:\n\
661 s = 7-bit, S = 8-bit, {b,l} = 16-bit, {B,L} = 32-bit\n\
662 -s --output-separator=<string> String used to separate strings in output.\n\
663 @<file> Read options from <file>\n\
664 -h --help Display this information\n\
665 -v -V --version Print the program's version number\n"));
666 list_supported_targets (program_name
, stream
);
667 if (REPORT_BUGS_TO
[0] && status
== 0)
668 fprintf (stream
, _("Report bugs to %s\n"), REPORT_BUGS_TO
);