Merge tag 'trace-v4.19-rc4' of git://git.kernel.org/pub/scm/linux/kernel/git/rostedt...
[linux-2.6/btrfs-unstable.git] / scripts / leaking_addresses.pl
blob6a897788f5a7ecd3eb699ebd6aec21ee1125aecd
1 #!/usr/bin/env perl
#
# (c) 2017 Tobin C. Harding <me@tobin.cc>
# Licensed under the terms of the GNU GPL License version 2
#
# leaking_addresses.pl: Scan the kernel for potential leaking addresses.
#  - Scans dmesg output.
#  - Walks directory tree and parses each file (for each directory in @DIRS).
#
# Use --debug to output path before parsing, this is useful to find files that
# cause the script to choke.
#
# When the system is idle it is likely that most files under /proc/PID will be
# identical for various processes.  Scanning _all_ the PIDs under /proc is
# unnecessary and implies that we are thoroughly scanning /proc.  This is _not_
# the case because there may be ways userspace can trigger creation of /proc
# files that leak addresses but were not present during a scan.  For these two
# reasons we exclude all PID directories under /proc except '1/'.
21 use warnings;
22 use strict;
23 use POSIX;
24 use File::Basename;
25 use File::Spec;
26 use Cwd 'abs_path';
27 use Term::ANSIColor qw(:constants);
28 use Getopt::Long qw(:config no_auto_abbrev);
29 use Config;
30 use bigint qw/hex/;
31 use feature 'state';
# Name this script was invoked as; interpolated into the usage text.
my $P = $0;

# Directories to scan.
my @DIRS = qw(/proc /sys);

# Timer for parsing each file, in seconds.
my $TIMEOUT = 10;

# Kernel addresses vary by architecture.  We can only auto-detect the following
# architectures (using `uname -m`).  (flag --32-bit overrides auto-detection.)
my @SUPPORTED_ARCHITECTURES = qw(x86_64 ppc64 x86);

# Command line options (filled in by GetOptions).
my $help = 0;			# Show usage and exit.
my $debug = 0;			# Emit debugging output on STDERR.
my $raw = 0;			# Show raw results.
my $output_raw = "";		# Write raw results to file.
my $input_raw = "";		# Read raw results from file instead of scanning.
my $suppress_dmesg = 0;		# Don't show dmesg in output.
my $squash_by_path = 0;		# Summary report grouped by absolute path.
my $squash_by_filename = 0;	# Summary report grouped by filename.
my $kernel_config_file = "";	# Kernel configuration file.
my $opt_32bit = 0;		# Scan 32-bit kernel.
my $page_offset_32bit = 0;	# Page offset for 32-bit kernel.

# Skip these absolute paths.
my @skip_abs = qw(
	/proc/kmsg
	/proc/device-tree
	/proc/1/syscall
	/sys/firmware/devicetree
	/sys/kernel/debug/tracing/trace_pipe
	/sys/kernel/security/apparmor/revision
);

# Skip these under any subdirectory.
my @skip_any = qw(
	pagemap
	events
	access
	registers
	snapshot_raw
	trace_pipe_raw
	ptmx
	trace_pipe
	fd
	usbmon
);
# Print the usage text to the currently selected output handle, then
# terminate the process with $exitcode.
sub help
{
	my ($exitcode) = @_;

	my $usage = <<"EOM";

Usage: $P [OPTIONS]

Options:

	-o, --output-raw=<file>		Save results for future processing.
	-i, --input-raw=<file>		Read results from file instead of scanning.
	      --raw			Show raw results (default).
	      --suppress-dmesg		Do not show dmesg results.
	      --squash-by-path		Show one result per unique path.
	      --squash-by-filename	Show one result per unique filename.
	--kernel-config-file=<file>     Kernel configuration file (e.g /boot/config)
	--32-bit			Scan 32-bit kernel.
	--page-offset-32-bit=o		Page offset (for 32-bit kernel 0xABCD1234).
	-d, --debug			Display debugging output.
	-h, --help, --version		Display this help and exit.

Scans the running kernel for potential leaking addresses.

EOM

	print $usage;
	exit($exitcode);
}
# Parse the command line; any unknown option prints usage and exits 1.
GetOptions(
	'd|debug'		=> \$debug,
	'h|help'		=> \$help,
	'version'		=> \$help,
	'o|output-raw=s'	=> \$output_raw,
	'i|input-raw=s'		=> \$input_raw,
	'suppress-dmesg'	=> \$suppress_dmesg,
	'squash-by-path'	=> \$squash_by_path,
	'squash-by-filename'	=> \$squash_by_filename,
	'raw'			=> \$raw,
	'kernel-config-file=s'	=> \$kernel_config_file,
	'32-bit'		=> \$opt_32bit,
	'page-offset-32-bit=o'	=> \$page_offset_32bit,
) or help(1);

if ($help) {
	help(0);
}

# Post-processing mode: format previously saved results, do not scan.
if ($input_raw) {
	format_output($input_raw);
	exit(0);
}

# Summary reports work from saved raw results only.
if (!$input_raw and ($squash_by_path or $squash_by_filename)) {
	print "\nSummary reporting only available with --input-raw=<file>\n";
	print "(First run scan with --output-raw=<file>.)\n";
	exit(128);
}

# Refuse to scan when we cannot tell what a kernel address looks like.
unless (is_supported_architecture() or $opt_32bit or $page_offset_32bit) {
	print "\nScript does not support your architecture, sorry.\n";
	print "\nCurrently we support: \n\n";
	foreach my $supported (@SUPPORTED_ARCHITECTURES) {
		printf "\t%s\n", $supported;
	}
	print "\n";

	print "If you are running a 32-bit architecture you may use:\n";
	print "\n\t--32-bit or --page-offset-32-bit=<page offset>\n\n";

	my $archname = `uname -m`;
	printf("Machine hardware name (`uname -m`): %s\n", $archname);

	exit(129);
}

# With --output-raw, make the file the default handle so that every
# subsequent plain print/printf lands in it.
if ($output_raw) {
	open my $fh, '>', $output_raw or die "$0: $output_raw: $!\n";
	select $fh;
}

parse_dmesg();
walk(@DIRS);

exit 0;
# printf-style debug output on STDERR.  The first argument is the format
# string; nothing is printed unless --debug was given.
sub dprint
{
	if ($debug) {
		printf STDERR @_;
	}
}
# True if the running machine is one of the architectures we can auto-detect.
sub is_supported_architecture
{
	return 1 if is_x86_64();
	return 1 if is_ppc64();
	return is_ix86_32();
}
# True if we are scanning a 32-bit kernel, either because the user said so
# or because the machine was detected as 32-bit x86.
sub is_32bit
{
	# Allow --32-bit or --page-offset-32-bit to override
	return 1 if ($opt_32bit or $page_offset_32bit);

	return is_ix86_32();
}
# Returns 1 if `uname -m` reports an i386/i486/i586/i686 machine, else 0.
# The uname output is fetched once and remembered across calls.
sub is_ix86_32
{
	state $machine = `uname -m`;

	chomp $machine;
	return ($machine =~ m/i[3456]86/) ? 1 : 0;
}
# Returns 1 if `uname -m` prints exactly $desc, else 0.
sub is_arch
{
	my ($desc) = @_;

	chomp(my $machine = `uname -m`);
	return ($machine eq $desc) ? 1 : 0;
}
# True on x86_64.  The answer is computed on first use and then reused.
sub is_x86_64
{
	state $cached = is_arch('x86_64');

	return $cached;
}
# True on ppc64.  The answer is computed on first use and then reused.
sub is_ppc64
{
	state $cached = is_arch('ppc64');

	return $cached;
}
# Gets config option value from kernel config file.
# Returns "" on error or if config option not found.
#
# Config sources, in order of preference:
#   1. the file given with --kernel-config-file,
#   2. /proc/config.gz, decompressed into a private temporary file,
#   3. /boot/config-`uname -r`, then /boot/config.
sub get_kernel_config_option
{
	my ($option) = @_;
	my $value = "";
	my $tmp_file = "";
	my @config_files;

	# Allow --kernel-config-file to override.
	if ($kernel_config_file ne "") {
		@config_files = ($kernel_config_file);
	} elsif (-R "/proc/config.gz") {
		# Use an unpredictable, exclusively created file rather than a
		# fixed name in /tmp: this script is normally run as root.
		require File::Temp;
		my $tmp_fh;
		($tmp_fh, $tmp_file) = eval {
			File::Temp::tempfile('tmpkconfXXXXXX', TMPDIR => 1);
		};
		if (!$tmp_fh) {
			dprint("%s: failed to create temporary config file\n", $0);
			return "";
		}

		# List-form pipe open: no shell is involved.
		my $ok = open(my $gz, '-|', 'gunzip', '-c', '/proc/config.gz');
		if ($ok) {
			while (my $chunk = <$gz>) {
				print {$tmp_fh} $chunk;
			}
			$ok = close($gz);	# false if gunzip exited non-zero
		}
		$ok = 0 unless close($tmp_fh);

		if (!$ok) {
			dprint("%s: gunzip of /proc/config.gz failed\n", $0);
			unlink $tmp_file;	# do not leave a partial file behind
			return "";
		}
		@config_files = ($tmp_file);
	} else {
		my $file = '/boot/config-' . `uname -r`;
		chomp $file;
		@config_files = ($file, '/boot/config');
	}

	foreach my $file (@config_files) {
		dprint("parsing config file: %s\n", $file);
		$value = option_from_file($option, $file);
		if ($value ne "") {
			last;
		}
	}

	# $tmp_file is only non-empty when we created it above.
	if ($tmp_file ne "") {
		unlink $tmp_file;
	}

	return $value;
}
# Parses $file and returns kernel configuration option value.
#
# $option is matched literally and must be followed directly by '=', so
# looking up CONFIG_FOO never picks up CONFIG_FOO_BAR.  Everything after the
# first '=' up to the end of the line is returned unchanged (quotes, further
# '=' characters and all).  Returns "" if the file cannot be opened or the
# option is not set in it.
sub option_from_file
{
	my ($option, $file) = @_;
	my $val = "";

	open(my $fh, "<", $file) or return "";
	while (my $line = <$fh>) {
		if ($line =~ /^\Q$option\E=(.*)$/) {
			$val = $1;
			last;
		}
	}

	close $fh;
	return $val;
}
# Returns 1 if $match, although shaped like a kernel address, is a value we
# know not to be one; 0 otherwise.  32-bit kernels have their own rules.
sub is_false_positive
{
	my ($match) = @_;

	return is_false_positive_32bit($match) if is_32bit();

	# 64 bit false positives.

	# All ones / all zeroes.
	return 1 if ($match =~ '\b(0x)?(f|F){16}\b');
	return 1 if ($match =~ '\b(0x)?0{16}\b');

	return 1 if (is_x86_64() and is_in_vsyscall_memory_region($match));

	return 0;
}
# 32-bit variant of is_false_positive(): all-ones values and anything below
# the kernel page offset are not kernel addresses.
sub is_false_positive_32bit
{
	my ($match) = @_;
	state $page_offset = get_page_offset();	# looked up once, then reused

	return 1 if ($match =~ '\b(0x)?(f|F){8}\b');

	return (hex($match) < $page_offset) ? 1 : 0;
}
# Returns the 32-bit kernel page offset as an integer value.
#
# Order of preference: --page-offset-32-bit, then CONFIG_PAGE_OFFSET from the
# kernel config, then the default 0xc0000000.
sub get_page_offset
{
	my $default_offset = 0xc0000000;

	# Allow --page-offset-32-bit to override.
	if ($page_offset_32bit != 0) {
		return $page_offset_32bit;
	}

	my $page_offset = get_kernel_config_option('CONFIG_PAGE_OFFSET');
	if (!$page_offset) {
		return $default_offset;
	}

	# The config file holds the offset as text (e.g. "0xC0000000").  Convert
	# it here so callers get a number, as documented, instead of relying on
	# implicit string-to-number conversion at the comparison site.
	if ($page_offset =~ /^0[xX][[:xdigit:]]+$/) {
		return hex($page_offset);
	}
	return $page_offset;
}
# True if the hex string $match lies within 0xffffffffff600000 ..
# 0xffffffffff601000 (both ends inclusive).
sub is_in_vsyscall_memory_region
{
	my ($match) = @_;

	my $addr = hex($match);
	my $lowest = hex("0xffffffffff600000");
	my $highest = hex("0xffffffffff601000");

	return !($addr < $lowest or $addr > $highest);
}
# True if argument potentially contains a kernel address.
#
# Lines known to carry address-shaped values that are not addresses are
# rejected up front; otherwise every address-shaped token in $line is checked
# and the first one that is not a false positive makes the line a hit.
sub may_leak_address
{
	my ($line) = @_;

	# Signal masks.
	foreach my $mask ('^SigBlk:', '^SigIgn:', '^SigCgt:') {
		return 0 if ($line =~ $mask);
	}

	# Lines made of a 14-digit and two 16-digit hex fields, with or
	# without a leading KEY=.
	return 0 if ($line =~ '\bKEY=[[:xdigit:]]{14} [[:xdigit:]]{16} [[:xdigit:]]{16}\b');
	return 0 if ($line =~ '\b[[:xdigit:]]{14} [[:xdigit:]]{16} [[:xdigit:]]{16}\b');

	my $address_re = get_address_re();
	while ($line =~ /($address_re)/g) {
		return 1 unless is_false_positive($1);
	}

	return 0;
}
# Returns the regular expression (as a string) that matches a kernel address
# on the architecture being scanned.
sub get_address_re
{
	return '\b(0x)?[89abcdef]00[[:xdigit:]]{13}\b' if is_ppc64();
	return '\b(0x)?[[:xdigit:]]{8}\b' if is_32bit();

	return get_x86_64_re();
}
# Returns the regular expression (as a string) matching an x86_64 kernel
# address.
sub get_x86_64_re
{
	# We handle page table levels but only if explicitly configured using
	# CONFIG_PGTABLE_LEVELS.  If config file parsing fails or config option
	# is not found we default to using address regular expression suitable
	# for 4 page table levels.
	state $ptl = get_kernel_config_option('CONFIG_PGTABLE_LEVELS');

	# $ptl is "" when the option could not be read; compare as a string so
	# that case does not raise an "isn't numeric" warning.
	if ($ptl eq '5') {
		return '\b(0x)?ff[[:xdigit:]]{14}\b';
	}
	return '\b(0x)?ffff[[:xdigit:]]{12}\b';
}
# Runs dmesg and prints, prefixed with 'dmesg: ', every output line that may
# contain a kernel address.  If dmesg cannot be started the dmesg scan is
# skipped (with a debug message) and the rest of the scan carries on.
sub parse_dmesg
{
	my $cmd;
	if (!open($cmd, '-|', 'dmesg')) {
		dprint("%s: failed to run dmesg: %s\n", $0, $!);
		return;
	}

	# Named loop variable: may_leak_address() runs regexes and calls other
	# subs, so do not keep the current line in the global $_.
	while (my $line = <$cmd>) {
		if (may_leak_address($line)) {
			print 'dmesg: ' . $line;
		}
	}
	close $cmd;
}
# True if we should skip this path.
#
# A path is skipped when it is listed verbatim in @skip_abs, or when its last
# component is listed verbatim in @skip_any.  Comparison is plain string
# equality: paths come straight from the filesystem and may contain regex
# metacharacters, so they must never be used as patterns.
sub skip
{
	my ($path) = @_;

	foreach my $abs (@skip_abs) {
		return 1 if ($abs eq $path);
	}

	my ($filename) = fileparse($path);
	foreach my $name (@skip_any) {
		return 1 if ($name eq $filename);
	}

	return 0;
}
# Parses $file, giving up after $TIMEOUT seconds.  A timeout is reported on
# STDERR; any other error raised while parsing is re-thrown.
sub timed_parse_file
{
	my ($file) = @_;

	eval {
		local $SIG{ALRM} = sub { die "alarm\n" }; # NB: \n required.
		alarm $TIMEOUT;
		parse_file($file);
		alarm 0;
	};

	return unless $@;

	die unless $@ eq "alarm\n";	# Propagate unexpected errors.
	printf STDERR "timed out parsing: %s\n", $file;
}
# Prints, prefixed with the file name, every line of $file that may contain a
# kernel address.  Files that are unreadable, that do not look like text, or
# that cannot be opened are silently ignored.
sub parse_file
{
	my ($file) = @_;

	return unless (-R $file);
	return unless (-T $file);

	open my $fh, "<", $file or return;
	while (my $line = <$fh>) {
		print $file . ': ' . $line if may_leak_address($line);
	}
	close $fh;
}
# Checks if the actual path name is leaking a kernel address, and reports it
# on the currently selected output handle if so.
sub check_path_for_leaks
{
	my ($path) = @_;

	if (may_leak_address($path)) {
		# Pass the path as an argument, never as part of the format:
		# a '%' in a file name must be printed literally.
		printf("Path name may contain address: %s\n", $path);
	}
}
# Recursively walk directory tree.
#
# Takes the list of directories to start from.  Sub-directories are appended
# to the work list as they are found; symlinks are never followed.  Every
# path that is not skipped has its name checked for leaks, and every
# non-directory is parsed with a timeout.
sub walk
{
	my @dirs = @_;

	# defined(): a directory name that is false as a string must not end
	# the loop early.
	while (defined(my $pwd = shift @dirs)) {
		# Lexical handle instead of a global bareword one.
		opendir(my $dh, $pwd) or next;
		my @files = readdir($dh);
		closedir($dh);

		foreach my $file (@files) {
			next if ($file eq '.' or $file eq '..');

			my $path = "$pwd/$file";
			next if (-l $path);

			# skip /proc/PID except /proc/1
			next if (($path =~ /^\/proc\/[0-9]+$/) &&
				 ($path !~ /^\/proc\/1$/));

			next if (skip($path));

			check_path_for_leaks($path);

			if (-d $path) {
				push @dirs, $path;
				next;
			}

			# dprint() is printf-like: keep the path out of the
			# format string.
			dprint("parsing: %s\n", $path);
			timed_parse_file($path);
		}
	}
}
# Formats previously saved raw results from $file: either dumps them as they
# are, or prints the summary reports selected on the command line.
sub format_output
{
	my ($file) = @_;

	# Default is to show raw results.
	my $want_summary = ($squash_by_path or $squash_by_filename);
	if ($raw or !$want_summary) {
		dump_raw_output($file);
		return;
	}

	my ($total, $dmesg, $paths, $files) = parse_raw_file($file);

	printf "\nTotal number of results from scan (incl dmesg): %d\n", $total;

	print_dmesg($dmesg) unless $suppress_dmesg;

	squash_by($files, 'filename') if $squash_by_filename;

	squash_by($paths, 'path') if $squash_by_path;
}
# Copies the raw results in $file to the output, leaving out lines that start
# with "dmesg:" when --suppress-dmesg is in effect.  Dies if $file cannot be
# opened.
sub dump_raw_output
{
	my ($file) = @_;

	open (my $fh, '<', $file) or die "$0: $file: $!\n";
	while (my $line = <$fh>) {
		next if ($suppress_dmesg and "dmesg:" eq substr($line, 0, 6));
		print $line;
	}
	close $fh;
}
# Reads the raw results in $file.  Dies if $file cannot be opened.
#
# Returns a four element list:
#   - total number of lines read,
#   - array ref of the lines that start with "dmesg:",
#   - hash ref of results keyed by path,
#   - hash ref of results keyed by file name.
sub parse_raw_file
{
	my ($file) = @_;

	my $total = 0;		# Total number of lines parsed.
	my @dmesg;		# dmesg output.
	my %files;		# Unique filenames containing leaks.
	my %paths;		# Unique paths containing leaks.

	open (my $fh, '<', $file) or die "$0: $file: $!\n";
	while (my $line = <$fh>) {
		$total++;

		if ("dmesg:" eq substr($line, 0, 6)) {
			push @dmesg, $line;
		} else {
			cache_path(\%paths, $line);
			cache_filename(\%files, $line);
		}
	}

	return $total, \@dmesg, \%paths, \%files;
}
# Prints the dmesg section of the report.  $dmesg is an array ref of raw
# result lines; each is printed with everything up to and including the
# first ': ' removed.
sub print_dmesg
{
	my ($dmesg) = @_;

	print "\ndmesg output:\n";

	unless (@$dmesg) {
		print "<no results>\n";
		return;
	}

	foreach my $entry (@$dmesg) {
		my $start = index($entry, ': ') + 2;	# skip ': '
		print substr($entry, $start);
	}
}
# Prints one line per key of %$ref: the number of results recorded under that
# key, the key itself and the first result as an example.
#
# $ref  - hash ref mapping a key to an array ref of result lines.
# $desc - what the keys are ('path' or 'filename'); used in the heading.
#
# Keys are printed in sorted order so repeated runs over the same input
# produce the same report.
sub squash_by
{
	my ($ref, $desc) = @_;

	print "\nResults squashed by $desc (excl dmesg). ";
	print "Displaying [<number of results> <$desc>], <example result>\n";

	if (keys %$ref == 0) {
		print "<no results>\n";
		return;
	}

	foreach my $key (sort keys %$ref) {
		my $lines = $ref->{$key};
		# Result lines keep their trailing newline, hence none here.
		printf "[%d %s] %s", scalar(@$lines), $key, $lines->[0];
	}
}
# Records one raw result line in %$paths, keyed by the path in front of the
# first ': '.  The stored value is the remainder of the line.
# Lines without a ': ' separator are not results and are ignored.
sub cache_path
{
	my ($paths, $line) = @_;

	my $index = index($line, ': ');
	return if ($index < 0);		# no separator: nothing to record

	my $path = substr($line, 0, $index);

	$index += 2;			# skip ': '
	add_to_cache($paths, $path, substr($line, $index));
}
# Records one raw result line in %$files, keyed by the base name of the path
# in front of the first ': '.  The stored value is the remainder of the line.
# Lines without a ': ' separator are not results and are ignored.
sub cache_filename
{
	my ($files, $line) = @_;

	my $index = index($line, ': ');
	return if ($index < 0);		# no separator: nothing to record

	my $path = substr($line, 0, $index);
	my $filename = basename($path);

	$index += 2;			# skip ': '
	add_to_cache($files, $filename, substr($line, $index));
}
# Appends $value to the list stored under $key in the hash ref $cache,
# creating the list on first use.
sub add_to_cache
{
	my ($cache, $key, $value) = @_;

	# Start from a real empty array ref; assigning () would store undef.
	$cache->{$key} //= [];
	push @{$cache->{$key}}, $value;
}