|  | #!/usr/bin/perl | 
|  |  | 
|  | use File::Basename; | 
|  | use Math::BigInt; | 
|  |  | 
|  | # Copyright 2008, Intel Corporation | 
|  | # | 
|  | # This file is part of the Linux kernel | 
|  | # | 
|  | # This program file is free software; you can redistribute it and/or modify it | 
|  | # under the terms of the GNU General Public License as published by the | 
|  | # Free Software Foundation; version 2 of the License. | 
|  | # | 
|  | # Authors: | 
|  | # 	Arjan van de Ven <arjan@linux.intel.com> | 
|  |  | 
|  |  | 
|  | my $vmlinux_name = $ARGV[0]; | 
|  | if (!defined($vmlinux_name)) { | 
|  | my $kerver = `uname -r`; | 
|  | chomp($kerver); | 
|  | $vmlinux_name = "/lib/modules/$kerver/build/vmlinux"; | 
|  | print "No vmlinux specified, assuming $vmlinux_name\n"; | 
|  | } | 
|  | my $filename = $vmlinux_name; | 
|  | # | 
|  | # Step 1: Parse the oops to find the EIP value | 
|  | # | 
|  |  | 
|  | my $target = "0"; | 
|  | my $function; | 
|  | my $module = ""; | 
|  | my $func_offset = 0; | 
|  | my $vmaoffset = 0; | 
|  |  | 
|  | my %regs; | 
|  |  | 
|  |  | 
|  | sub parse_x86_regs | 
|  | { | 
|  | my ($line) = @_; | 
|  | if ($line =~ /EAX: ([0-9a-f]+) EBX: ([0-9a-f]+) ECX: ([0-9a-f]+) EDX: ([0-9a-f]+)/) { | 
|  | $regs{"%eax"} = $1; | 
|  | $regs{"%ebx"} = $2; | 
|  | $regs{"%ecx"} = $3; | 
|  | $regs{"%edx"} = $4; | 
|  | } | 
|  | if ($line =~ /ESI: ([0-9a-f]+) EDI: ([0-9a-f]+) EBP: ([0-9a-f]+) ESP: ([0-9a-f]+)/) { | 
|  | $regs{"%esi"} = $1; | 
|  | $regs{"%edi"} = $2; | 
|  | $regs{"%esp"} = $4; | 
|  | } | 
|  | if ($line =~ /RAX: ([0-9a-f]+) RBX: ([0-9a-f]+) RCX: ([0-9a-f]+)/) { | 
|  | $regs{"%eax"} = $1; | 
|  | $regs{"%ebx"} = $2; | 
|  | $regs{"%ecx"} = $3; | 
|  | } | 
|  | if ($line =~ /RDX: ([0-9a-f]+) RSI: ([0-9a-f]+) RDI: ([0-9a-f]+)/) { | 
|  | $regs{"%edx"} = $1; | 
|  | $regs{"%esi"} = $2; | 
|  | $regs{"%edi"} = $3; | 
|  | } | 
|  | if ($line =~ /RBP: ([0-9a-f]+) R08: ([0-9a-f]+) R09: ([0-9a-f]+)/) { | 
|  | $regs{"%r08"} = $2; | 
|  | $regs{"%r09"} = $3; | 
|  | } | 
|  | if ($line =~ /R10: ([0-9a-f]+) R11: ([0-9a-f]+) R12: ([0-9a-f]+)/) { | 
|  | $regs{"%r10"} = $1; | 
|  | $regs{"%r11"} = $2; | 
|  | $regs{"%r12"} = $3; | 
|  | } | 
|  | if ($line =~ /R13: ([0-9a-f]+) R14: ([0-9a-f]+) R15: ([0-9a-f]+)/) { | 
|  | $regs{"%r13"} = $1; | 
|  | $regs{"%r14"} = $2; | 
|  | $regs{"%r15"} = $3; | 
|  | } | 
|  | } | 
|  |  | 
|  | sub reg_name | 
|  | { | 
|  | my ($reg) = @_; | 
|  | $reg =~ s/r(.)x/e\1x/; | 
|  | $reg =~ s/r(.)i/e\1i/; | 
|  | $reg =~ s/r(.)p/e\1p/; | 
|  | return $reg; | 
|  | } | 
|  |  | 
|  | sub process_x86_regs | 
|  | { | 
|  | my ($line, $cntr) = @_; | 
|  | my $str = ""; | 
|  | if (length($line) < 40) { | 
|  | return ""; # not an asm istruction | 
|  | } | 
|  |  | 
|  | # find the arguments to the instruction | 
|  | if ($line =~ /([0-9a-zA-Z\,\%\(\)\-\+]+)$/) { | 
|  | $lastword = $1; | 
|  | } else { | 
|  | return ""; | 
|  | } | 
|  |  | 
|  | # we need to find the registers that get clobbered, | 
|  | # since their value is no longer relevant for previous | 
|  | # instructions in the stream. | 
|  |  | 
|  | $clobber = $lastword; | 
|  | # first, remove all memory operands, they're read only | 
|  | $clobber =~ s/\([a-z0-9\%\,]+\)//g; | 
|  | # then, remove everything before the comma, thats the read part | 
|  | $clobber =~ s/.*\,//g; | 
|  |  | 
|  | # if this is the instruction that faulted, we haven't actually done | 
|  | # the write yet... nothing is clobbered. | 
|  | if ($cntr == 0) { | 
|  | $clobber = ""; | 
|  | } | 
|  |  | 
|  | foreach $reg (keys(%regs)) { | 
|  | my $clobberprime = reg_name($clobber); | 
|  | my $lastwordprime = reg_name($lastword); | 
|  | my $val = $regs{$reg}; | 
|  | if ($val =~ /^[0]+$/) { | 
|  | $val = "0"; | 
|  | } else { | 
|  | $val =~ s/^0*//; | 
|  | } | 
|  |  | 
|  | # first check if we're clobbering this register; if we do | 
|  | # we print it with a =>, and then delete its value | 
|  | if ($clobber =~ /$reg/ || $clobberprime =~ /$reg/) { | 
|  | if (length($val) > 0) { | 
|  | $str = $str . " $reg => $val "; | 
|  | } | 
|  | $regs{$reg} = ""; | 
|  | $val = ""; | 
|  | } | 
|  | # now check if we're reading this register | 
|  | if ($lastword =~ /$reg/ || $lastwordprime =~ /$reg/) { | 
|  | if (length($val) > 0) { | 
|  | $str = $str . " $reg = $val "; | 
|  | } | 
|  | } | 
|  | } | 
|  | return $str; | 
|  | } | 
|  |  | 
|  | # parse the oops | 
|  | while (<STDIN>) { | 
|  | my $line = $_; | 
|  | if ($line =~ /EIP: 0060:\[\<([a-z0-9]+)\>\]/) { | 
|  | $target = $1; | 
|  | } | 
|  | if ($line =~ /RIP: 0010:\[\<([a-z0-9]+)\>\]/) { | 
|  | $target = $1; | 
|  | } | 
|  | if ($line =~ /EIP is at ([a-zA-Z0-9\_]+)\+0x([0-9a-f]+)\/0x[a-f0-9]/) { | 
|  | $function = $1; | 
|  | $func_offset = $2; | 
|  | } | 
|  | if ($line =~ /RIP: 0010:\[\<[0-9a-f]+\>\]  \[\<[0-9a-f]+\>\] ([a-zA-Z0-9\_]+)\+(0x[0-9a-f]+)\/0x[a-f0-9]/) { | 
|  | $function = $1; | 
|  | $func_offset = $2; | 
|  | } | 
|  |  | 
|  | # check if it's a module | 
|  | if ($line =~ /EIP is at ([a-zA-Z0-9\_]+)\+(0x[0-9a-f]+)\/0x[a-f0-9]+\W\[([a-zA-Z0-9\_\-]+)\]/) { | 
|  | $module = $3; | 
|  | } | 
|  | if ($line =~ /RIP: 0010:\[\<[0-9a-f]+\>\]  \[\<[0-9a-f]+\>\] ([a-zA-Z0-9\_]+)\+(0x[0-9a-f]+)\/0x[a-f0-9]+\W\[([a-zA-Z0-9\_\-]+)\]/) { | 
|  | $module = $3; | 
|  | } | 
|  | parse_x86_regs($line); | 
|  | } | 
|  |  | 
|  | my $decodestart = Math::BigInt->from_hex("0x$target") - Math::BigInt->from_hex("0x$func_offset"); | 
|  | my $decodestop = Math::BigInt->from_hex("0x$target") + 8192; | 
|  | if ($target eq "0") { | 
|  | print "No oops found!\n"; | 
|  | print "Usage: \n"; | 
|  | print "    dmesg | perl scripts/markup_oops.pl vmlinux\n"; | 
|  | exit; | 
|  | } | 
|  |  | 
|  | # if it's a module, we need to find the .ko file and calculate a load offset | 
|  | if ($module ne "") { | 
|  | my $modulefile = `modinfo $module | grep '^filename:' | awk '{ print \$2 }'`; | 
|  | chomp($modulefile); | 
|  | $filename = $modulefile; | 
|  | if ($filename eq "") { | 
|  | print "Module .ko file for $module not found. Aborting\n"; | 
|  | exit; | 
|  | } | 
|  | # ok so we found the module, now we need to calculate the vma offset | 
|  | open(FILE, "objdump -dS $filename |") || die "Cannot start objdump"; | 
|  | while (<FILE>) { | 
|  | if ($_ =~ /^([0-9a-f]+) \<$function\>\:/) { | 
|  | my $fu = $1; | 
|  | $vmaoffset = hex($target) - hex($fu) - hex($func_offset); | 
|  | } | 
|  | } | 
|  | close(FILE); | 
|  | } | 
|  |  | 
|  | my $counter = 0; | 
|  | my $state   = 0; | 
|  | my $center  = 0; | 
|  | my @lines; | 
|  | my @reglines; | 
|  |  | 
|  | sub InRange { | 
|  | my ($address, $target) = @_; | 
|  | my $ad = "0x".$address; | 
|  | my $ta = "0x".$target; | 
|  | my $delta = hex($ad) - hex($ta); | 
|  |  | 
|  | if (($delta > -4096) && ($delta < 4096)) { | 
|  | return 1; | 
|  | } | 
|  | return 0; | 
|  | } | 
|  |  | 
|  |  | 
|  |  | 
|  | # first, parse the input into the lines array, but to keep size down, | 
|  | # we only do this for 4Kb around the sweet spot | 
|  |  | 
|  | open(FILE, "objdump -dS --adjust-vma=$vmaoffset --start-address=$decodestart --stop-address=$decodestop $filename |") || die "Cannot start objdump"; | 
|  |  | 
|  | while (<FILE>) { | 
|  | my $line = $_; | 
|  | chomp($line); | 
|  | if ($state == 0) { | 
|  | if ($line =~ /^([a-f0-9]+)\:/) { | 
|  | if (InRange($1, $target)) { | 
|  | $state = 1; | 
|  | } | 
|  | } | 
|  | } else { | 
|  | if ($line =~ /^([a-f0-9][a-f0-9][a-f0-9][a-f0-9][a-f0-9][a-f0-9]+)\:/) { | 
|  | my $val = $1; | 
|  | if (!InRange($val, $target)) { | 
|  | last; | 
|  | } | 
|  | if ($val eq $target) { | 
|  | $center = $counter; | 
|  | } | 
|  | } | 
|  | $lines[$counter] = $line; | 
|  |  | 
|  | $counter = $counter + 1; | 
|  | } | 
|  | } | 
|  |  | 
|  | close(FILE); | 
|  |  | 
|  | if ($counter == 0) { | 
|  | print "No matching code found \n"; | 
|  | exit; | 
|  | } | 
|  |  | 
|  | if ($center == 0) { | 
|  | print "No matching code found \n"; | 
|  | exit; | 
|  | } | 
|  |  | 
|  | my $start; | 
|  | my $finish; | 
|  | my $codelines = 0; | 
|  | my $binarylines = 0; | 
|  | # now we go up and down in the array to find how much we want to print | 
|  |  | 
|  | $start = $center; | 
|  |  | 
|  | while ($start > 1) { | 
|  | $start = $start - 1; | 
|  | my $line = $lines[$start]; | 
|  | if ($line =~ /^([a-f0-9]+)\:/) { | 
|  | $binarylines = $binarylines + 1; | 
|  | } else { | 
|  | $codelines = $codelines + 1; | 
|  | } | 
|  | if ($codelines > 10) { | 
|  | last; | 
|  | } | 
|  | if ($binarylines > 20) { | 
|  | last; | 
|  | } | 
|  | } | 
|  |  | 
|  |  | 
|  | $finish = $center; | 
|  | $codelines = 0; | 
|  | $binarylines = 0; | 
|  | while ($finish < $counter) { | 
|  | $finish = $finish + 1; | 
|  | my $line = $lines[$finish]; | 
|  | if ($line =~ /^([a-f0-9]+)\:/) { | 
|  | $binarylines = $binarylines + 1; | 
|  | } else { | 
|  | $codelines = $codelines + 1; | 
|  | } | 
|  | if ($codelines > 10) { | 
|  | last; | 
|  | } | 
|  | if ($binarylines > 20) { | 
|  | last; | 
|  | } | 
|  | } | 
|  |  | 
|  |  | 
|  | my $i; | 
|  |  | 
|  |  | 
|  | # start annotating the registers in the asm. | 
|  | # this goes from the oopsing point back, so that the annotator | 
|  | # can track (opportunistically) which registers got written and | 
|  | # whos value no longer is relevant. | 
|  |  | 
|  | $i = $center; | 
|  | while ($i >= $start) { | 
|  | $reglines[$i] = process_x86_regs($lines[$i], $center - $i); | 
|  | $i = $i - 1; | 
|  | } | 
|  |  | 
|  | $i = $start; | 
|  | while ($i < $finish) { | 
|  | my $line; | 
|  | if ($i == $center) { | 
|  | $line =  "*$lines[$i] "; | 
|  | } else { | 
|  | $line =  " $lines[$i] "; | 
|  | } | 
|  | print $line; | 
|  | if (defined($reglines[$i]) && length($reglines[$i]) > 0) { | 
|  | my $c = 60 - length($line); | 
|  | while ($c > 0) { print " "; $c = $c - 1; }; | 
|  | print "| $reglines[$i]"; | 
|  | } | 
|  | if ($i == $center) { | 
|  | print "<--- faulting instruction"; | 
|  | } | 
|  | print "\n"; | 
|  | $i = $i +1; | 
|  | } | 
|  |  |