kernel-source/symsets.pl

578 lines
16 KiB
Perl
Raw Normal View History

#!/usr/bin/env perl
=head1 NAME
symsets.pl - tool to generate symsets for the kernel packages
=head1 SYNOPSIS
symsets.pl --list-exported-symbols modules...
symsets.pl --generate-symsets [--reference=DIR] --output-dir=DIR modules...
symsets.pl --list-symsets [--reference=DIR] modules...
symsets.pl --check-kabi --reference=DIR modules...
=head1 OPTIONS
=head3 MODE OPTIONS
One of the following options has to be selected:
=over
=item B<--list-exported-symbols>
List symbols exported by modules in a Module.symvers style format.
=item B<--generate-symsets>
Group exported symbols into symsets. Symbols from modules from the same
directory end up in one symset. This option requires B<--output-dir>.
=item B<--list-symsets>
Like B<--generate-symsets>, but only print the symset names on stdout.
=item B<--check-kabi>
Check for kabi changes. This requires B<--reference>.
=back
=head3 OTHER OPTIONS
=over
=item B<-v, --verbose>
Increase verbosity.
=item B<--symvers-file=Module.symvers>
Load built-in symbols from Module.symvers. Only symbols provided by the main
kernel image (marked as vmlinux or built-in) are read from this file.
=item B<--modules=FILE>
Read list of modules from FILE instead of command line. This option can be used
multiple times to read modules from multiple files.
=item B<--required-modules=FILE>
List of modules that are installed by packages required by this package. If
a module moves from subpackage A to subpackage B, this can result in a changed
symset checksum in A. Together with B<--reference>, this option ensures that
the old checksum is provided in the subpackage that installs or requires
all modules from the symset.
=item B<--reference=DIR>
Load symsets of a previous kernel package from DIR and add them to the output
if the symbols are still provided by this kernel package.
=item B<--fake=FILE>
List of exports in Module.symvers format that do not exist, but are
considered unimportant to break a symset. Symsets that contain these fake
symbols are created as ".$name.$hash.fake", so that KMPs don't see them.
This option only makes sense when B<--reference> is given.
=item B<--output-dir=DIR>
Write symsets into DIR (B<--generate-symsets> only).
=item B<--max-badness=NUM>
Set maximum allowed badness to NUM. Meaningful values are 4, 6, 8, 15 or 31
(B<--check-kabi> only).
=item B<--commonsyms=FILE>
Read common symbols from FILE. Badness for changes to common symbols is
incremented by 8 (the resulting badness is 16 by default). (B<--check-kabi>
only).
=item B<--usedsyms=FILE>
Read used symbols from FILE. Badness for changes to used symbols is incremented
by 16 (the resulting badness is 24 by default). (B<--check-kabi> only).
=item B<--severities=FILE>
Read a table of kabi change severities from FILE. Each line consists of a
GLOB-SEVERITY pair separated by whitespace. Changes in modules matching GLOB
will have severity SEVERITY instead of the default 8. (B<--check-kabi> only).
=back
=cut
use strict;
use warnings;
#use diagnostics;
use Digest::MD5 qw(md5_hex);
use Getopt::Long;
# Make pod2usage() available.
# Pod::Usage is preferred.  When it cannot be loaded, a minimal replacement
# is installed that prints a fixed usage summary to STDERR and exits with
# the status passed as -exitval (all other arguments are ignored).
# The replacement is installed with a glob assignment at run time: a named
# "sub" placed inside the "if" would be compiled unconditionally, no matter
# whether Pod::Usage could be loaded.
if (eval { require Pod::Usage; 1 }) {
    Pod::Usage->import('pod2usage');
} else {
    *pod2usage = sub {
        my %opts = @_;
        print STDERR
"Usage:
symsets.pl --list-exported-symbols ...
symsets.pl --generate-symsets [--reference=DIR] --output-dir=DIR ...
symsets.pl --list-symsets [--reference=DIR] ...
symsets.pl --check-kabi --reference=DIR ...
Install Pod::Usage for a better help message.
";
        exit $opts{-exitval};
    };
}
# Package-level state shared by main() and the helper subroutines.

# Mode switches, filled in by GetOptions() in main().
our $opt_list_exp   = 0;
our $opt_gen_sets   = 0;
our $opt_list_sets  = 0;
our $opt_check_kabi = 0;

# Remaining command line options; undefined unless given.
our $opt_verbose;
our $opt_max_badness;
our $opt_commonsyms;
our $opt_usedsyms;
our $opt_severities;
our $opt_symvers_file;
our $opt_reference;
our $opt_fake;
our $opt_output_dir;

# Highest badness recorded by kabi_change().
our $kabi_badness = 0;

# kabi check configuration, filled in by load_kabi_files().
our %commonsyms;
our %usedsyms;
our @severities;
# Program entry point.
# Parses the command line, collects the exports of the given modules (and of
# the built-in symbols from --symvers-file), then runs the selected mode:
# list the exports, generate/list symsets, and/or check the kabi against the
# reference symsets.
# Never returns: exits 0 on success, 1 when the recorded kabi badness exceeds
# --max-badness; option errors end in pod2usage() with exit value 1.
sub main {
    my (@modules, @pulled_modules);
    my $res = GetOptions(
        'verbose|v' => \$opt_verbose,
        'list-exported-symbols' => \$opt_list_exp,
        'generate-symsets' => \$opt_gen_sets,
        'list-symsets' => \$opt_list_sets,
        'check-kabi' => \$opt_check_kabi,
        'max-badness=i' => \$opt_max_badness,
        'commonsyms|common-syms=s' => \$opt_commonsyms,
        'usedsyms|used-syms=s' => \$opt_usedsyms,
        'severities=s' => \$opt_severities,
        'symvers-file=s' => \$opt_symvers_file,
        'modules=s' => sub { push(@modules, load_list($_[1])); },
        'required-modules=s' => sub { push(@pulled_modules, load_list($_[1])); },
        'reference=s' => \$opt_reference,
        'fake=s' => \$opt_fake,
        'output-dir=s' => \$opt_output_dir,
        'usage' => sub { pod2usage(-exitval => 0, -verbose => 0); },
        'help' => sub { pod2usage(-exitval => 0, -verbose => 1); },
    );

    # boring option checking; every problem is reported, then $res decides
    # whether the usage message is shown
    my $opt_err = sub {
        print STDERR "ERROR: @_\n";
        $res = 0;
    };
    $opt_err->("Please choose one of --list-exported-symbols, --generate-symsets, --list-symsets or --check-kabi")
        if ($opt_list_exp + $opt_gen_sets + $opt_list_sets > 1 ||
            !($opt_list_exp + $opt_gen_sets + $opt_list_sets + $opt_check_kabi));
    $opt_err->("--check-kabi doesn't work with --list-exported-symbols")
        if ($opt_list_exp && $opt_check_kabi);
    $opt_err->("--check-kabi requires --reference")
        if ($opt_check_kabi && !$opt_reference);
    $opt_err->("--fake only makes sense with --reference")
        if ($opt_fake && !$opt_reference);
    $opt_err->("--output-dir only makes sense with --generate-symsets")
        if ($opt_output_dir && !$opt_gen_sets);
    $opt_err->("--generate-symsets requires --output-dir")
        if ($opt_gen_sets && !$opt_output_dir);
    if (!$opt_check_kabi) {
        # Options that are only meaningful together with --check-kabi.
        # An explicit table replaces the former symbolic-reference lookup.
        my %kabi_only = (
            'max-badness' => $opt_max_badness,
            'commonsyms'  => $opt_commonsyms,
            'usedsyms'    => $opt_usedsyms,
            'severities'  => $opt_severities,
        );
        # The list needs real parentheses: "for my $opt qw(...)" is a
        # syntax error on perl 5.18 and later.
        for my $opt (qw(max-badness commonsyms usedsyms severities)) {
            if (defined($kabi_only{$opt})) {
                $opt_err->("--$opt only makes sense with --check-kabi");
            }
        }
    }

    # get list of modules; --modules=FILE takes precedence over @ARGV
    if (@modules == 0) {
        @modules = @ARGV;
    }
    if (@modules == 0 && !defined($opt_symvers_file)) {
        $opt_err->("No modules supplied");
    }
    if (!$res) {
        pod2usage(-exitval => 1, -verbose => 0, -output => ">&2");
    }

    # get list of exports
    my (@exports, @pulled_exports, @fake_exports);
    for my $file (@modules) {
        push(@exports, module_exports($file));
    }
    if (defined($opt_symvers_file)) {
        push(@exports, builtin_exports(parse_symset($opt_symvers_file)));
    }
    if ($opt_list_exp) {
        print format_exports(@exports);
        exit 0;
    }
    for my $file (@pulled_modules) {
        push(@pulled_exports, module_exports($file));
    }
    if ($opt_fake) {
        push(@fake_exports, parse_symset($opt_fake));
    }

    # generate symsets and optionally check kabi
    my (@ref, @sets);
    @sets = split_into_symsets(@exports);
    if (defined($opt_reference)) {
        @ref = load_symsets($opt_reference);
        if ($opt_check_kabi) {
            load_kabi_files($opt_commonsyms, $opt_usedsyms, $opt_severities);
        }
        # records kabi breakage if $opt_check_kabi is set
        preserve_symsets(\@sets, \@ref, \@pulled_exports, \@fake_exports);
    }
    if ($opt_gen_sets) {
        write_symsets($opt_output_dir, @sets);
    } elsif ($opt_list_sets) {
        write_symsets(undef, @sets);
    }

    # without --max-badness any badness is tolerated
    if ($kabi_badness) {
        print STDERR "KABI: badness is $kabi_badness";
        if (!defined($opt_max_badness) || $kabi_badness <= $opt_max_badness) {
            print STDERR " (tolerated)\n";
        } else {
            print STDERR " (exceeds threshold $opt_max_badness), aborting\n";
            exit 1;
        }
    }
    exit 0;
}
# structures used:
# %export:
# (crc => $crc, sym => $sym, mod => $module, type => $type)
# @exportlist
# ({crc => $crc, sym => $sym, mod => $module, type => $type}, ...)
# @symset:
# ($name,
# [{crc => $crc, sym => $sym, mod => $module, type => $type}, ...],
# $fake
# )
# @symsetlist:
# (
# [$name,
# [{crc => $crc, sym => $sym, mod => $module, type => $type}, ...],
# $fake
# ],
# ...
# )
#
# Reads a Module.symvers-style file.
# Each line is split on whitespace into crc, symbol, module and export type
# (further fields are ignored); a leading "0x" is removed from the crc.
# Lines with fewer than four fields are reported on STDERR and skipped.
# Returns an exportlist; dies if $file cannot be opened.
sub parse_symset {
    my ($file) = @_;
    my @exports;
    open(my $in, '<', $file) or die "Error opening $file: $!\n";
    while (my $line = <$in>) {
        my @fields = split(/\s+/, $line);
        unless (@fields >= 4) {
            print STDERR "$file:$.: unknown line\n";
            next;
        }
        (my $crc = $fields[0]) =~ s/^0x//;
        push(@exports, {
            crc  => $crc,
            sym  => $fields[1],
            mod  => $fields[2],
            type => $fields[3],
        });
    }
    close($in);
    return @exports;
}
# Filters an exportlist down to the built-in symbols, i.e. the exports whose
# module is "vmlinux" or ends in "/built-in".
sub builtin_exports {
    my @builtin;
    for my $export (@_) {
        next unless $export->{mod} =~ /(^vmlinux$)|(\/built-in$)/;
        push(@builtin, $export);
    }
    return @builtin;
}
# Maps the section name that objdump reports for a __ksymtab_* symbol to the
# export type keyword used in the Module.symvers-style output.
my %export_types = (
    '__ksymtab'            => "EXPORT_SYMBOL",
    '__ksymtab_unused'     => "EXPORT_UNUSED_SYMBOL",
    '__ksymtab_gpl'        => "EXPORT_SYMBOL_GPL",
    '__ksymtab_unused_gpl' => "EXPORT_UNUSED_SYMBOL_GPL",
    '__ksymtab_gpl_future' => "EXPORT_SYMBOL_GPL_FUTURE",
);

# Returns an exportlist for a given module.
# The symbol table is read from "objdump -t $file": __crc_<sym> entries
# supply the crc, __ksymtab_<sym> entries located in one of the sections
# listed in %export_types supply the export type.  A symbol without a crc
# entry gets the crc "00000000".  The module name is $file with everything up
# to .../lib/modules/<version>/kernel/ and a .o/.ko/.a suffix removed.
# Dies if objdump cannot be started or exits with an error.
sub module_exports {
    my ($file) = @_;
    my (%crc_of, %type_of);

    (my $mod = $file) =~ s/.*\/lib\/modules\/[^\/]*\/kernel\///;
    $mod =~ s/\.(k?o|a)$//;

    open(my $objdump, '-|', 'objdump', '-t', $file) or die "objdump -t $file: $!\n";
    while (my $line = <$objdump>) {
        my @fields = split(/\s+/, $line);
        next if (@fields < 3);
        next if ($line =~ /^[^ ]* .....d/); # debug symbol
        my $sym = $fields[-1];
        my $sec = $fields[-3];
        if ($sym =~ /^__crc_(.*)/) {
            my $name = $1;
            # the value column may be 16 digits wide; drop the upper eight
            (my $crc = $fields[0]) =~ s/^0{8}//;
            $crc_of{$name} = $crc;
        } elsif ($sym =~ /^__ksymtab_(.*)/ && exists($export_types{$sec})) {
            $type_of{$1} = $export_types{$sec};
        }
    }
    close($objdump);
    die "objdump returned an error\n" if ($? != 0);

    my @exports = map {
        +{sym => $_, crc => $crc_of{$_} || "0"x8, mod => $mod,
          type => $type_of{$_}}
    } keys(%type_of);
    return @exports;
}
# Formats an exportlist for output: one "0x<crc> <sym> <mod> <type>" line
# (tab separated) per export, sorted by symbol name.
# Returns the lines as a single string ("" for an empty list).
sub format_exports {
    my @by_symbol = sort { $a->{sym} cmp $b->{sym} } @_;
    return join("",
        map { "0x$_->{crc}\t$_->{sym}\t$_->{mod}\t$_->{type}\n" } @by_symbol);
}
# Groups exports by the directory of their module and returns a symsetlist.
# The symset name is the module path without its last component, with the
# remaining slashes turned into underscores.  The order of the returned
# symsets is unspecified (hash order).
sub split_into_symsets {
    my %exports_of;
    for my $export (@_) {
        (my $set_name = $export->{mod}) =~ s/\/[^\/]+$//;
        $set_name =~ s/\//_/g;
        push(@{ $exports_of{$set_name} }, $export);
    }
    my @symsets;
    for my $set_name (keys(%exports_of)) {
        push(@symsets, [$set_name, $exports_of{$set_name}]);
    }
    return @symsets;
}
# Loads the symsets found in a directory created by write_symsets.
# Regular files named [.]<name>.<16 hex digits>[.fake] are parsed with
# parse_symset; any other entry except "." and ".." is reported on STDERR
# and ignored.
# Returns a symsetlist whose entries hold only name and exports.
# Dies if $dir cannot be read.
# FIXME: multiple versions of a symset
sub load_symsets {
    my ($dir) = @_;
    my @symsets;
    opendir(my $dirh, $dir) or die "Error reading directory $dir: $!\n";
    foreach my $entry (readdir($dirh)) {
        next if $entry =~ /^\.\.?$/;
        if (-f "$dir/$entry" &&
            $entry =~ /^\.?([\w-]+)\.[0-9a-f]{16}(\.fake)?$/) {
            my $name = $1;
            push(@symsets, [$name, [parse_symset("$dir/$entry")]]);
        } else {
            print STDERR "Ignoring unknown file $dir/$entry\n";
        }
    }
    closedir($dirh);
    return @symsets;
}
# Returns the first 16 hex digits of the MD5 digest of the arguments
# (md5_hex treats several arguments as one concatenated string).
sub hash {
    my $digest = md5_hex(@_);
    return substr($digest, 0, 16);
}
# Writes symsets as returned by split_into_symsets/load_symsets into $dir.
# Arguments: $dir, followed by the symsetlist.
# Each symset is stored as "$dir/<name>.<hash>", where <hash> is the hash of
# its formatted exports; symsets flagged as fake are stored as
# "$dir/.<name>.<hash>.fake" instead.
# If $dir is undefined, nothing is written and "<name>.<hash>" is printed on
# stdout for every symset.
# Dies if a file cannot be created or completely written.
sub write_symsets {
    my $dir = shift;
    my @sets = @_;
    my $print_only = (!defined($dir));
    for my $set (@sets) {
        my ($name, $exports, $fake) = @$set;
        my $data = format_exports(@$exports);
        my $hash = hash($data);
        if ($print_only) {
            print "$name.$hash\n";
            next;
        }
        my $f = $fake ? "$dir/.$name.$hash.fake" : "$dir/$name.$hash";
        open(my $fh, '>', $f) or die "error creating $f: $!\n";
        # Buffered write errors (e.g. a full disk) may only show up at
        # close(), so both calls are checked; a truncated symset must not
        # go unnoticed.
        print {$fh} $data or die "error writing $f: $!\n";
        close($fh) or die "error writing $f: $!\n";
    }
}
# Loads the kabi check configuration into %commonsyms, %usedsyms and
# @severities.
#   $csfile  - list of common symbols, one per line (skipped if undefined)
#   $usfile  - list of used symbols, one per line (skipped if undefined)
#   $sevfile - table of "GLOB SEVERITY" lines (skipped if undefined); "#"
#              starts a comment and blank lines are ignored
# All whitespace is removed from the symbol lines.  In a GLOB, "*" and "?"
# are translated to ".*" and "." and the result is anchored at both ends;
# each accepted line is appended to @severities as [regexp, severity].
# Malformed severity lines are reported on STDERR and skipped.
# Dies if one of the given files cannot be opened.
sub load_kabi_files {
    my ($csfile, $usfile, $sevfile) = @_;

    if (defined($csfile)) {
        open(my $in, '<', $csfile) or die "Can't open $csfile: $!\n";
        %commonsyms = ();
        while (my $sym = <$in>) {
            $sym =~ s/\s+//g;
            $commonsyms{$sym} = 1;
        }
        close($in);
    }

    if (defined($usfile)) {
        open(my $in, '<', $usfile) or die "Can't open $usfile: $!\n";
        %usedsyms = ();
        while (my $sym = <$in>) {
            $sym =~ s/\s+//g;
            $usedsyms{$sym} = 1;
        }
        close($in);
    }

    return if !defined($sevfile);

    open(my $in, '<', $sevfile) or die "Can't open $sevfile: $!\n";
    while (my $line = <$in>) {
        chomp($line);
        $line =~ s/#.*//;
        next if $line =~ /^\s*$/;
        my @fields = split(/\s+/, $line);
        unless (@fields == 2) {
            print STDERR "$sevfile:$.: unknown line\n";
            next;
        }
        my ($pattern, $severity) = @fields;
        unless ($severity =~ /^\d+$/) {
            print STDERR "$sevfile:$.: invalid severity $severity\n";
            next;
        }
        # simple glob -> regexp conversion
        $pattern =~ s/\*/.*/g;
        $pattern =~ s/\?/./g;
        $pattern =~ s/.*/^$&\$/;
        push(@severities, [$pattern, $severity]);
    }
    close($in);
}
# Loads a list of filenames from $file, one name per line.
# The special name "-" reads the list from a duplicate of STDIN.
# Returns the lines with their trailing newline removed.
# Dies if the file cannot be opened or STDIN cannot be duplicated.
sub load_list {
    my ($file) = @_;
    my $fh;
    if ($file eq '-') {
        # three-argument dup, checked like the regular open below
        open($fh, '<&', \*STDIN) or die "Error duplicating STDIN: $!\n";
    } else {
        open($fh, '<', $file) or die "Error opening $file: $!\n";
    }
    my @res = <$fh>;
    chomp(@res);
    close($fh);
    return @res;
}
# Records a kabi change for export $exp; the remaining arguments describe the
# change and are appended to the message printed on STDERR.
# Does nothing unless --check-kabi is active.
# The badness starts at the severity of the first @severities rule whose
# regexp matches the module of $exp (8 if none matches); 16 is added for a
# symbol listed in %usedsyms, otherwise 8 for one listed in %commonsyms.
# $kabi_badness keeps the highest badness seen so far.
sub kabi_change {
    my ($exp, @what) = @_;
    return if !$opt_check_kabi;

    my ($rule) = grep { $exp->{mod} =~ $_->[0] } @severities;
    my $sev = $rule ? $rule->[1] : 8;

    my $sym = $exp->{sym};
    if (exists($usedsyms{$sym})) {
        $sev += 16;
    } elsif (exists($commonsyms{$sym})) {
        $sev += 8;
    }

    print STDERR "KABI: symbol $exp->{sym}.$exp->{crc} (badness $sev): @what\n";
    if ($sev > $kabi_badness) {
        $kabi_badness = $sev;
    }
}
# Checks whether all symbols from the $old symsetlist are provided by the
# $new symsetlist and adds the old symsets that are still compatible to $new.
#   $new            - reference to the symsetlist of this package (modified)
#   $old            - reference to the symsetlist of the reference package
#   $pulled_exports - reference to an exportlist of modules that are pulled
#                     in as dependencies of this package (thus also
#                     "provided" by this package)
#   $fake_exports   - reference to an exportlist of exports that do not
#                     exist but must not break a symset
# An old symset is compatible if every symbol is provided with the same crc
# by $new or $pulled_exports, or is listed with that crc in $fake_exports
# (the preserved symset is then flagged as fake).  Every other symbol is
# passed to kabi_change().  A compatible symset that contains none of our own
# symbols is not added.
sub preserve_symsets {
    my ($new, $old, $pulled_exports, $fake_exports) = @_;
    my (%symcrcs, %pulled_symcrcs, %fake_symcrcs, %symsethashes);

    # index the new symsets: hash per symset name, crc per symbol
    for my $set (@$new) {
        my $name = $set->[0];
        my $exports = $set->[1];
        $symsethashes{$name} = hash(format_exports(@$exports));
        for my $exp (@$exports) {
            $symcrcs{$exp->{sym}} = $exp->{crc};
        }
    }
    for my $exp (@$pulled_exports) {
        $pulled_symcrcs{$exp->{sym}} = $exp->{crc};
    }
    for my $exp (@$fake_exports) {
        $fake_symcrcs{$exp->{sym}} = $exp->{crc};
    }

    for my $set (@$old) {
        my $name = $set->[0];
        my $exports = $set->[1];
        my $hash = hash(format_exports(@$exports));
        # an identical symset is already part of $new
        if (exists($symsethashes{$name}) && $symsethashes{$name} eq $hash) {
            next;
        }
        my $compatible = 1;
        my $fake = 0;
        my $oursyms = 0;    # number of symbols provided by $new itself
        for my $exp (@$exports) {
            my $crc;
            if (exists($symcrcs{$exp->{sym}})) {
                $oursyms++;
                $crc = $symcrcs{$exp->{sym}};
            } elsif (exists($pulled_symcrcs{$exp->{sym}})) {
                $crc = $pulled_symcrcs{$exp->{sym}};
            }
            if ($crc && $crc eq $exp->{crc}) {
                next;
            }
            if (exists($fake_symcrcs{$exp->{sym}}) &&
                $fake_symcrcs{$exp->{sym}} eq $exp->{crc}) {
                $fake = 1;
                next;
            }
            if (!$crc) {
                kabi_change($exp, "missing");
            } else {
                # no trailing newline here: kabi_change() terminates the line
                kabi_change($exp, "crc changed to $crc");
            }
            $compatible = 0;
        }
        if ($compatible) {
            if ($oursyms == 0) {
                # this symset is fully provided by a package we require,
                # so do not duplicate it in our symsets
                next;
            }
            if ($opt_verbose && $opt_check_kabi) {
                print STDERR "KABI: symset $name.$hash preserved";
                print STDERR " using fake exports" if $fake;
                print STDERR "\n";
            }
            push(@$new, [$name, $exports, $fake]);
        } else {
            print STDERR "KABI: symset $name.$hash NOT preserved\n"
                if $opt_check_kabi;
        }
    }
}
# Run the program; main() ends the process through exit().
main();
# vim: sw=4:et:sts=4