scripts: get_abi.pl: detect softlinks

The way sysfs works is that the same leave may be present under
/sys/devices, /sys/bus and /sys/class, etc, linked via soft
symlinks.

To make it harder to parse, the ABI definition usually refers
only to one of those locations.

So, improve the logic in order to retrieve the symlinks.

Signed-off-by: Mauro Carvalho Chehab <mchehab+huawei@kernel.org>
Link: https://lore.kernel.org/r/77c49f7d158d88e17f18d40652b75cdde9e179eb.1631957565.git.mchehab+huawei@kernel.org
Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
This commit is contained in:
Mauro Carvalho Chehab 2021-09-18 11:52:13 +02:00 committed by Greg Kroah-Hartman
parent f090db4395
commit ab02c5150b
1 changed files with 165 additions and 42 deletions

View File

@ -8,8 +8,10 @@ use Pod::Usage;
use Getopt::Long;
use File::Find;
use Fcntl ':mode';
use Cwd 'abs_path';
my $help = 0;
my $hint = 0;
my $man = 0;
my $debug = 0;
my $enable_lineno = 0;
@ -28,6 +30,7 @@ GetOptions(
"rst-source!" => \$description_is_rst,
"dir=s" => \$prefix,
'help|?' => \$help,
"show-hints" => \$hint,
man => \$man
) or pod2usage(2);
@ -526,7 +529,7 @@ sub search_symbols {
}
# Exclude /sys/kernel/debug and /sys/kernel/tracing from the search path
sub skip_debugfs {
sub dont_parse_special_attributes {
if (($File::Find::dir =~ m,^/sys/kernel,)) {
return grep {!/(debug|tracing)/ } @_;
}
@ -539,64 +542,178 @@ sub skip_debugfs {
}
my %leaf;
my %aliases;
my @files;
my $escape_symbols = qr { ([\x01-\x08\x0e-\x1f\x21-\x29\x2b-\x2d\x3a-\x40\x7b-\xff]) }x;
my $escape_symbols = qr { ([\x01-\x08\x0e-\x1f\x21-\x29\x2b-\x2d\x3a-\x40\x7b-\xfe]) }x;
sub parse_existing_sysfs {
my $file = $File::Find::name;
my $mode = (lstat($file))[2];
my $abs_file = abs_path($file);
my $mode = (stat($file))[2];
return if ($mode & S_IFDIR);
if (S_ISLNK($mode)) {
$aliases{$file} = $abs_file;
return;
}
return if (S_ISDIR($mode));
# Trivial: file is defined exactly the same way at ABI What:
return if (defined($data{$file}));
return if (defined($data{$abs_file}));
push @files, $abs_file;
}
sub check_undefined_symbols {
foreach my $file (sort @files) {
# sysfs-module is special, as its definitions are inside
# a text. For now, just ignore them.
next if ($file =~ m#^/sys/module/#);
# Ignore cgroup and firmware
next if ($file =~ m#^/sys/(fs/cgroup|firmware)/#);
my $defined = 0;
my $exact = 0;
my $whats = "";
my $leave = $file;
$leave =~ s,.*/,,;
my $path = $file;
$path =~ s,(.*/).*,$1,;
if (defined($leaf{$leave})) {
# FIXME: need to check if the path makes sense
my $what = $leaf{$leave};
$whats .= " $what" if (!($whats =~ m/$what/));
$what =~ s/,/ /g;
foreach my $w (split / /, $what) {
if ($file =~ m#^$w$#) {
$exact = 1;
last;
}
}
# Check for aliases
#
# TODO: this algorithm is O(w * n²). It can be
# improved in the future in order to handle it
# faster, by changing parse_existing_sysfs to
# store the sysfs inside a tree, at the expense
# on making the code less readable and/or using some
# additional perl library.
foreach my $a (keys %aliases) {
my $new = $aliases{$a};
my $len = length($new);
$what =~ s/\<[^\>]+\>/.*/g;
$what =~ s/\{[^\}]+\}/.*/g;
$what =~ s/\[[^\]]+\]/.*/g;
$what =~ s,/\.\.\./,/.*/,g;
$what =~ s,/\*/,/.*/,g;
if (substr($file, 0, $len) eq $new) {
my $newf = $a . substr($file, $len);
$what =~ s/\s+/ /g;
# Escape all other symbols
$what =~ s/$escape_symbols/\\$1/g;
foreach my $i (split / /,$what) {
if ($file =~ m#^$i$#) {
# print "$file: $i: OK!\n";
return;
foreach my $w (split / /, $what) {
if ($newf =~ m#^$w$#) {
$exact = 1;
last;
}
}
}
}
print "$file: $leave is defined at $what\n";
return;
$defined++;
}
next if ($exact);
# Ignore some sysfs nodes
next if ($file =~ m#/(sections|notes)/#);
# Would need to check at
# Documentation/admin-guide/kernel-parameters.txt, but this
# is not easily parseable.
next if ($file =~ m#/parameters/#);
if ($hint && $defined) {
print "$leave at $path might be one of:$whats\n";
next;
}
print "$file not found.\n";
}
}
sub undefined_symbols {
find({
wanted =>\&parse_existing_sysfs,
preprocess =>\&dont_parse_special_attributes,
no_chdir => 1
}, $sysfs_prefix);
foreach my $w (sort keys %data) {
foreach my $what (split /\xac /,$w) {
next if (!($what =~ m/^$sysfs_prefix/));
# Convert what into regular expressions
$what =~ s,/\.\.\./,/*/,g;
$what =~ s,\*,.*,g;
# Temporarily change [0-9]+ type of patterns
$what =~ s/\[0\-9\]\+/\xff/g;
# Temporarily change [\d+-\d+] type of patterns
$what =~ s/\[0\-\d+\]/\xff/g;
$what =~ s/\[(\d+)\]/\xf4$1\xf5/g;
# Temporarily change [0-9] type of patterns
$what =~ s/\[(\d)\-(\d)\]/\xf4$1-$2\xf5/g;
# Handle multiple option patterns
$what =~ s/[\{\<\[]([\w_]+)(?:[,|]+([\w_]+)){1,}[\}\>\]]/($1|$2)/g;
# Handle wildcards
$what =~ s/\<[^\>]+\>/.*/g;
$what =~ s/\{[^\}]+\}/.*/g;
$what =~ s/\[[^\]]+\]/.*/g;
$what =~ s/[XYZ]/.*/g;
# Recover [0-9] type of patterns
$what =~ s/\xf4/[/g;
$what =~ s/\xf5/]/g;
# Remove duplicated spaces
$what =~ s/\s+/ /g;
# Special case: this ABI has a parenthesis on it
$what =~ s/sqrt\(x^2\+y^2\+z^2\)/sqrt\(x^2\+y^2\+z^2\)/;
# Special case: drop comparition as in:
# What: foo = <something>
# (this happens on a few IIO definitions)
$what =~ s,\s*\=.*$,,;
my $leave = $what;
$leave =~ s,.*/,,;
if (defined($leaf{$leave})) {
$leaf{$leave} .= " " . $what;
} else {
$leaf{$leave} = $what;
}
}
}
next if ($leave =~ m/^\.\*/ || $leave eq "");
find({wanted =>\&parse_existing_sysfs, preprocess =>\&skip_debugfs, no_chdir => 1}, $sysfs_prefix);
# Escape all other symbols
$what =~ s/$escape_symbols/\\$1/g;
$what =~ s/\\\\/\\/g;
$what =~ s/\\([\[\]\(\)\|])/$1/g;
$what =~ s/(\d+)\\(-\d+)/$1$2/g;
$leave =~ s/[\(\)]//g;
foreach my $l (split /\|/, $leave) {
if (defined($leaf{$l})) {
next if ($leaf{$l} =~ m/$what/);
$leaf{$l} .= " " . $what;
} else {
$leaf{$l} = $what;
}
}
}
}
check_undefined_symbols;
}
# Ensure that the prefix will always end with a slash
@ -646,7 +763,8 @@ abi_book.pl - parse the Linux ABI files and produce a ReST book.
=head1 SYNOPSIS
B<abi_book.pl> [--debug] [--enable-lineno] [--man] [--help]
[--(no-)rst-source] [--dir=<dir>] <COMAND> [<ARGUMENT>]
[--(no-)rst-source] [--dir=<dir>] [--show-hints]
<COMAND> [<ARGUMENT>]
Where <COMMAND> can be:
@ -688,6 +806,11 @@ Enable output of #define LINENO lines.
Put the script in verbose mode, useful for debugging. Can be called multiple
times, to increase verbosity.
=item B<--show-hints>
Show hints about possible definitions for the missing ABI symbols.
Used only when B<undefined>.
=item B<--help>
Prints a brief help message and exits.