Linux ip-172-26-7-228 5.4.0-1103-aws #111~18.04.1-Ubuntu SMP Tue May 23 20:04:10 UTC 2023 x86_64
Your IP : 13.58.32.115
# -*- perl -*-
# Lintian::Data -- interface to query lists of keywords
# Copyright (C) 2008 Russ Allbery
#
# This program is free software; you can redistribute it and/or modify it
# under the terms of the GNU General Public License as published by the Free
# Software Foundation; either version 2 of the License, or (at your option)
# any later version.
#
# This program is distributed in the hope that it will be useful, but WITHOUT
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
# more details.
#
# You should have received a copy of the GNU General Public License along with
# this program. If not, see <http://www.gnu.org/licenses/>.
package Lintian::Data;
use strict;
use warnings;
use autodie;
use Carp qw(croak confess);
use POSIX qw(ENOENT);
use Lintian::Util qw(strip);
our $LAZY_LOAD = 1;
sub _checked_open {
my ($path) = @_;
my $fd;
eval {open($fd, '<', $path);};
if (my $err = $@) {
die($err) if not ref $err or $err->errno != ENOENT;
return;
}
return $fd;
}
sub new {
my ($class, @args) = @_;
my $data_name = $args[0];
my $self = {};
my $data;
croak 'no data type specified' unless $data_name;
bless $self, $class;
$data = $self->_get_data($data_name);
if ($data) {
# We already loaded this data file - just pull from cache
$self->{'data'} = $data;
} else {
# Pretend we loaded this data file, but leave a "reminder" to
# do it later.
$self->{'promise'} = \@args;
$self->_force_promise if not $LAZY_LOAD;
}
return $self;
}
# _get_data fetches an already loaded dataset by type. It is
# mostly useful for determining whether it makes sense to make
# sense to be "lazy".
#
# _load_data loads a dataset into %data, which is private to this
# module. Use %data as a cache to avoid loading the same dataset more
# than once (which means lintian doesn't support having the list
# change over the life of the process). The returned object knows
# what dataset, stored in %data, it is supposed to act on.
{
my %data;
sub _get_data {
my ($self, $data_name) = @_;
return $data{$data_name};
}
sub _load_data {
my ($self, $data_spec) = @_;
my $data_name = $data_spec->[0];
unless (exists($data{$data_name})) {
my $vendors = $self->_get_vendor_names;
my ($dataset, $keyorder) = ({}, []);
my ($fd, $vno) = $self->_open_data_file($data_name, $vendors, 0);
$self->_parse_file($data_name, $fd, $dataset, $keyorder,
$data_spec, $vendors, $vno);
close($fd);
$data{$data_name} = {dataset => $dataset, keyorder => $keyorder};
}
return $self->{'data'} = $data{$data_name};
}
}
{
my $profile;
# Set vendor profile
sub set_vendor {
my (undef, $vendor) = @_;
$profile = $vendor;
return;
}
# Returns a listref of profile names
sub _get_vendor_names {
my ($self) = @_;
croak 'No vendor given' unless $profile;
my @vendors;
push @vendors, reverse @{ $profile->profile_list };
return \@vendors;
}
# Open the (next) data file
#
# $self->_open_data_file ($data_name, $vendors, $start)
# - $data_name is the data file (e.g. "common/architectures")
# - $vendors is the listref return by _get_vendor_names
# - $start is an index into $vendors (the first $vendor to try)
sub _open_data_file {
my ($self, $data_name, $vendors, $start) = @_;
my ($fd, $file);
my $cur = $start;
OUTER: for (; $cur < scalar @$vendors ; $cur++) {
my $vendorpart = "vendors/$vendors->[$cur]/data/$data_name";
foreach my $datafile ($profile->include_path($vendorpart)) {
$fd =_checked_open($datafile);
next if not $fd;
$file = $datafile;
last OUTER;
}
}
if (not defined $file and $cur == scalar @$vendors) {
foreach my $datafile ($profile->include_path("data/$data_name")) {
$fd =_checked_open($datafile);
next if not $fd;
$file = $datafile;
last;
}
$cur++;
}
if (not defined $file) {
croak "Unknown data file: $data_name" unless $start;
croak "No parent data file for $vendors->[$start]";
}
return ($fd, $cur);
}
}
sub _parse_file {
my ($self, $data_name, $fd, $dataset, $keyorder, $data_spec, $vendors,$vno)
= @_;
my (undef, $separator, $code) = @{$data_spec};
my $filename = $data_name;
$filename = $vendors->[$vno] . '/' . $data_name if $vno < scalar @$vendors;
local $.;
while (my $line = <$fd>) {
strip($line);
next if $line =~ m{ \A \#}xsm or $line eq '';
if ($line =~ s/^\@//) {
my ($op, $value) = split(m{ \s++ }xsm, $line, 2);
if ($op eq 'delete') {
croak "Missing key after \@delete in $filename at line $."
unless defined $value && length $value;
@{$keyorder} = grep { $_ ne $value } @{$keyorder};
delete $dataset->{$value};
} elsif ($op eq 'include-parent') {
my ($pfd, $pvo)
= $self->_open_data_file($data_name, $vendors,$vno +1);
$self->_parse_file($data_name, $pfd, $dataset, $keyorder,
$data_spec, $vendors, $pvo);
close($pfd);
} elsif ($op eq 'if-vendor-is' or $op eq 'if-vendor-is-not') {
my ($desired_name, $remain) = split(m{ \s++ }xsm, $value, 2);
my $actual_name;
croak "Missing vendor name after \@$op"
unless $desired_name;
croak "Missing command after vendor name for \@$op"
unless $remain;
$actual_name = (split('/', $vendors->[0], 2))[0];
if ($op eq 'if-vendor-is') {
next if $actual_name ne $desired_name;
} else {
next if $actual_name eq $desired_name;
}
$line = $remain;
redo;
} else {
croak "Unknown operation \@$op in $filename at line $.";
}
next;
}
my ($key, $val);
if (defined $separator) {
($key, $val) = split(/$separator/, $line, 2);
if ($code) {
my $pval = $dataset->{$key};
$val = $code->($key, $val, $pval);
if (not defined($val)) {
next if defined($pval);
croak "undefined value for $key (data-name: $data_name)";
}
}
} else {
($key, $val) = ($line => 1);
}
push @{$keyorder}, $key unless exists $dataset->{$key};
$dataset->{$key} = $val;
}
return;
}
sub _force_promise {
my ($self) = @_;
my $promise = $self->{promise};
my $data = $self->_load_data($promise);
delete $self->{promise};
return $data;
}
# Query a data object for whether a particular keyword is valid.
sub known {
my ($self, $keyword) = @_;
if(!defined($keyword)) {
return;
}
my $data = $self->{data} || $self->_force_promise;
return (exists $data->{'dataset'}{$keyword}) ? 1 : undef;
}
# Return all known keywords (in no particular order).
sub all {
my ($self) = @_;
my $data = $self->{data} || $self->_force_promise;
return @{$data->{'keyorder'}};
}
# Query a data object for the value attached to a particular keyword.
sub value {
my ($self, $keyword) = @_;
my $data = $self->{data} || $self->_force_promise;
return $data->{'dataset'}{$keyword} // undef;
}
1;
=head1 NAME
Lintian::Data - Lintian interface to query lists of keywords
=head1 SYNOPSIS
my $keyword;
my $list = Lintian::Data->new('type');
if ($list->known($keyword)) {
# do something ...
}
my $hash = Lintian::Data->new('another-type', qr{\s++});
if ($hash->value($keyword) > 1) {
# do something ...
}
if ($list->value($keyword) > 1) {
# do something ...
}
my @keywords = $list->all;
=head1 DESCRIPTION
Lintian::Data provides a way of loading a list of keywords or key/value
pairs from a file in the Lintian root and then querying that list.
The lists are stored in the F<data> directory of the Lintian root and
consist of one keyword or key/value pair per line. Blank lines and
lines beginning with C<#> are ignored. Leading and trailing whitespace
is stripped.
If requested, the lines are split into key/value pairs with a given
separator regular expression. Otherwise, keywords are taken verbatim
as they are listed in the file and may include spaces.
This module allows lists such as menu sections, doc-base sections,
obsolete packages, package fields, and so forth to be stored in simple,
easily editable files.
NB: By default Lintian::Data is lazy and defers loading of the data
file until it is actually needed.
=head2 Interface for the CODE argument
This section describes the interface between for the CODE argument
for the class method new.
The sub will be called once for each key/pair with three arguments,
KEY, VALUE and CURVALUE. The first two are the key/value pair parsed
from the data file and CURVALUE is current value associated with the
key. CURVALUE will be C<undef> the first time the sub is called with
that KEY argument.
The sub can then modify VALUE in some way and return the new value for
that KEY. If CURVALUE is not C<undef>, the sub may return C<undef> to
indicate that the current value should still be used. It is not
permissible for the sub to return C<undef> if CURVALUE is C<undef>.
Where Perl semantics allow it, the sub can modify CURVALUE and the
changes will be reflected in the result. As an example, if CURVALUE
is a hashref, new keys can be inserted etc.
=head1 CLASS METHODS
=over 4
=item new(TYPE [,SEPARATOR[, CODE]])
Creates a new Lintian::Data object for the given TYPE. TYPE is a partial
path relative to the F<data> directory and should correspond to a file in
that directory. The contents of that file will be loaded into memory and
returned as part of the newly created object. On error, new() throws an
exception.
If SEPARATOR is given, it will be used as a regular expression for splitting
the lines into key/value pairs.
If CODE is also given, it is assumed to be a sub that will pre-process
the key/value pairs. See the L</Interface for the CODE argument> above.
A given file will only be loaded once. If new() is called again with the
same TYPE argument, the data previously loaded will be reused, avoiding
multiple file reads.
=item set_vendor(PROFILE)
Specifies vendor profile. It must be set before the first data file
is loaded.
=back
=head1 INSTANCE METHODS
=over 4
=item all()
Returns all keywords listed in the data file as a list in original order.
In a scalar context, returns the number of keywords.
=item known(KEYWORD)
Returns true if KEYWORD was listed in the data file represented by this
Lintian::Data instance and false otherwise.
=item value(KEYWORD)
Returns the value attached to KEYWORD if it was listed in the data
file represented by this Lintian::Data instance and the undefined value
otherwise. If SEPARATOR was not given, the value will '1'.
=back
=head1 DIAGNOSTICS
=over 4
=item no data type specified
new() was called without a TYPE argument.
=item unknown data type %s
The TYPE argument to new() did not correspond to a file in the F<data>
directory of the Lintian root.
=item undefined value for %s (type: %s)
The CODE argument return undef for the KEY and no previous value for
that KEY was available.
=back
=head1 FILES
=over 4
=item LINTIAN_INCLUDE_DIR/data
The files loaded by this module must be located in this directory.
Relative paths containing a C</> are permitted, so files may be organized
in subdirectories in this directory.
Note that lintian supports multiple LINTIAN_INCLUDE_DIRs.
=back
=head1 AUTHOR
Originally written by Russ Allbery <rra@debian.org> for Lintian.
=head1 SEE ALSO
lintian(1), L<https://lintian.debian.org/manual/section-2.6.html>
=cut
1;
# Local Variables:
# indent-tabs-mode: nil
# cperl-indent-level: 4
# End:
# vim: syntax=perl sw=4 sts=4 sr et
|