File: //proc/thread-self/root/usr/share/perl5/Dpkg/Changelog.pm
# Copyright © 2005, 2007 Frank Lichtenheld <frank@lichtenheld.de>
# Copyright © 2009       Raphaël Hertzog <hertzog@debian.org>
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program.  If not, see <https://www.gnu.org/licenses/>.
=encoding utf8
=head1 NAME
Dpkg::Changelog - base class to implement a changelog parser
=head1 DESCRIPTION
Dpkg::Changelog is a class representing a changelog file
as an array of changelog entries (L<Dpkg::Changelog::Entry>).
By deriving this class and implementing its parse() method, you
add the ability to fill this object with changelog entries.
=cut
package Dpkg::Changelog 2.00;
use strict;
use warnings;
use Carp;
use Dpkg::Gettext;
use Dpkg::ErrorHandling qw(:DEFAULT report REPORT_WARN);
use Dpkg::Control;
use Dpkg::Control::Changelog;
use Dpkg::Control::Fields;
use Dpkg::Index;
use Dpkg::Version;
use Dpkg::Vendor qw(run_vendor_hook);
use parent qw(Dpkg::Interface::Storable);
use overload
    '@{}' => sub { return $_[0]->{data} };
=head1 METHODS
=over 4
=item $c = Dpkg::Changelog->new(%options)
Creates a new changelog object.
=cut
sub new {
    my ($this, %opts) = @_;
    my $class = ref($this) || $this;
    my $self = {
	verbose => 1,
	parse_errors => []
    };
    bless $self, $class;
    $self->set_options(%opts);
    return $self;
}
=item $c->set_options(%opts)
Change the value of some options. "verbose" (defaults to 1) defines
whether parse errors are displayed as warnings by default. "reportfile"
is a string to use instead of the name of the file parsed, in particular
in error messages. "range" defines the range of entries that we want to
parse, the parser will stop as soon as it has parsed enough data to
satisfy $c->get_range($opts{range}).
=cut
sub set_options {
    my ($self, %opts) = @_;
    $self->{$_} = $opts{$_} foreach keys %opts;
}
=item $count = $c->parse($fh, $description)
Read the filehandle and parse a changelog in it. The data in the object is
reset before parsing new data.
Returns the number of changelog entries that have been parsed with success.
This method needs to be implemented by one of the specialized changelog
format subclasses.
=item $count = $c->load($filename)
Parse $filename contents for a changelog.
Returns the number of changelog entries that have been parsed with success.
=item $c->reset_parse_errors()
Can be used to delete all information about errors occurred during
previous parse() runs.
=cut
sub reset_parse_errors {
    my $self = shift;
    $self->{parse_errors} = [];
}
=item $c->parse_error($file, $line_nr, $error, [$line])
Record a new parse error in $file at line $line_nr. The error message is
specified with $error and a copy of the line can be recorded in $line.
=cut
sub parse_error {
    my ($self, $file, $line_nr, $error, $line) = @_;
    push @{$self->{parse_errors}}, [ $file, $line_nr, $error, $line ];
    if ($self->{verbose}) {
	if ($line) {
	    warning("%20s(l$line_nr): $error\nLINE: $line", $file);
	} else {
	    warning("%20s(l$line_nr): $error", $file);
	}
    }
}
=item $c->get_parse_errors()
Returns all error messages from the last parse() run.
If called in scalar context returns a human readable
string representation. If called in list context returns
an array of arrays. Each of these arrays contains
=over 4
=item 1.
a string describing the origin of the data (a filename usually). If the
reportfile configuration option was given, its value will be used instead.
=item 2.
the line number where the error occurred
=item 3.
an error description
=item 4.
the original line
=back
=cut
sub get_parse_errors {
    my $self = shift;
    if (wantarray) {
	return @{$self->{parse_errors}};
    } else {
	my $res = '';
	foreach my $e (@{$self->{parse_errors}}) {
	    if ($e->[3]) {
		$res .= report(REPORT_WARN, g_("%s(l%s): %s\nLINE: %s"), @$e);
	    } else {
		$res .= report(REPORT_WARN, g_('%s(l%s): %s'), @$e);
	    }
	}
	return $res;
    }
}
=item $c->set_unparsed_tail($tail)
Add a string representing unparsed lines after the changelog entries.
Use undef as $tail to remove the unparsed lines currently set.
=item $c->get_unparsed_tail()
Return a string representing the unparsed lines after the changelog
entries. Returns undef if there's no such thing.
=cut
sub set_unparsed_tail {
    my ($self, $tail) = @_;
    $self->{unparsed_tail} = $tail;
}
sub get_unparsed_tail {
    my $self = shift;
    return $self->{unparsed_tail};
}
=item @{$c}
Returns all the L<Dpkg::Changelog::Entry> objects contained in this changelog
in the order in which they have been parsed.
=item $c->get_range($range)
Returns an array (if called in list context) or a reference to an array of
L<Dpkg::Changelog::Entry> objects which each represent one entry of the
changelog. $range is a hash reference describing the range of entries
to return. See section L</RANGE SELECTION>.
=cut
sub _sanitize_range {
    my ($self, $r) = @_;
    my $data = $self->{data};
    if (defined($r->{offset}) and not defined($r->{count})) {
	warning(g_("'offset' without 'count' has no effect")) if $self->{verbose};
	delete $r->{offset};
    }
    ## no critic (ControlStructures::ProhibitUntilBlocks)
    if ((defined($r->{count}) || defined($r->{offset})) &&
        (defined($r->{from}) || defined($r->{since}) ||
	 defined($r->{to}) || defined($r->{until})))
    {
	warning(g_("you can't combine 'count' or 'offset' with any other " .
		   'range option')) if $self->{verbose};
	delete $r->{from};
	delete $r->{since};
	delete $r->{to};
	delete $r->{until};
    }
    if (defined($r->{from}) && defined($r->{since})) {
	warning(g_("you can only specify one of 'from' and 'since', using " .
		   "'since'")) if $self->{verbose};
	delete $r->{from};
    }
    if (defined($r->{to}) && defined($r->{until})) {
	warning(g_("you can only specify one of 'to' and 'until', using " .
		   "'until'")) if $self->{verbose};
	delete $r->{to};
    }
    # Handle non-existing versions
    my (%versions, @versions);
    foreach my $entry (@{$data}) {
        my $version = $entry->get_version();
        next unless defined $version;
        $versions{$version->as_string()} = 1;
        push @versions, $version->as_string();
    }
    if ((defined($r->{since}) and not exists $versions{$r->{since}})) {
        warning(g_("'%s' option specifies non-existing version '%s'"), 'since', $r->{since});
        warning(g_('use newest entry that is earlier than the one specified'));
        foreach my $v (@versions) {
            if (version_compare_relation($v, REL_LT, $r->{since})) {
                $r->{since} = $v;
                last;
            }
        }
        if (not exists $versions{$r->{since}}) {
            # No version was earlier, include all
            warning(g_('none found, starting from the oldest entry'));
            delete $r->{since};
            $r->{from} = $versions[-1];
        }
    }
    if ((defined($r->{from}) and not exists $versions{$r->{from}})) {
        warning(g_("'%s' option specifies non-existing version '%s'"), 'from', $r->{from});
        warning(g_('use oldest entry that is later than the one specified'));
        my $oldest;
        foreach my $v (@versions) {
            if (version_compare_relation($v, REL_GT, $r->{from})) {
                $oldest = $v;
            }
        }
        if (defined($oldest)) {
            $r->{from} = $oldest;
        } else {
            warning(g_("no such entry found, ignoring '%s' parameter '%s'"), 'from', $r->{from});
            delete $r->{from}; # No version was oldest
        }
    }
    if (defined($r->{until}) and not exists $versions{$r->{until}}) {
        warning(g_("'%s' option specifies non-existing version '%s'"), 'until', $r->{until});
        warning(g_('use oldest entry that is later than the one specified'));
        my $oldest;
        foreach my $v (@versions) {
            if (version_compare_relation($v, REL_GT, $r->{until})) {
                $oldest = $v;
            }
        }
        if (defined($oldest)) {
            $r->{until} = $oldest;
        } else {
            warning(g_("no such entry found, ignoring '%s' parameter '%s'"), 'until', $r->{until});
            delete $r->{until}; # No version was oldest
        }
    }
    if (defined($r->{to}) and not exists $versions{$r->{to}}) {
        warning(g_("'%s' option specifies non-existing version '%s'"), 'to', $r->{to});
        warning(g_('use newest entry that is earlier than the one specified'));
        foreach my $v (@versions) {
            if (version_compare_relation($v, REL_LT, $r->{to})) {
                $r->{to} = $v;
                last;
            }
        }
        if (not exists $versions{$r->{to}}) {
            # No version was earlier
            warning(g_("no such entry found, ignoring '%s' parameter '%s'"), 'to', $r->{to});
            delete $r->{to};
        }
    }
    if (defined($r->{since}) and $data->[0]->get_version() eq $r->{since}) {
	warning(g_("'since' option specifies most recent version '%s', ignoring"), $r->{since});
	delete $r->{since};
    }
    if (defined($r->{until}) and $data->[-1]->get_version() eq $r->{until}) {
	warning(g_("'until' option specifies oldest version '%s', ignoring"), $r->{until});
	delete $r->{until};
    }
    ## use critic
}
sub get_range {
    my ($self, $range) = @_;
    $range //= {};
    my $res = $self->_data_range($range);
    return unless defined $res;
    if (wantarray) {
        return reverse @{$res} if $range->{reverse};
        return @{$res};
    } else {
	return $res;
    }
}
sub _is_full_range {
    my ($self, $range) = @_;
    return 1 if $range->{all};
    # If no range delimiter is specified, we want everything.
    foreach my $delim (qw(since until from to count offset)) {
        return 0 if exists $range->{$delim};
    }
    return 1;
}
sub _data_range {
    my ($self, $range) = @_;
    my $data = $self->{data} or return;
    return [ @$data ] if $self->_is_full_range($range);
    $self->_sanitize_range($range);
    my ($start, $end);
    if (defined($range->{count})) {
	my $offset = $range->{offset} // 0;
	my $count = $range->{count};
	# Convert count/offset in start/end
	if ($offset > 0) {
	    $offset -= ($count < 0);
	} elsif ($offset < 0) {
	    $offset = $#$data + ($count > 0) + $offset;
	} else {
	    $offset = $#$data if $count < 0;
	}
	$start = $end = $offset;
	$start += $count+1 if $count < 0;
	$end += $count-1 if $count > 0;
	# Check limits
	$start = 0 if $start < 0;
	return if $start > $#$data;
	$end = $#$data if $end > $#$data;
	return if $end < 0;
	$end = $start if $end < $start;
	return [ @{$data}[$start .. $end] ];
    }
    ## no critic (ControlStructures::ProhibitUntilBlocks)
    my @result;
    my $include = 1;
    $include = 0 if defined($range->{to}) or defined($range->{until});
    foreach my $entry (@{$data}) {
	my $v = $entry->get_version();
	$include = 1 if defined($range->{to}) and $v eq $range->{to};
	last if defined($range->{since}) and $v eq $range->{since};
	push @result, $entry if $include;
	$include = 1 if defined($range->{until}) and $v eq $range->{until};
	last if defined($range->{from}) and $v eq $range->{from};
    }
    ## use critic
    return \@result if scalar(@result);
    return;
}
=item $c->abort_early()
Returns true if enough data have been parsed to be able to return all
entries selected by the range set at creation (or with set_options).
=cut
sub abort_early {
    my $self = shift;
    my $data = $self->{data} or return;
    my $r = $self->{range} or return;
    my $count = $r->{count} // 0;
    my $offset = $r->{offset} // 0;
    return if $self->_is_full_range($r);
    return if $offset < 0 or $count < 0;
    if (defined($r->{count})) {
	if ($offset > 0) {
	    $offset -= ($count < 0);
	}
	my $start = my $end = $offset;
	$end += $count-1 if $count > 0;
        return $start < @{$data} > $end;
    }
    return unless defined($r->{since}) or defined($r->{from});
    foreach my $entry (@{$data}) {
	my $v = $entry->get_version();
	return 1 if defined($r->{since}) and $v eq $r->{since};
	return 1 if defined($r->{from}) and $v eq $r->{from};
    }
    return;
}
=item $str = $c->output()
=item "$c"
Returns a string representation of the changelog (it's a concatenation of
the string representation of the individual changelog entries).
=item $c->output($fh)
Output the changelog to the given filehandle.
=cut
sub output {
    my ($self, $fh) = @_;
    my $str = '';
    foreach my $entry (@{$self}) {
	my $text = $entry->output();
	print { $fh } $text if defined $fh;
	$str .= $text if defined wantarray;
    }
    my $text = $self->get_unparsed_tail();
    if (defined $text) {
	print { $fh } $text if defined $fh;
	$str .= $text if defined wantarray;
    }
    return $str;
}
=item $c->save($filename)
Save the changelog in the given file.
=cut
our ( @URGENCIES, %URGENCIES );
BEGIN {
    @URGENCIES = qw(
        low
        medium
        high
        critical
        emergency
    );
    my $i = 1;
    %URGENCIES = map { $_ => $i++ } @URGENCIES;
}
sub _format_dpkg {
    my ($self, $range) = @_;
    my @data = $self->get_range($range) or return;
    my $src = shift @data;
    my $c = Dpkg::Control::Changelog->new();
    $c->{Urgency} = $src->get_urgency() || 'unknown';
    $c->{Source} = $src->get_source() || 'unknown';
    $c->{Version} = $src->get_version() // 'unknown';
    $c->{Distribution} = join ' ', $src->get_distributions();
    $c->{Maintainer} = $src->get_maintainer() // '';
    $c->{Date} = $src->get_timestamp() // '';
    $c->{Timestamp} = $src->get_timepiece && $src->get_timepiece->epoch // '';
    $c->{Changes} = $src->get_dpkg_changes();
    # handle optional fields
    my $opts = $src->get_optional_fields();
    my %closes;
    foreach my $f (keys %{$opts}) {
        if ($f eq 'Urgency') {
            # Already handled.
        } elsif ($f eq 'Closes') {
	    $closes{$_} = 1 foreach (split(/\s+/, $opts->{Closes}));
	} else {
            field_transfer_single($opts, $c, $f);
	}
    }
    foreach my $bin (@data) {
        my $oldurg = $c->{Urgency} // '';
        my $oldurgn = $URGENCIES{$c->{Urgency}} // -1;
	my $newurg = $bin->get_urgency() // '';
	my $newurgn = $URGENCIES{$newurg} // -1;
        $c->{Urgency} = ($newurgn > $oldurgn) ? $newurg : $oldurg;
        $c->{Changes} .= "\n" . $bin->get_dpkg_changes();
	# handle optional fields
	$opts = $bin->get_optional_fields();
        foreach my $f (keys %{$opts}) {
            if ($f eq 'Closes') {
		$closes{$_} = 1 foreach (split(/\s+/, $opts->{Closes}));
            } elsif (not exists $c->{$f}) {
                # Don't overwrite an existing field
                field_transfer_single($opts, $c, $f);
	    }
	}
    }
    if (scalar keys %closes) {
        $c->{Closes} = join ' ', sort { $a <=> $b } keys %closes;
    }
    run_vendor_hook('post-process-changelog-entry', $c);
    return $c;
}
sub _format_rfc822 {
    my ($self, $range) = @_;
    my @data = $self->get_range($range) or return;
    my @ctrl;
    foreach my $entry (@data) {
        my $c = Dpkg::Control::Changelog->new();
        $c->{Urgency} = $entry->get_urgency() || 'unknown';
        $c->{Source} = $entry->get_source() || 'unknown';
        $c->{Version} = $entry->get_version() // 'unknown';
        $c->{Distribution} = join ' ', $entry->get_distributions();
        $c->{Maintainer} = $entry->get_maintainer() // '';
        $c->{Date} = $entry->get_timestamp() // '';
        $c->{Timestamp} = $entry->get_timepiece && $entry->get_timepiece->epoch // '';
        $c->{Changes} = $entry->get_dpkg_changes();
	# handle optional fields
	my $opts = $entry->get_optional_fields();
        foreach my $f (keys %{$opts}) {
            field_transfer_single($opts, $c, $f) unless exists $c->{$f};
	}
        run_vendor_hook('post-process-changelog-entry', $c);
        push @ctrl, $c;
    }
    return @ctrl;
}
=item $control = $c->format_range($format, $range)
Formats the changelog into L<Dpkg::Control::Changelog> objects representing
the entries selected by the optional range specifier (see L</RANGE SELECTION>
for details). In scalar context returns a L<Dpkg::Index> object containing
the selected entries, in list context returns an array of
L<Dpkg::Control::Changelog> objects.
With format B<dpkg> the returned L<Dpkg::Control::Changelog> object is
coalesced from the entries in the changelog that are part of the range
requested, with the fields described below, but considering that
"selected entry" means the first entry of the selected range.
With format B<rfc822> each returned L<Dpkg::Control::Changelog> objects
represents one entry in the changelog that is part of the range requested,
with the fields described below, but considering that "selected entry"
means for each entry.
The different formats return undef if no entries are matched. The following
fields are contained in the object(s) returned:
=over 4
=item Source
package name (selected entry)
=item Version
packages' version (selected entry)
=item Distribution
target distribution (selected entry)
=item Urgency
urgency (highest of all entries in range)
=item Maintainer
person that created the (selected) entry
=item Date
date of the (selected) entry
=item Timestamp
date of the (selected) entry as a timestamp in seconds since the epoch
=item Closes
bugs closed by the (selected) entry/entries, sorted by bug number
=item Changes
content of the (selected) entry/entries
=back
=cut
sub format_range {
    my ($self, $format, $range) = @_;
    my @ctrl;
    if ($format eq 'dpkg') {
        @ctrl = $self->_format_dpkg($range);
    } elsif ($format eq 'rfc822') {
        @ctrl = $self->_format_rfc822($range);
    } else {
        croak "unknown changelog output format $format";
    }
    if (wantarray) {
        return @ctrl;
    } else {
        my $index = Dpkg::Index->new(type => CTRL_CHANGELOG);
        foreach my $c (@ctrl) {
            $index->add($c);
        }
        return $index;
    }
}
=back
=head1 RANGE SELECTION
A range selection is described by a hash reference where
the allowed keys and values are described below.
The following options take a version number as value.
=over 4
=item since
Causes changelog information from all versions strictly
later than B<version> to be used.
=item until
Causes changelog information from all versions strictly
earlier than B<version> to be used.
=item from
Similar to C<since> but also includes the information for the
specified B<version> itself.
=item to
Similar to C<until> but also includes the information for the
specified B<version> itself.
=back
The following options don't take version numbers as values:
=over 4
=item all
If set to a true value, all entries of the changelog are returned,
this overrides all other options.
=item count
Expects a signed integer as value. Returns C<value> entries from the
top of the changelog if set to a positive integer, and C<abs(value)>
entries from the tail if set to a negative integer.
=item offset
Expects a signed integer as value. Changes the starting point for
C<count>, either counted from the top (positive integer) or from
the tail (negative integer). C<offset> has no effect if C<count>
wasn't given as well.
=back
Some examples for the above options. Imagine an example changelog with
entries for the versions 1.2, 1.3, 2.0, 2.1, 2.2, 3.0 and 3.1.
  Range                        Included entries
  -----                        ----------------
  since => '2.0'               3.1, 3.0, 2.2
  until => '2.0'               1.3, 1.2
  from  => '2.0'               3.1, 3.0, 2.2, 2.1, 2.0
  to    => '2.0'               2.0, 1.3, 1.2
  count =>  2                  3.1, 3.0
  count => -2                  1.3, 1.2
  count =>  3, offset => 2     2.2, 2.1, 2.0
  count =>  2, offset => -3    2.0, 1.3
  count => -2, offset => 3     3.0, 2.2
  count => -2, offset => -3    2.2, 2.1
Any combination of one option of C<since> and C<from> and one of
C<until> and C<to> returns the intersection of the two results
with only one of the options specified.
=head1 CHANGES
=head2 Version 2.00 (dpkg 1.20.0)
Remove methods: $c->dpkg(), $c->rfc822().
=head2 Version 1.01 (dpkg 1.18.8)
New method: $c->format_range().
Deprecated methods: $c->dpkg(), $c->rfc822().
New field Timestamp in output formats.
=head2 Version 1.00 (dpkg 1.15.6)
Mark the module as public.
=cut
1;