eval '(exit $?0)' && eval 'exec perl -wS "$0" "$@"' & eval 'exec perl -wS "$0" $argv:q' if 0; # This file is part of GNU Mailutils. # Copyright (C) 2017 Free Software Foundation, Inc. # # GNU Mailutils is free software; you can redistribute it and/or # modify it under the terms of the GNU General Public License as # published by the Free Software Foundation; either version 3, or (at # your option) any later version. # # GNU Mailutils is distributed in the hope that it will be useful, but # WITHOUT ANY WARRANTY; without even the implied warranty of # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU # General Public License for more details. # # You should have received a copy of the GNU General Public License # along with GNU Mailutils. If not, see . use strict; use POSIX qw(strftime); use Getopt::Long qw(:config gnu_getopt no_ignore_case); use Text::Wrap; use Data::Dumper; use threads; use Thread::Queue; use Safe; use Pod::Usage; use Pod::Man; use Pod::Find qw(pod_where); my @append_files; my $force; my $verbose; my $changelog_file = 'ChangeLog'; my $since_date; my $until_date; my $strip_cherry_pick; my $amend_file; my %amendment; my $append_dot; my $ignore_errors; my $email; my $exit_status = 0; =head1 NAME gencl - generate ChangeLog from git log output =head1 SYNOPSIS B [B<-fiv>] [B<-a> I] [B<-m> I] [B<-F> I] [B<--amend=>I] [B<--append-dot>] [B<--append=>I] [B<--email=>I] [B<--file=>I] [B<--force>] [B<--ignore-errors>] [B<--since=>I] [B<--strip-cherry-pick>] [B<--until=>I] [B<--verbose>] B B<-h> | B<--help> | B<--usage> =head1 DESCRIPTION Retrieves git log messages and reformats them as a valid ChangeLog file. The file begins with an automatically generated entry stating the SHA1 hash of the git HEAD commit. This entry is followed by the log entries recreated from the git log, in reverse chronological order. By default, entire log is converted. This can be changed by using B<--since> and/or B<--until> options. Files specified with the B<--append> options (if any), are appended after the converted entries. The file ends with the B B stanza. If the B file exists, B verifies if the source tree has changed since the file was created. The file is re-created only if there were some changes (whether committed or not). The the B<--force> (B<-f>) option instructs B to recreate the file unconditionally. The file supplied with the B<--amend> option is used to correct spelling (and other) errors in the log entries. It consists of entries delimited with one or more empty lines. Each entry begins with a full SHA1 hash of the commit it applies to. The hash is followed by one or more lines with a valid Perl code (typically, B statements). Comments are introduced with the B<#> sign. For each git log entry, its hash is looked up in that file. If found, the B<$_> variable is set to the commit subject, followed by the commit body and the code is evaluated. =head1 OPTIONS =over 4 =item B<-a>, B<--append=>I Append I to the end of the generated file. Multiple B<--append> are processed in the order of their occurrence on the command line. The content of I is appended verbatim, except that the line beginning with the text B is taken to mark the end of file. =item B<-m>, B<--email=>I Sets email address to use in the topmost automatically generated entry. In the absense of this option, B constructs the email from the current user name and the domain (or host) name. =item B<-F>, B<--file=>I Create I instead of the B. =item B<-f>, B<--force> Force recreating the ChangeLog, even if no new commits were added to the repository since its creation. =item B<-i>, B<--ignore-errors> Ignore non-fatal errors. With this option in effect, B exits with code 0 even if some errors were encountered while running. =item B<-v>, B<--verbose> Increase output verbosity. =item B<--since=>I Convert only the logs since I (B). =item B<--until=>I Convert only the logs until I (B). =item B<--strip-cherry-pick> Remove data inserted by B. This includes the "cherry picked from commit ..." line, and the possible final "Conflicts:" paragraph. =item B<--amend=>I Read amendment instructions from I. =item B<--append-dot> Append a dot to the subject line of each commit message if there is no other punctuation the end. =back =head1 EXIT CODES =over 4 =item B<0> Success. =item B<1> Fatal error. =item B<2> Non-fatal error. The B<--ignore-errors> (B<-i>) option instructs B to exit with code B<0>, instead of B<2>. =back =head1 DIFFERENCES FROM GITLOG-TO-CHANGELOG =over 4 =item 1 B writes output to the disk file, whereas B prints it to the standard output. =item 2 The created B begins with an automatically generated entry and ends with the B stanza. =item 3 The B file is re-created only if the source tree was changed since it was written (whether these changes have been committed or not). =item 4 Arbitrary number of files can be concatenated to the produced file. This is handy for projects that switched to B from other VCS. =item 5 Each entry is reformatted using B. =item 6 The following B options are not implemented: B<--cluster>, B<--ignore-matching>, B<--ignore-line>. =back =cut sub pod_usage_msg { my ($obj) = @_; open my $fd, '>', \my $msg; pod2usage(-verbose => 99, -sections => 'NAME', -output => $fd, -exitval => 'NOEXIT'); my @a = split /\n/, $msg; $msg = $a[1]; $msg =~ s/^\s+//; $msg =~ s/ - /: /; return $msg; } GetOptions( 'h' => sub { pod2usage(-message => pod_usage_msg(), -exitstatus => 0, -input => pod_where({-inc => 1}, $0)) }, 'help' => sub { pod2usage(-exitstatus => 0, -verbose => 2, -input => pod_where({-inc => 1}, $0)); }, 'usage' => sub { pod2usage(-exitstatus => 0, -verbose => 0, -input => pod_where({-inc => 1}, $0)); }, 'append|a=s@' => \@append_files, 'file|F=s' => \$changelog_file, 'force|f' => \$force, 'verbose|v' => \$verbose, 'since=s' => \$since_date, 'until=s' => \$until_date, 'strip-cherry-pick' => \$strip_cherry_pick, 'amend=s' => \$amend_file, 'append-dot' => \$append_dot, 'ignore-errors|i' => \$ignore_errors, 'email|m=s' => \$email ) or exit(1); if (! -d '.git') { exit 0; } unless (defined($email)) { if (exists($ENV{EMAIL})) { $email = $ENV{EMAIL}; } else { my ($user, $domain); if (exists($ENV{USER})) { $user = $ENV{USER}; } elsif (my ($name) = getpwuid(getuid())) { $user = $name; } else { die "can't get user name"; } if (chomp($domain = `domainname`) && $domain ne "(none)") { ; } elsif (exists($ENV{HOSTNAME})) { $domain = $ENV{HOSTNAME}; } elsif ($domain = `hostname`) { chomp $domain; } else { $domain = 'localhost'; } $email = $user . '@' . $domain; } } read_amend_file($amend_file) if $amend_file; $Text::Wrap::columns = 72; # Work over bug #79766 in Text::Wrap $Text::Wrap::huge = 'overflow' if $Text::Wrap::VERSION eq '2012.0818'; create_changelog(); $exit_status = 0 if $ignore_errors; exit $exit_status; sub toplevel_entry { my ($hash, $date) = split / /, `git log --max-count=1 --pretty=format:'%H %ad' --date=short HEAD`; my @modlines; if (open(my $fd, '-|', 'git diff-index --name-status HEAD 2>/dev/null')) { chomp(@modlines = map {chomp; [split /\s+/, $_, 2]} <$fd>); close $fd; } if (@modlines) { $date = strftime '%Y-%m-%d', localtime; } my @header; push @header, "$date Automatically generated <$email>"; push @header, ''; push @header, "\tHEAD $hash."; push @header, ''; my %status = ( A => 'New file', C => 'Copied file', D => 'Removed file', M => 'Changed', R => 'Renamed', T => 'Type change', U => 'Unmerged', X => 'Unknown' ); if (@modlines) { push @header, "\tUncommitted changes:"; push @header, ''; push @header, map { "\t* $_->[1]: " . ($status{$_->[0]} || 'Unknown') . ";" } @modlines; push @header, ''; } return @header; } sub headcmp { my $file = shift; if (open(my $fd, '<', $changelog_file)) { # Skip first line $_ = <$fd>; shift; while (<$fd>) { my $line = shift; last unless defined($line); chomp; return 0 unless $line eq $_; } return 1 unless @_; } return 0; } sub read_amend_file { my ($file) = @_; open(my $fd, '<', $file) or die "can't open $file for reading: $!"; use constant { STATE_INIT => 1, STATE_HASH => 2, }; my $state = STATE_INIT; my $silent; my $hash; my $code; my $locus; while (<$fd>) { chomp; s/^\s+//; next if /^#/; if ($state == STATE_INIT) { if (/^([0-9a-fA-F]{40})$/) { $hash = lc $1; if (exists($amendment{$hash})) { warn "$file:$.: duplicate SHA1 hash"; warn $amendment{$hash}{locus} . ": previously defined here"; $exit_status = 2; } $code = ''; $locus = "$file:$."; $state = STATE_HASH; $silent = 0; } elsif (/^$/) { next; } else { warn "$file:$.: expected SHA1, but found $_" unless $silent; $exit_status = 2; $silent = 1; } } elsif ($state == STATE_HASH) { if (/^$/) { $amendment{$hash}{code} = $code; $amendment{$hash}{locus} = $locus; $state = STATE_INIT; } else { $code .= "$_\n"; } } } if ($state == STATE_HASH) { $amendment{$hash}{code} .= $code; $amendment{$hash}{locus} = $locus; } } sub tokenize_gitlog { my ($q) = @_; my @cmd = qw(git log --log-size --no-merges --pretty=format:%H:%ct:%an:%ae%n%s%n%b); push @cmd, "--since=$since_date" if defined $since_date; push @cmd, "--until=$until_date" if defined $until_date; print STDERR "starting @cmd\n" if $verbose > 1; open(my $fd, '-|', @cmd) or die "failed to run git log: $!"; while (<$fd>) { chomp; next if /^$/; my %ent = (); unless (/^log size (\d+)/) { warn "unexpected input: '$_'"; $exit_status = 2; next; } my $size = $1; my $log; read($fd, $log, $size) == $size or die "unexpected EOF"; my ($head, $text) = split /\n/, $log, 2; ($ent{hash},$ent{date},$ent{author},$ent{email}) = split /:/, $head; if (defined($amendment{$ent{hash}})) { my $code = $amendment{$ent{hash}}{code}; print STDERR "amending $ent{hash}\n" if $verbose > 1; print STDERR "code: $code\n" if $verbose > 1; my $s = new Safe; $_ = $text; if (defined(my $r = $s->reval($code))) { $text = $_; delete $amendment{$ent{hash}}; } else { warn "$.:$ent{hash}: failed to eval \"$code\" on \"$_\": \n$@\n"; warn $amendment{$ent{hash}}{locus} . ": code was defined here"; $exit_status = 2; } } my @body; ($ent{subject}, @body) = split /\n/, $text; if ($append_dot && $ent{subject} !~ /[[:punct:]]$/) { $ent{subject} .= '.'; } foreach my $line (@body) { if ($line =~ /^Co-authored-by:(.*)$/) { my $author = $1; if ($author =~ /\s*(.*?)<.+?>$/) { push @{$ent{coauthor}}, [ $1, $2 ]; } } elsif ($line =~ /^(?:Signed-off-by |Copyright-paperwork-exempt |Tiny-change):\s*$/x) { next; } elsif ($strip_cherry_pick && $line =~ /^\s* (?:Conflicts: |\(cherry picked from commit [\da-f]+\)$) /x) { next; } elsif ($line =~ /^\*/) { push @{$ent{body}}, $line; } elsif ($line =~ /^(?:\s |(?:\(.+?\)\s* |\[.+?\]\s* |<.+?>\s*)+:)/x) { push @{$ent{body}}, $line; } elsif (exists($ent{body})) { ${$ent{body}}[-1] .= "\n" . $line; } else { if (!exists($ent{description}) || ${$ent{description}}[-1] eq '' || $line eq '') { push @{$ent{description}}, $line; } else { ${$ent{description}}[-1] .= "\n" . $line; } } } if (exists($ent{body}) && ${$ent{body}}[-1] ne '') { push @{$ent{body}}, ''; } if (exists($ent{description}) && ${$ent{description}}[-1] ne '') { push @{$ent{description}}, ''; } $q->enqueue(\%ent); } $q->enqueue(undef); close $fd; my @unused; while (my ($hash, $ref) = each %amendment) { my $line = $ref->{locus}; $line =~ s/^.*://; push @unused, [ $line, $ref->{locus}, $hash ]; } if (@unused) { $exit_status = 2; foreach my $ent (sort { $a->[0] <=> $b->[0] } @unused) { warn "$ent->[1]: unused entry: $ent->[2]\n"; } } print STDERR "tokenize_gitlog finished\n" if $verbose > 1; } sub convert_entry { my ($q) = @_; while (my $ent = $q->dequeue()) { print STDERR "Writing $ent->{hash}\n" if $verbose > 1; my $date = strftime('%Y-%m-%d', localtime($ent->{date})); print $date, ' ', $ent->{author}, ' <', $ent->{email}, ">\n"; if (exists($ent->{coauthor})) { foreach my $coauthor (@{$ent->{coauthor}}) { print ' ', $coauthor->[0], ' ', $coauthor->[1], "\n"; } } print "\n"; my $tabs = "\t"; print wrap($tabs, $tabs, $ent->{subject}), "\n\n"; if (exists($ent->{description})) { foreach my $para (@{$ent->{description}}) { print fill($tabs, $tabs, $para), "\n"; } } if (exists($ent->{body})) { foreach my $para (@{$ent->{body}}) { print fill($tabs, $tabs, $para), "\n"; } } } print STDERR "convert_entry finished\n" if $verbose > 1; } sub create_changelog { my @header = toplevel_entry; if (!$force && headcmp($changelog_file, @header)) { print STDERR "$changelog_file is up to date\n" if $verbose > 1; return; } open(my $fd, '>', $changelog_file) or die "can't open $changelog_file for writing: $!"; print " GEN $changelog_file\n" if $verbose; print STDERR "updating $changelog_file\n" if $verbose > 1; $fd = select($fd); # Print header for (@header) { print "$_\n"; } # Print converted entries my $q = Thread::Queue->new(); my $tok_thr = threads->create(\&tokenize_gitlog, $q); my $cvt_thr = threads->create(\&convert_entry, $q); $tok_thr->join(); $cvt_thr->join(); if ($tok_thr->error() || $cvt_thr->error()) { exit 1; } # Print additional files foreach my $file (@append_files) { if (open(my $in, '<', $file)) { while (<$in>) { chomp; last if /^Local Variables:/; next if /^\f$/; print "$_\n"; } close $in; } else { warn "can't open $file: $!"; $exit_status = 2; } } # Print trailer print "\f\nLocal Variables:\n"; print <<'EOT'; mode: change-log version-control: never buffer-read-only: t End: EOT ; $fd = select($fd); close $fd; } # Local Variables: # mode: perl # End: