'count|c!',
'simplify|s:s',
'ignore-case|i!',
+ 'fuzzy!',
'min|min-count|unique|u:i',
'max|max-count|show|n:i',
'version|V' => sub { Getopt::Long::VersionMessage() },
local $| = 1;
local $/ = "\0";
-my $HEADERMATCH = qr/ [a-z]+ (?: (?:-\w+)+ | \ by ) /ix;
+my $HEADERMATCH = qr/ [a-z]+ (?: (?:-\w+)+ | \ by ) | cc | reference /ix;
my (%headercount, @headercache);
while (readline) {
- s/(.+)\n//m;
+ s/^([0-9a-f]{4,40})\n//m and
my $hash = $1;
# strip commit seperator
# if invalid, assume it's latin1
$_ = decode(cp1252 => $_) if $@;
- my $prefix = 0;
my %attr;
BLOCK:
for (reverse split /\n\n/) {
my @headers;
+ my $prefix = 0;
LINE:
for (split /\n/) {
push @header, $_ if defined $opt{max};
+ if ($opt{fuzzy}) {
+ for ($header[0]) {
+ tr/ _/-/;
+
+ state $BY = qr{ (?: -? b[yu] )? \Z }ix;
+ s{^ si (?:ge?n|n?g) (?:e?[dt])? -? (?:of+)? $BY}{Signed-off-by}ix;
+ s{^ ack (?:ed|de)? $BY}{Acked-by}ix;
+ s{^ review (?:e?d)? $BY}{Reviewed-by}ix;
+ s{^ teste[dt] $BY}{Tested-by}ix;
+ }
+ }
+
given ($opt{simplify} // 'none') {
when (['email', 'authors']) {
$header[1] =~ s{
}{<...>}imsx;
}
when (['var', 'vars', '']) {
- when ($header[0] =~ /[ _-] (?: by | to ) $/imsx) {
+ when ($header[0] =~ /[ _-] (?: by | to ) $ | ^cc$/imsx) {
$header[1] = undef;
}
for ($header[1]) {
s{\b (https?)://\S+ }{[$1]}gmsx; # url
s{(?: < | \A ) [^@>\s]+ @ [^>]+ (?: > | \Z )}{<...>}igmsx; # address
s{\b [0-9]+ \b}{[num]}gmsx; # number
- s{\b I? [0-9a-f]{40} \b}{[sha1]}gmsx; # hash
+ s{\b [Ig]? [0-9a-f]{ 40} \b}{[sha1]}gmsx; # hash
+ s{\b [Ig]? [0-9a-f]{6,40} \b}{[hash]}gmsx; # abbrev
}
}
when (['all', 'contents']) {
next BLOCK if not @headers;
if ($opt{debug} and $prefix) {
- say "infix junk in commit $hash";
+ say sprintf ': invalid lines in %s (%s)', $hash // 'block', $prefix;
}
for (@headers) {
my $line = $_->[2] // join(': ', @$_);
+ $line =~ s/^/$hash / if defined $hash;
+
if (defined $opt{min} or $opt{max}) {
my $counter = \$headercount{ $_->[0] }->{ $_->[1] // '' };
my $excess = $$counter++ - ($opt{min} // 0);
C<Signed-off-by> and C<Acked-by>.
Sections are identified by at least one leading keyword containing a dash
+(or exceptionally recognised)
followed by a colon.
=head1 OPTIONS