'simplify|s:s',
'ignore-case|i!',
'fuzzy!',
+ 'grep|S=s',
'min|min-count|unique|u:i',
'max|max-count|show|n:i',
'version|V' => sub { Getopt::Long::VersionMessage() },
local $| = 1;
local $/ = "\0";
-my $HEADERMATCH = qr/ [a-z]+ (?: (?:-\w+)+ | \ by ) /ix;
+my $HEADERMATCH = qr/ [a-z]+ (?: (?:-\w+)+ | \ by ) | cc | reference /ix;
my (%headercount, @headercache);
while (readline) {
- s/(.+)\n//m;
+ s/^([0-9a-f]{4,40})\n//m and
my $hash = $1;
# strip commit seperator
# if invalid, assume it's latin1
$_ = decode(cp1252 => $_) if $@;
- my $prefix = 0;
my %attr;
BLOCK:
for (reverse split /\n\n/) {
my @headers;
+ my $prefix = 0;
LINE:
for (split /\n/) {
}
}
+ if (defined $opt{grep}) {
+ $_ ~~ qr/$opt{grep}/i or next LINE;
+ }
+
given ($opt{simplify} // 'none') {
when (['email', 'authors']) {
$header[1] =~ s{
}{<...>}imsx;
}
when (['var', 'vars', '']) {
- when ($header[0] =~ /[ _-] (?: by | to ) $/imsx) {
+ when ($header[0] =~ /[ _-] (?: by | to ) $ | ^cc$/imsx) {
$header[1] = undef;
}
for ($header[1]) {
next BLOCK if not @headers;
if ($opt{debug} and $prefix) {
- say "infix junk in commit $hash";
+ say sprintf ': invalid lines in %s (%s)', $hash // 'block', $prefix;
}
for (@headers) {
my $line = $_->[2] // join(': ', @$_);
- if (defined $opt{min} or $opt{max}) {
+ $line =~ s/^/$hash / if defined $hash;
+
+ if (defined $opt{min} or $opt{max} or $opt{count}) {
my $counter = \$headercount{ $_->[0] }->{ $_->[1] // '' };
my $excess = $$counter++ - ($opt{min} // 0);
next if $excess >= ($opt{max} || 1);
C<Signed-off-by> and C<Acked-by>.
Sections are identified by at least one leading keyword containing a dash
+(or exceptionally recognised)
followed by a colon.
=head1 OPTIONS
=back
+=item --grep=<pattern>
+
+Only include lines matching the specified regular expression.
+Case insensitivity can be disabled by prepending C<(?-i)>.
+
=item -u, --unique[=<threshold>]
Each match is only shown once,
but simplifications still apply for duplicate determination.
Additional samples are optionally given upto the given maximum.
+=item -c, --count
+
+Prefixes (unique) lines by the number of occurrences.
+Causes output to be buffered until all input has been read (obviously).
+
=back
=head1 AUTHOR