grep option

[git-grep-footer.git] / git-grep-footer
diff --git a/git-grep-footer b/git-grep-footer

index 0c26549197cfddfa4eeb8e511edd4aab1134dcde..c5d94400521c8bf56c06938762734ee68c8a28fd 100755 (executable)
--- a/git-grep-footer
+++ b/git-grep-footer
@@ -13,6 +13,7 @@ GetOptions(\my %opt,
         'simplify|s:s',
         'ignore-case|i!',
         'fuzzy!',
+       'grep|S=s',
         'min|min-count|unique|u:i',
         'max|max-count|show|n:i',
         'version|V'  => sub { Getopt::Long::VersionMessage() },
@@ -23,12 +24,12 @@ GetOptions(\my %opt,
  local $| = 1;
  local $/ = "\0";
  
-my $HEADERMATCH = qr/ [a-z]+ (?: (?:-\w+)+ | \ by ) /ix;
+my $HEADERMATCH = qr/ [a-z]+ (?: (?:-\w+)+ | \ by ) | cc | reference /ix;
  
  my (%headercount, @headercache);
  
  while (readline) {
-       s/(.+)\n//m;
+       s/^([0-9a-f]{4,40})\n//m and
         my $hash = $1;
  
         # strip commit separator
@@ -40,12 +41,12 @@ while (readline) {
         # if invalid, assume it's latin1
                $_ = decode(cp1252 => $_) if $@;
  
-       my $prefix = 0;
         my %attr;
  
         BLOCK:
         for (reverse split /\n\n/) {
                 my @headers;
+               my $prefix = 0;
  
                 LINE:
                 for (split /\n/) {
@@ -75,6 +76,10 @@ while (readline) {
                                 }
                         }
  
+                       if (defined $opt{grep}) {
+                               $_ ~~ qr/$opt{grep}/i or next LINE;
+                       }
+
                         given ($opt{simplify} // 'none') {
                                 when (['email', 'authors']) {
                                         $header[1] =~ s{
@@ -85,7 +90,7 @@ while (readline) {
                                         }{<...>}imsx;
                                 }
                                 when (['var', 'vars', '']) {
-                                       when ($header[0] =~ /[ _-] (?: by | to ) $/imsx) {
+                                       when ($header[0] =~ /[ _-] (?: by | to ) $ | ^cc$/imsx) {
                                                 $header[1] = undef;
                                         }
                                         for ($header[1]) {
@@ -118,12 +123,14 @@ while (readline) {
                 next BLOCK if not @headers;
  
                 if ($opt{debug} and $prefix) {
-                       say "infix junk in commit $hash";
+                       say sprintf ': invalid lines in %s (%s)', $hash // 'block', $prefix;
                 }
  
                 for (@headers) {
                         my $line = $_->[2] // join(': ', @$_);
-                       if (defined $opt{min} or $opt{max}) {
+                       $line =~ s/^/$hash / if defined $hash;
+
+                       if (defined $opt{min} or $opt{max} or $opt{count}) {
                                 my $counter = \$headercount{ $_->[0] }->{ $_->[1] // '' };
                                 my $excess = $$counter++ - ($opt{min} // 0);
                                 next if $excess >= ($opt{max} || 1);
@@ -161,6 +168,7 @@ a common convention to list custom metadata such as
  C<Signed-off-by> and C<Acked-by>.
  
  Sections are identified by at least one leading keyword containing a dash
+(or one of the specially recognised keywords C<Cc> and C<Reference>)
  followed by a colon.
  
  =head1 OPTIONS
@@ -197,6 +205,11 @@ Values will be hidden entirely, so only attribute names remain.
  
  =back
  
+=item -S, --grep=<pattern>
+
+Only include lines matching the specified regular expression.
+Case insensitivity can be disabled by prepending C<(?-i)>.
+
  =item -u, --unique[=<threshold>]
  
  Each match is only shown once,
@@ -208,6 +221,11 @@ The original line is given for each match,
  but simplifications still apply for duplicate determination.
  Additional samples are optionally given up to the given maximum.
  
+=item -c, --count
+
+Prefixes each (unique) line with the number of occurrences.
+Causes output to be buffered until all input has been read (obviously).
+
  =back
  
  =head1 AUTHOR