git.shiar.nl
/
sheet.git
/ blobdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
|
commitdiff
|
tree
raw
|
inline
| side by side
codec: calculate theoretical minimal overhead
[sheet.git]
/
tools
/
mkusage-wikimedia
diff --git a/tools/mkusage-wikimedia b/tools/mkusage-wikimedia
index 7a59ba54bc0e8af83469b53ae37e996a112d7b2b..4470c50394cc1d5ed6dfbc2ec257ac225f330e24 100755 (executable)
--- a/tools/mkusage-wikimedia
+++ b/tools/mkusage-wikimedia
@@ -34,14 +34,21 @@
 my %count = (
 	-site => 'https://analytics.wikimedia.org/',
 );
-my $recent = qr/^2019-/;
-
 (readline =~ y/\t//) == 3 or die "unexpected amount of columns in header\n";
+my @lines = readline;
+
+my $recent; # minimum date to include
+for (reverse @lines) {
+	my ($date) = /(\S+)/;
+	$recent ne $date or next if $recent; # same day
+	$recent = $date; # override older date
+	last if state $i++ >= 2; # repeat twice
+}
-
-while (my $row = readline) {
+
+for my $row (@lines) {
 	$row =~ s/\r?\n\z//;
 	my ($date, $name, $version, $pct) = split /\t/, $row;
-	$date =~ $recent or next;
+	$date ge $recent or next;
 	$name =~ y/ /-/;
 	my $browser = $BROWSERID{$name};
 	if (not $browser) {