X-Git-Url: http://git.shiar.net/gitweb.cgi/perl/list-index.git/blobdiff_plain/a621cd10e5c167968a778cb6a1a4f319d4949a7a..fd5749ab518cdf3c68e94fbad168aa2a7725d592:/lib/List/Index.pm
diff --git a/lib/List/Index.pm b/lib/List/Index.pm
index 513ce4f..339bd7d 100644
--- a/lib/List/Index.pm
+++ b/lib/List/Index.pm
@@ -4,11 +4,14 @@ use 5.010;
use strict;
use warnings;
-our $VERSION = '1.00';
+use Exporter 'import';
+
+our $VERSION = '1.01';
+our @EXPORT_OK = qw(rangematch);
sub new {
my ($class, $values) = @_;
- bless [map { tr/{/./; $_ } sort map { s/[^a-z]/{/g; $_ } @$values], $class;
+ bless [sort map { my $v = $_; $v =~ s/[^a-z]/./g; $v } @$values], $class; # normalise non a-z chars to '.' on a copy: $_ aliases the caller's elements, so s/// on it would rewrite @$values
}
sub ranges {
@@ -20,49 +23,165 @@ sub ranges {
my $pages = $options->{pages } || 1 + int $#$self / $pagesize;
$pagesize = @$self / $pages;
- my $offset = 0;
- my @links;
+ my $offset = $pagesize + .5;
+ my $penalty = 0;
+ my @links = ('');
while ($offset < @$self) {
my $link = substr $self->[$offset], 0, $length;
if ($context) {
- my $trim = 1;
- my $before = $offset > $context ? $self->[$offset - $context] : '';
- for my $match (split //, $before) {
- scalar $link =~ /\G\Q$match/g or last;
- $trim++;
+ if ($offset > $context - 1 + $penalty) {
+ # take a value slightly before the current offset
+ my $before = $self->[$offset - $context - 1 + $penalty];
+ # see how much of it matches the current link
+ my $trim = 1;
+ for my $match (split //, $before) {
+ scalar $link =~ /\G\Q$match/g or last;
+ $trim++;
+ }
+ # truncate link up to where the earlier value starts to differ
+ substr($link, $trim) = '' unless $trim > length $link;
+ }
+
+ $penalty = 0;
+ if ($offset + $context < $#$self) {
+ # take a value after the current offset
+ my $after = $self->[$offset + $context];
+ # see how much of it matches the current link
+ my $trim = 1;
+ for my $match (split //, $after) {
+ scalar $link =~ /\G\Q$match/g or last;
+ $trim++;
+ }
+ # use this link if it's shorter
+ if ($trim < length $link) {
+ $link = substr $after, 0, $trim;
+ for ($offset .. $#$self) {
+ last if $self->[$offset + $penalty] =~ /^\Q$link/;
+ $penalty++;
+ }
+ }
}
- substr($link, $trim) = '' unless $trim > length $link;
}
- push @links, [$link];
+ push @links, $link;
$offset += $pagesize;
}
+ use List::MoreUtils 'uniq';
+ @links = uniq @links;
for my $i (0 .. $#links - 1) {
- my ($link, $lastchar) = $links[$i + 1]->[0] =~ /(.*)(.)/;
- $link .= $lastchar eq '.' ? 'z' : chr( ord($lastchar) - 1 )
- unless $lastchar eq 'a';
- $links[$i]->[1] = $link;
+ my ($link, $lastchar) = $links[$i + 1] =~ /(.*)(.)/;
+ $link .= $lastchar le 'a' ? '.' : chr( ord($lastchar) - 1 );
+ next if $link eq $links[$i] and $i;
+ $links[$i] .= '-'.$link;
}
- $links[-1]->[1] = '';
+ $links[-1] .= '-';
return \@links;
}
+sub rangematch { # build a case-insensitive, start-anchored regex for a "s1-s2" range link (or a plain prefix)
+ my ($link) = @_; # $link: either "lower-upper" or a single prefix without a dash
+ my ($s1, $s2) = $link =~ /([^-]*) - ([^-]*)/x # split at the dash into lower ($s1) and upper ($s2) bound; pattern spaces are ignored under /x
+ or return qr/^\Q$link/i; # no dash present: match the link itself as a literal prefix
+ $s1 =~ s/\.$//; # drop a trailing '.' from the lower bound
+ my @allow; # regex alternatives, joined with '|' at the end
+
+ if (length $s1) { # alternatives derived from the lower bound
+ if (length $s2) {
+ $s1 le $s2 or $s1 =~ /^\Q$s2/ or return undef; # undef when $s1 sorts after $s2 and does not start with $s2
+ }
+
+ my $prefix = ''; # pattern text for the characters of $s1 before position $i
+ my $char;
+ for my $i (0 .. length($s1) - 1) { # at most one alternative per character position of $s1
+ my $lasti = $i == length($s1) - 1; # true at the final character of $s1
+ $char = substr $s1, $i, 1;
+ my $next = $char; # lower end of the character class for this position
+ # do not include prefix character in final range
+ $next = chr( ord($char) + 1 ) unless $lasti; # non-final positions start one character above $char
+
+ my $last = 'z'; # upper end of the character class; narrowed below when $s2 applies
+ next if $next gt $last; # skip: the class would be empty
+ if (length $s2 > $i) { # parsed as length($s2) > $i: $s2 has a character at this position
+ if ($s2 =~ /^\Q$prefix/) { # NOTE(review): $prefix may contain the text '[^a-z]' (see continue block), which \Q matches literally - confirm intended
+ $last = substr $s2, $i, 1; # same-position character of the upper bound
+ next if $char eq $last; # identical characters: nothing to add at this position
+ $last = chr( ord($last) - (length $s2 > 1) ); # step one character down when $s2 is longer than one character
+ next if $next gt $last; # skip: the class would be empty
+ }
+ }
+
+ if ($char eq '.') { # '.' in a bound is turned into [^a-z] in the prefix (see continue block)
+ if ($last eq 'z') { # currently a no-op: the body is commented out
+# push @allow, $prefix if $i and $lasti;
+# next;
+ }
+# if ($last eq 'z') {
+# push @allow, $prefix if $i and $lasti;
+# next;
+# }
+ $next = 'a'; # for '.', the class starts at 'a'
+ }
+
+ push @allow, $prefix."[$next-$last]"; # alternative: prefix followed by one character in $next..$last
+ }
+ continue { # also runs for iterations left via next
+ $prefix .= $char eq '.' ? '[^a-z]' : $char; # extend the prefix; '.' becomes the class [^a-z]
+ }
+ }
+
+ if (length $s2) { # alternatives derived from the upper bound
+ my $prefix = ''; # pattern text for the characters of $s2 before position $i
+ my $char;
+ for my $i (0 .. length($s2) - 1) {
+ $char = substr $s2, $i, 1;
+ my $last = 'z'; # upper end of the excluded class; never changed in this loop
+ if (length $s1 > $i) { # parsed as length($s1) > $i: $s1 has a character at this position
+ my $c1 = substr $s1, $i, 1;
+ if ($s1 =~ /^\Q$prefix/) { # $s1 starts with the (quoted) prefix built so far
+ next if $c1 le $char; # skip positions where the $s1 character is le the $s2 character
+ }
+ }
+
+ if ($char eq '.') {
+ next if $i < length($s2) - 1; # a '.' is only handled at the final position of $s2
+ }
+
+ push @allow, $prefix.'(?!['.($char eq '.' ? 'a' : $char)."-$last])" # alternative: prefix NOT followed by a character in $char..z ('a'..z for '.')
+ if $i or $s1 eq ''; # only past the first position, or when there is no lower bound
+ }
+ continue { # also runs for iterations left via next
+ $prefix .= $char eq '.' ? '[^a-z]' : $char; # extend the prefix; '.' becomes the class [^a-z]
+ }
+
+ push @allow, $prefix # finally allow the complete upper-bound pattern itself, subject to the checks below
+ if $s2 =~ /^\Q$prefix/ and $s1 le $s2 # $prefix is quoted here, so any '[^a-z]' in it is compared literally
+ and not (length $s2 == 1 && length $s1 >= length $s2 && $s1 ne $s2); # except for a one-character $s2 with a different $s1 of at least that length
+ }
+
+ my $match = sprintf @allow <= 1 ? '%s' : '(?:%s)', join('|', @allow); # wrap in (?:...) only when there are several alternatives
+ return qr/^$match/i; # anchored at the start, case-insensitive
+}
+
1;
__END__
=head1 NAME
-List::Index - Paginate alphabetic entries by finding minimal prefixes
+List::Index - Find and apply prefix ranges to paginate keywords
=head1 SYNOPSIS
use List::Index;
my $index = List::Index->new(\@values);
my @pages = $index->ranges({pagesize => 50});
- printf '%1$s ', @$_ for @pages;
+ say "$_" for @pages;
+
+ use List::Index 'rangematch';
+ my $limit = rangematch('b-bmq'); # ge 'b' && le 'bmq'
+ @request = grep { $_ =~ $limit } @values;
=head1 DESCRIPTION