use strict;
use warnings;
-use Test::More tests => 6;
+use Test::More tests => 9;
use Test::NoWarnings;
use Data::Dump 'pp';
.-bp bq-dm dn-fi fj-hf hg-i j-k l-m n-os ot-qp qq-sm sn-uj uk-wf wg-x y-
)], 'default ranges');
- is_deeply($index->ranges({pagesize => 300}), [qw(-c d-o p-)], 'large pagesize');
+ is_deeply($index->ranges({pagesize => 300}), [qw(-c d-n o-)], 'large pagesize');
+};
+
+subtest 'context' => sub { # how the context option moves range boundaries (30 entries, pagesize 10)
+ plan tests => 9; # one per is_deeply call below, including the TODO one
+ my $index = List::Index->new([qw(
+ kkeg kl km kmlu knsy koxb kpeo kuaa kuab kuac
+ kuapa kuq kur kux kzb lc lg lgu lgua lguc
+ lguq lgur lgws lgx lka lkq lks lln llq llx
+ )]) or return; # leave the subtest early if the constructor returns false
+ is_deeply(
+ $index->ranges({ pagesize=>10, context=>0, length=>5 }),
+ # without context, ranges should start exactly at the offsets (entries 10 'kuapa' and 20 'lguq')
+ [qw(-kuap. kuapa-lgup lguq-)],
+ 'no context'
+ );
+ is_deeply(
+ $index->ranges({ pagesize=>10, context=>0 }),
+ # with no explicit length, boundaries are limited to 4 chars ('kuapa' becomes 'kuap')
+ [qw(-kuao kuap-lgup lguq-)],
+ 'default length'
+ );
+ is_deeply(
+ $index->ranges({ pagesize=>10, context=>1 }),
+ # lookbehinds do not give anything shorter (kuac<kuap, lguc<lguq)
+ # 'kuap' can advance to 'kuq'
+ [qw(-kup kuq-lgup lguq-)],
+ 'lookahead'
+ );
+TODO: {
+ local $TODO = 'backtrack'; # the enclosed test is reported as TODO (a known failure)
+ is_deeply(
+ $index->ranges({ pagesize=>10, context=>2 }),
+ # allowed to advance to 'kur', but that provides no benefit over 'kuq'
+ [qw(-kup kuq-lgup lguq-)],
+ 'minimal lookahead'
+ );
+}
+ is_deeply(
+ $index->ranges({ pagesize=>10, context=>3 }),
+ # shorten 'kuap' to 'ku' because the lookbehind is 'kp...'
+ # 'lguq' matches 'lg', but may only backtrack to 'lgu'
+ [qw(-kt ku-lgt lgu-)],
+ 'lookbehind'
+ );
+ is_deeply(
+ $index->ranges({ pagesize=>10, context=>4 }),
+ [qw(-kt ku-lf lg-)],
+ 'maximal lookahead'
+ );
+ is_deeply(
+ $index->ranges({ pagesize=>10, context=>5 }),
+ # after forwarding 'kuap' to 'lc',
+ # disallow backtracking of 'lguq' to 'lc' to prevent qw[-k l-],
+ # so only lookahead (to 'lkq') remains
+ [qw(-k l-lj lk-)],
+ 'lookbehind forbidden'
+ );
+ is_deeply(
+ $index->ranges({ pagesize=>10, context=>9 }),
+ # allow a single (10-9) entry (l-lf = lc) to remain
+ [qw(-k l-lf lg-)],
+ 'lookbehind penalty'
+ );
+ is_deeply(
+ $index->ranges({ pagesize=>10, context=>10 }),
+ # allow the last page to go back up to 'lc', replacing the 2nd page
+ [qw(-k l-)],
+ 'full overlap'
+ );
+};
+
+subtest 'distribution' => sub { # uneven first letters: 8 'g', 17 'h' and 5 'i' entries at pagesize 10
+ plan tests => 2; # one per is_deeply call below
+ my $index = List::Index->new([qw(
+ gnihka gniub go gsearnrqns gtdvcxyt gw gwoufolwcvmtueyg gysgphci h habkdgifjfxoh
+ hbbvjf hbqleexnqts hccg hd hdoeqwdmgqwaoya hfbegicieuxz hfm hj hkoysmws hmylu
+ hnvtvpievbdlkrmb hs hvdvcqn hvn hyrybeur iaiaab ib ibavqyar idfniqvxpohbk idh
+ )]) or return; # leave the subtest early if the constructor returns false
+ is_deeply(
+ $index->ranges({ pagesize=>10, context=>8 }),
+ [qw(-g h i-)],
+ 'large context'
+ );
+ is_deeply(
+ $index->ranges({ pagesize=>10, context=>7 }),
+ # after the 2nd page is enlarged by lookbehind to 'h', limit subsequent lookahead
+ # to prevent the page from getting too large (17 entries if forwarded to 'i')
+ [qw(-g h-hm hn-)],
+ 'lookahead penalty'
+ );
+ # NOTE(review): page dump; its words differ from the list above (e.g. gwawkvmueovdjtfj) though the 8/17/5 counts match - confirm origin. page #14 [gn-g] (8): gnihka gniub go gsearnrqns gtdvcxyt gwawkvmueovdjtfj gwoufolwcvmtueyg gysgphci
+ # page #15 [h] (17): h habkdgifjfxoh hbbvjf hbqleexnqts hccgszftbaymfu hdaqzkow hdoeqwdmgqwaoya hfbegicieu hfmlpzzioqjbthz hj hkoysmws hmylu hnvtvpievbdlkrmb hsodfpkatk hvdvcqn hvn hyrybeurqtevjfmi
+ # page #16 [i-ie] (5): i iaab ibiavqyar idfniqvxpohbk idh
+};
+
+subtest 'modulo' => sub { # entry count (10) is not a multiple of the page size (4)
+ plan tests => 2; # one per is_deeply call below, including the TODO one
+ my $index = List::Index->new([qw(
+ a b ccb ccd cce gf gg gh i j
+ )]) or return; # leave the subtest early if the constructor returns false
+ # 10 entries at 4 per page require 3 pages,
+ # so actual target page sizes should be 3,4,3 (not 4,4,2)
+
+ is_deeply(
+ $index->ranges({ pagesize=>4, context=>0 }),
+ [qw(-ccc ccd-gg gh-)],
+ 'uniform page sizes'
+ );
+{ local $TODO = 'early lookbehind causing [c-gg]'; # known failure; the bare block limits the scope of $TODO
+ is_deeply(
+ $index->ranges({ pagesize=>4, context=>1 }),
+ [qw(-b c-h i-)],
+ 'context at new intervals'
+ );
+}
};
subtest 'context' => sub {
qw(-baa. baa.-bbb bbc-daa. daaa-eaa. eaaa-)
], 'no context');
is_deeply($index->ranges({pagesize => 2}), [
- qw(-a b c d-ea. eaa-)
+ qw(-a b c d e-)
], 'default context'); # context should be 1
is_deeply($index->ranges({pagesize => 2, context => 2}), [
qw(-a b-c d e-)
], 'overlap'); # first item equals second due to large context
- is_deeply($index->ranges({pagesize => 2, length => 1}), [
+ is_deeply($index->ranges({pagesize => 2, context => 0, length => 1}), [
qw(-a b-c d e-)
], 'single char');