use utf8;
# %uniblock: lookup table of table-cell openers, keyed by a number written in
# hex.  Each value is an unclosed '<td colspan=".." [rowspan=".."] class="..">'
# tag, optionally with inline style, followed by the (possibly empty) label
# shown in that cell.  Judging by the name and the labels this appears to lay
# out an overview of Unicode blocks -- confirm against the code reading it.
#
# NOTE(review): every entry line starts with '-' or '+', which looks like
# unified-diff markup (an old table removed, a new table added).  Read as
# plain Perl these are unary minus/plus: the '-' entries end up under negated
# keys, and a '-#' comment line followed by a '-' entry yields a positive key
# again.  Confirm whether the patch was meant to be applied before use.
#
# NOTE(review): keys of the '-' entries advance by 1 per colspan unit, keys of
# the '+' entries advance by 8 per colspan unit (presumably code point >> 7
# versus code point >> 4) -- verify which scale the consumer expects.
my %uniblock = (
- 0x000, '<td colspan="1" class="X Po">ascii',
- 0x001, '<td colspan="4" class="X L Latin">latin',
-# 0x005, '<td colspan="5" class="X Sk">spacing modifier',
- 0x005, '<td colspan="2" class="X Mn">comb',
- 0x007, '<td colspan="1" class="X L Greek">grk',
- 0x008, '<td colspan="2" class="X L Cyrillic">cyr',
- 0x00A, '<td colspan="1" class="X L Armenian">arm',
- 0x00B, '<td colspan="6" class="X L Aramaic">aramaic',
- 0x011, '<td colspan="1" class="Xr">',
- 0x012, '<td colspan="15" class="X L Brahmic">brahmic',
- 0x020, '<td colspan="1" class="X L Brahmic">mm',
- 0x021, '<td colspan="1" class="X L Aramaic">geor',
- 0x022, '<td colspan="2" class="X L Hangul">jamo',
- 0x024, '<td colspan="3" class="X L African">ethiopic',
- 0x027, '<td colspan="6" class="X L Syllabic">aboriginal',
- 0x02D, '<td colspan="1" class="X L Alpha">ger',
- 0x02E, '<td colspan="2" class="X L Brahmic">brahm',
- 0x030, '<td colspan="1" class="X L Aramaic">mon',
- 0x031, '<td colspan="1" class="X Xr L Syllabic">can',
- 0x032, '<td colspan="8" class="X L Brahmic">brahmic',
- 0x03A, '<td colspan="4" class="X L Latin">extensions',
- 0x03E, '<td colspan="2" class="X L Greek">greek',
- 0x040, '<td colspan="1" class="X Po">·…',
- 0x041, '<td colspan="3" class="X So">misc',
- 0x044, '<td colspan="2" class="X Sm">maths',
- 0x046, '<td colspan="3" class="X So">technical',
- 0x049, '<td colspan="1" class="X Latin">()',
- 0x04A, '<td colspan="2" class="X So">draw',
- 0x04C, '<td colspan="4" class="X So">symbols',
- 0x050, '<td colspan="2" class="X L Alpha">braille',
- 0x052, '<td colspan="1" class="X So">→',
- 0x053, '<td colspan="3" class="X Sm">math',
- 0x056, '<td colspan="2" class="X So">misc',
- 0x058, '<td colspan="2" class="X L Greek">ancient',
- 0x05A, '<td colspan="2" class="X L Alpha">ext',
- 0x05C, '<td colspan="1" class="X Po">·+',
- 0x05D, '<td colspan="3" class="X L Han">radicals',
- 0x060, '<td colspan="2" class="X L Katakana">japanese',
- 0x062, '<td colspan="4" class="X L Han">cjk+',
- 0x066, '<td colspan="2" class="X Xd L Han">compat',
- 0x068, '<td colspan="8" class="X L Han" style="border-bottom:none">',
- 0x070, '<td colspan="16" rowspan="2" class="X L Han" style="border-top:none">cjk ideographs A', #+2
- 0x09C, '<td colspan="16" rowspan="10" class="X L Han">cjk unified ideographs',
- 0x140, '<td colspan="9" class="X L Syllabic">yi',
- 0x149, '<td colspan="1" class="X Xr L Latin">lisu',
- 0x14A, '<td colspan="2" class="X L Syllabic">vai',
- 0x14C, '<td colspan="1" class="X L Cyrillic">cyr',
- 0x14D, '<td colspan="1" class="X Xr L Syllabic">bam',
- 0x14E, '<td colspan="2" class="X L Latin">lat-D',
- 0x150, '<td colspan="8" class="X L Brahmic">brahmic',
- 0x158, '<td colspan="8" class="X L Hangul">hangeul syllables',
- 0x160, '<td colspan="16" rowspan="5" class="X L Hangul" style="border-top:none">hangeul syllables',
- 0x1B0, '<td colspan="16" class="X Cs">surrogates',
- 0x1C0, '<td colspan="16" rowspan="3" class="X Co">private use',
- 0x1F0, '<td colspan="4" class="X L Han">cjk compat',
- 0xFB0, '<td colspan="5" class="X Xd L">presentation',
- 0xFB5, '<td colspan="11" class="X Xd L Arabic" style="border-bottom:none">',
- 0xFC0, '<td colspan="16" class="X Xd L Arabic" style="border-top:none; border-bottom:none">arabic presentation forms A',
- 0xFD0, '<td colspan="13" class="X Xd L Arabic" style="border-top:none">',
- 0xFDD, '<td colspan="2" class="Xi">?',
- 0xFDF, '<td colspan="1" class="X Xd L Arabic" style="border-top:none">',
- 0xFE0, '<td colspan="1" class="X Cc">var',
- 0xFE1, '<td colspan="1" class="X L Pd">ver',
- 0xFE2, '<td colspan="1" class="X L Mn">½',
- 0xFE3, '<td colspan="2" class="X Xd Pd Han">comp',
- 0xFE5, '<td colspan="2" class="X Xd L Latin">small',
- 0xFE7, '<td colspan="9" class="X Xd L Arabic">arabic presentation B',
- 0xFF0, '<td colspan="15" class="X L Latin">halfwidth & fullwidth forms',
- 0xFFF, '<td colspan="1" class="X Cc">sp',
+ 0x0000, '<td colspan="1" class="X Po">ascii',
+ 0x0008, '<td colspan="4" class="X L Latin">latin',
+# 0x0028, '<td colspan="5" class="X Sk">spacing modifier',
+ 0x0028, '<td colspan="2" class="X Mn">comb',
+ 0x0038, '<td colspan="1" class="X L Greek">grk',
+ 0x0040, '<td colspan="2" class="X L Cyrillic">cyr',
+ 0x0050, '<td colspan="1" class="X L Armenian">arm',
+ 0x0058, '<td colspan="1" class="X L Aramaic">heb',
+ 0x0060, '<td colspan="2" class="X L Arabic">arabic',
+ 0x0070, '<td colspan="3" class="X L Aramaic">aram',
+ 0x0080, '<td colspan="2" class="X L Aramaic">aramaic',
+ 0x0090, '<td colspan="14" class="X L Brahmic">brahmic',
+ 0x0100, '<td colspan="1" class="X L Brahmic">mm',
+ 0x0108, '<td colspan="1" class="X L Aramaic">geor',
+ 0x0110, '<td colspan="2" class="X L Hangul">jamo',
+ 0x0120, '<td colspan="3" class="X L African">ethiopic',
+ 0x0138, '<td colspan="6" class="X L Syllabic">aboriginal',
+ 0x0168, '<td colspan="1" class="X L Alpha">ger',
+ 0x0170, '<td colspan="2" class="X L Brahmic">brahm',
+ 0x0180, '<td colspan="1" class="X L Aramaic">mon',
+ 0x0188, '<td colspan="1" class="X L Syllabic">can',
+ 0x0190, '<td colspan="8" class="X L Brahmic">brahmic',
+ 0x01D0, '<td colspan="4" class="X L Latin">extensions',
+ 0x01F0, '<td colspan="2" class="X L Greek">greek',
+ 0x0200, '<td colspan="1" class="X Po">·…',
+ 0x0208, '<td colspan="3" class="X So">symbols',
+ 0x0220, '<td colspan="2" class="X Sm">maths',
+ 0x0230, '<td colspan="3" class="X So">technical',
+ 0x0248, '<td colspan="1" class="X Latin">()',
+ 0x0250, '<td colspan="2" class="X So">draw',
+ 0x0260, '<td colspan="4" class="X So">symbols',
+ 0x0280, '<td colspan="2" class="X L Alpha">braille',
+ 0x0290, '<td colspan="1" class="X So">arr',
+ 0x0298, '<td colspan="3" class="X Sm">maths',
+ 0x02B0, '<td colspan="2" class="X So">misc',
+ 0x02C0, '<td colspan="2" class="X L Greek">ancient',
+ 0x02D0, '<td colspan="2" class="X L Alpha">ext',
+ 0x02E0, '<td colspan="1" class="X Po">·+',
+ 0x02E8, '<td colspan="3" class="X L Han">radicals',
+ 0x0300, '<td colspan="2" class="X L Katakana">japanese',
+ 0x0310, '<td colspan="4" class="X L Han">cjk+',
+ 0x0330, '<td colspan="2" class="X Xd L Han">compat',
+ 0x0340, '<td colspan="8" class="X L Han" style="border-bottom:none">',
+ 0x0380, '<td colspan="16" rowspan="2" class="X L Han" style="border-top:none">cjk ideographs A', #+2
+ 0x04E0, '<td colspan="16" rowspan="11" class="X L Han">cjk unified ideographs',
+ 0x0A00, '<td colspan="9" class="X L Syllabic">yi',
+ 0x0A48, '<td colspan="1" class="X L Latin">lisu',
+ 0x0A50, '<td colspan="2" class="X L Syllabic">vai',
+ 0x0A60, '<td colspan="1" class="X L Cyrillic">cyr',
+ 0x0A68, '<td colspan="1" class="X L Syllabic">bam',
+ 0x0A70, '<td colspan="2" class="X L Latin">lat-D',
+ 0x0A80, '<td colspan="6" class="X L Brahmic">brahmic',
+ 0x0AB0, '<td colspan="2" class="X L Alpha">ext',
+ 0x0AC0, '<td colspan="8" class="X L Hangul" style="border-bottom:none">',
+ 0x0B00, '<td colspan="16" rowspan="5" class="X L Hangul" style="border-top:none">hangeul syllables',
+ 0x0D80, '<td colspan="16" class="X Cs">surrogates',
+ 0x0E00, '<td colspan="16" rowspan="3" class="X Co" style="border-bottom:none">private use',
+ 0x0F80, '<td colspan="2" class="X Co" style="border-top:none">',
+ 0x0F90, '<td colspan="4" class="X L Han">cjk compat',
+ 0x0FB0, '<td colspan="8" class="X L Arabic">presentation',
+ 0x0FF0, '<td colspan="2" class="X L Latin">width',
+
+ 0x1000, '<td colspan="2" class="X L Syllabic">linear B',
+ 0x1010, '<td colspan="2" class="X No">a num',
+ 0x1020, '<td colspan="8" class="X L Alpha">ltr',
+ 0x1060, '<td colspan="3" class="X L Syllabic">linear A',
+ 0x1078, '<td colspan="1" class="X L Alpha">ltr',
+ 0x1080, '<td colspan="16" class="X L Aramaic">rtl',
+ 0x1100, '<td colspan="16" rowspan="2" class="X L Brahmic">brahmic',
+ 0x1200, '<td colspan="16" rowspan="2" class="X L Syllabic">cuneiform',
+ 0x1300, '<td colspan="16" rowspan="2" class="X L Syllabic">egyptian hieroglyphs',
+ 0x1400, '<td colspan="16" rowspan="4" class="X L Syllabic">other large scripts',
+ 0x1600, '<td colspan="16" rowspan="2" class="X L Alpha">recent',
+ 0x1700, '<td colspan="16" rowspan="8" class="X L Han">east asian',
+ 0x1B40, '<td colspan="2" class="">res',
+ 0x1B50, '<td colspan="14" class="X L Syllabic">proto-elamite',
+ 0x1BC0, '<td colspan="8" class="X L Alpha">shorthands',
+ 0x1BE0, '<td colspan="8" class="" style="border-bottom:none">',
+ 0x1C00, '<td colspan="16" rowspan="2" class="" style="border-top:none">other large scripts',
+ 0x1D00, '<td colspan="8" class="X So">notational systems',
+ 0x1D40, '<td colspan="8" class="X L Latin">mathematical', # Sm
+ 0x1D80, '<td colspan="8" class="X L Alpha">sutton signs',
+ 0x1DC0, '<td colspan="8" class="">notational',
+ 0x1E00, '<td colspan="16" class="X L Alpha">ltr',
+ 0x1E80, '<td colspan="16" class="X L Alpha">rtl',
+ 0x1F00, '<td colspan="2" class="X So">game',
+ 0x1F10, '<td colspan="4" class="X L So">enclosed',
+ 0x1F30, '<td colspan="12" class="X So">pictographic',
+ 0x1F80, '<td colspan="2" class="X So">arrows',
+ 0x1F90, '<td colspan="14" class="">unassigned',
);
sub {