1898184e3Ssthen 2898184e3SsthenBEGIN { 3898184e3Ssthen if ($ENV{PERL_CORE}) { 4898184e3Ssthen chdir('t') if -d 't'; 5898184e3Ssthen @INC = $^O eq 'MacOS' ? qw(::lib) : qw(../lib); 6898184e3Ssthen } 7898184e3Ssthen} 8898184e3Ssthen 9898184e3Ssthenuse strict; 10898184e3Ssthenuse warnings; 11898184e3SsthenBEGIN { $| = 1; print "1..33\n"; } 12898184e3Ssthenmy $count = 0; 13898184e3Ssthensub ok ($;$) { 14898184e3Ssthen my $p = my $r = shift; 15898184e3Ssthen if (@_) { 16898184e3Ssthen my $x = shift; 17898184e3Ssthen $p = !defined $x ? !defined $r : !defined $r ? 0 : $r eq $x; 18898184e3Ssthen } 19898184e3Ssthen print $p ? "ok" : "not ok", ' ', ++$count, "\n"; 20898184e3Ssthen} 21898184e3Ssthen 22898184e3Ssthenuse Unicode::Collate; 23898184e3Ssthen 24898184e3Ssthenok(1); 25898184e3Ssthen 26*256a93a4Safresh1sub _pack_U { Unicode::Collate::pack_U(@_) } 27*256a93a4Safresh1sub _unpack_U { Unicode::Collate::unpack_U(@_) } 28*256a93a4Safresh1 29898184e3Ssthen######################### 30898184e3Ssthen 31898184e3Ssthenuse Unicode::Collate::CJK::JISX0208; 32898184e3Ssthen 33898184e3Ssthenmy $collator = Unicode::Collate->new( 34898184e3Ssthen table => undef, 35898184e3Ssthen normalization => undef, 36898184e3Ssthen overrideCJK => \&Unicode::Collate::CJK::JISX0208::weightJISX0208 37898184e3Ssthen); 38898184e3Ssthen 39898184e3Ssthensub hex_sort { 40*256a93a4Safresh1 my @source = map _pack_U(hex $_), split ' ', shift; 41898184e3Ssthen my @sorted = $collator->sort(@source); 42*256a93a4Safresh1 return join " ", map sprintf("%04X", _unpack_U($_)), @sorted; 43898184e3Ssthen} 44898184e3Ssthen 45898184e3Ssthen# 1 46898184e3Ssthen 47898184e3Ssthen$collator->change(level => 1); 48898184e3Ssthen 49898184e3Ssthen# first ten kanji 50898184e3Ssthenok($collator->lt("\x{4E9C}", "\x{5516}")); 51898184e3Ssthenok($collator->lt("\x{5516}", "\x{5A03}")); 52898184e3Ssthenok($collator->lt("\x{5A03}", "\x{963F}")); 53898184e3Ssthenok($collator->lt("\x{963F}", "\x{54C0}")); 54898184e3Ssthenok($collator->lt("\x{54C0}", "\x{611B}")); 55898184e3Ssthenok($collator->lt("\x{611B}", "\x{6328}")); 56898184e3Ssthenok($collator->lt("\x{6328}", "\x{59F6}")); 57898184e3Ssthenok($collator->lt("\x{59F6}", "\x{9022}")); 58898184e3Ssthenok($collator->lt("\x{9022}", "\x{8475}")); 59898184e3Ssthen 60898184e3Ssthen# last five kanji and undef 61898184e3Ssthenok($collator->lt("\x{69C7}", "\x{9059}")); 62898184e3Ssthenok($collator->lt("\x{9059}", "\x{7464}")); 63898184e3Ssthenok($collator->lt("\x{7464}", "\x{51DC}")); 64898184e3Ssthenok($collator->lt("\x{51DC}", "\x{7199}")); 65898184e3Ssthenok($collator->lt("\x{7199}", "\x{4E02}")); # 4E02: UIdeo undef in JIS X 0208 66898184e3Ssthenok($collator->lt("\x{4E02}", "\x{3400}")); # 3400: Ext.A undef in JIS X 0208 67898184e3Ssthen 68898184e3Ssthen# Ext.B 69898184e3Ssthenok($collator->lt("\x{20000}", "\x{20001}")); 70898184e3Ssthenok($collator->lt("\x{20001}", "\x{20002}")); 71898184e3Ssthenok($collator->lt("\x{20002}", "\x{20003}")); 72898184e3Ssthenok($collator->lt("\x{20003}", "\x{20004}")); 73898184e3Ssthenok($collator->lt("\x{20004}", "\x{20005}")); 74898184e3Ssthen 75898184e3Ssthen# 21 76898184e3Ssthen 77898184e3Ssthenok(hex_sort('4E00 4E8C 4E09 56DB 4E94 516D 4E03 516B 4E5D 5341'), 78898184e3Ssthen '4E00 4E5D 4E94 4E09 56DB 4E03 5341 4E8C 516B 516D'); 79898184e3Ssthen 80898184e3Ssthen# 22 81898184e3Ssthen 82898184e3Ssthen$collator->change(overrideCJK => undef); 83898184e3Ssthen 84898184e3Ssthenok($collator->lt("\x{4E00}", "\x{4E01}")); 85898184e3Ssthenok($collator->lt("\x{4E01}", "\x{4E02}")); 86898184e3Ssthenok($collator->lt("\x{4E02}", "\x{4E03}")); 87898184e3Ssthenok($collator->lt("\x{4E03}", "\x{4E04}")); 88898184e3Ssthenok($collator->lt("\x{4E04}", "\x{4E05}")); 89898184e3Ssthen 90898184e3Ssthenok($collator->lt("\x{9F9B}", "\x{9F9C}")); 91898184e3Ssthenok($collator->lt("\x{9F9C}", "\x{9F9D}")); 92898184e3Ssthenok($collator->lt("\x{9F9D}", "\x{9F9E}")); 93898184e3Ssthenok($collator->lt("\x{9F9E}", "\x{9F9F}")); 94898184e3Ssthenok($collator->lt("\x{9F9F}", "\x{9FA0}")); 95898184e3Ssthen 96898184e3Ssthen# 32 97898184e3Ssthen 98898184e3Ssthenok(hex_sort('4E00 4E8C 4E09 56DB 4E94 516D 4E03 516B 4E5D 5341'), 99898184e3Ssthen '4E00 4E03 4E09 4E5D 4E8C 4E94 516B 516D 5341 56DB'); 100898184e3Ssthen 101898184e3Ssthen# 33 102