xref: /openbsd-src/gnu/usr.bin/perl/cpan/Unicode-Collate/t/cjk_ja.t (revision 256a93a44f36679bee503f12e49566c2183f6181)
1898184e3Ssthen
2898184e3SsthenBEGIN {
3898184e3Ssthen    if ($ENV{PERL_CORE}) {
4898184e3Ssthen	chdir('t') if -d 't';
5898184e3Ssthen	@INC = $^O eq 'MacOS' ? qw(::lib) : qw(../lib);
6898184e3Ssthen    }
7898184e3Ssthen}
8898184e3Ssthen
9898184e3Ssthenuse strict;
10898184e3Ssthenuse warnings;
11898184e3SsthenBEGIN { $| = 1; print "1..33\n"; }
12898184e3Ssthenmy $count = 0;
13898184e3Ssthensub ok ($;$) {
14898184e3Ssthen    my $p = my $r = shift;
15898184e3Ssthen    if (@_) {
16898184e3Ssthen	my $x = shift;
17898184e3Ssthen	$p = !defined $x ? !defined $r : !defined $r ? 0 : $r eq $x;
18898184e3Ssthen    }
19898184e3Ssthen    print $p ? "ok" : "not ok", ' ', ++$count, "\n";
20898184e3Ssthen}
21898184e3Ssthen
22898184e3Ssthenuse Unicode::Collate;
23898184e3Ssthen
24898184e3Ssthenok(1);
25898184e3Ssthen
26*256a93a4Safresh1sub _pack_U   { Unicode::Collate::pack_U(@_) }
27*256a93a4Safresh1sub _unpack_U { Unicode::Collate::unpack_U(@_) }
28*256a93a4Safresh1
29898184e3Ssthen#########################
30898184e3Ssthen
31898184e3Ssthenuse Unicode::Collate::CJK::JISX0208;
32898184e3Ssthen
33898184e3Ssthenmy $collator = Unicode::Collate->new(
34898184e3Ssthen    table => undef,
35898184e3Ssthen    normalization => undef,
36898184e3Ssthen    overrideCJK => \&Unicode::Collate::CJK::JISX0208::weightJISX0208
37898184e3Ssthen);
38898184e3Ssthen
39898184e3Ssthensub hex_sort {
40*256a93a4Safresh1    my @source = map _pack_U(hex $_), split ' ', shift;
41898184e3Ssthen    my @sorted = $collator->sort(@source);
42*256a93a4Safresh1    return join " ", map sprintf("%04X", _unpack_U($_)), @sorted;
43898184e3Ssthen}
44898184e3Ssthen
45898184e3Ssthen# 1
46898184e3Ssthen
47898184e3Ssthen$collator->change(level => 1);
48898184e3Ssthen
49898184e3Ssthen# first ten kanji
50898184e3Ssthenok($collator->lt("\x{4E9C}", "\x{5516}"));
51898184e3Ssthenok($collator->lt("\x{5516}", "\x{5A03}"));
52898184e3Ssthenok($collator->lt("\x{5A03}", "\x{963F}"));
53898184e3Ssthenok($collator->lt("\x{963F}", "\x{54C0}"));
54898184e3Ssthenok($collator->lt("\x{54C0}", "\x{611B}"));
55898184e3Ssthenok($collator->lt("\x{611B}", "\x{6328}"));
56898184e3Ssthenok($collator->lt("\x{6328}", "\x{59F6}"));
57898184e3Ssthenok($collator->lt("\x{59F6}", "\x{9022}"));
58898184e3Ssthenok($collator->lt("\x{9022}", "\x{8475}"));
59898184e3Ssthen
60898184e3Ssthen# last five kanji and undef
61898184e3Ssthenok($collator->lt("\x{69C7}", "\x{9059}"));
62898184e3Ssthenok($collator->lt("\x{9059}", "\x{7464}"));
63898184e3Ssthenok($collator->lt("\x{7464}", "\x{51DC}"));
64898184e3Ssthenok($collator->lt("\x{51DC}", "\x{7199}"));
65898184e3Ssthenok($collator->lt("\x{7199}", "\x{4E02}")); # 4E02: UIdeo undef in JIS X 0208
66898184e3Ssthenok($collator->lt("\x{4E02}", "\x{3400}")); # 3400: Ext.A undef in JIS X 0208
67898184e3Ssthen
68898184e3Ssthen# Ext.B
69898184e3Ssthenok($collator->lt("\x{20000}", "\x{20001}"));
70898184e3Ssthenok($collator->lt("\x{20001}", "\x{20002}"));
71898184e3Ssthenok($collator->lt("\x{20002}", "\x{20003}"));
72898184e3Ssthenok($collator->lt("\x{20003}", "\x{20004}"));
73898184e3Ssthenok($collator->lt("\x{20004}", "\x{20005}"));
74898184e3Ssthen
75898184e3Ssthen# 21
76898184e3Ssthen
77898184e3Ssthenok(hex_sort('4E00 4E8C 4E09 56DB 4E94 516D 4E03 516B 4E5D 5341'),
78898184e3Ssthen            '4E00 4E5D 4E94 4E09 56DB 4E03 5341 4E8C 516B 516D');
79898184e3Ssthen
80898184e3Ssthen# 22
81898184e3Ssthen
82898184e3Ssthen$collator->change(overrideCJK => undef);
83898184e3Ssthen
84898184e3Ssthenok($collator->lt("\x{4E00}", "\x{4E01}"));
85898184e3Ssthenok($collator->lt("\x{4E01}", "\x{4E02}"));
86898184e3Ssthenok($collator->lt("\x{4E02}", "\x{4E03}"));
87898184e3Ssthenok($collator->lt("\x{4E03}", "\x{4E04}"));
88898184e3Ssthenok($collator->lt("\x{4E04}", "\x{4E05}"));
89898184e3Ssthen
90898184e3Ssthenok($collator->lt("\x{9F9B}", "\x{9F9C}"));
91898184e3Ssthenok($collator->lt("\x{9F9C}", "\x{9F9D}"));
92898184e3Ssthenok($collator->lt("\x{9F9D}", "\x{9F9E}"));
93898184e3Ssthenok($collator->lt("\x{9F9E}", "\x{9F9F}"));
94898184e3Ssthenok($collator->lt("\x{9F9F}", "\x{9FA0}"));
95898184e3Ssthen
96898184e3Ssthen# 32
97898184e3Ssthen
98898184e3Ssthenok(hex_sort('4E00 4E8C 4E09 56DB 4E94 516D 4E03 516B 4E5D 5341'),
99898184e3Ssthen            '4E00 4E03 4E09 4E5D 4E8C 4E94 516B 516D 5341 56DB');
100898184e3Ssthen
101898184e3Ssthen# 33
102