xref: /openbsd-src/gnu/usr.bin/perl/cpan/Unicode-Collate/t/cjk_ja.t (revision 50b7afb2c2c0993b0894d4e34bf857cb13ed9c80)
1
2BEGIN {
3    unless ("A" eq pack('U', 0x41)) {
4	print "1..0 # Unicode::Collate " .
5	    "cannot stringify a Unicode code point\n";
6	exit 0;
7    }
8    if ($ENV{PERL_CORE}) {
9	chdir('t') if -d 't';
10	@INC = $^O eq 'MacOS' ? qw(::lib) : qw(../lib);
11    }
12}
13
14use strict;
15use warnings;
16BEGIN { $| = 1; print "1..33\n"; }
17my $count = 0;
18sub ok ($;$) {
19    my $p = my $r = shift;
20    if (@_) {
21	my $x = shift;
22	$p = !defined $x ? !defined $r : !defined $r ? 0 : $r eq $x;
23    }
24    print $p ? "ok" : "not ok", ' ', ++$count, "\n";
25}
26
27use Unicode::Collate;
28
29ok(1);
30
31#########################
32
33use Unicode::Collate::CJK::JISX0208;
34
35my $collator = Unicode::Collate->new(
36    table => undef,
37    normalization => undef,
38    overrideCJK => \&Unicode::Collate::CJK::JISX0208::weightJISX0208
39);
40
41sub hex_sort {
42    my @source = map pack('U', hex $_), split ' ', shift;
43    my @sorted = $collator->sort(@source);
44    return join " ", map sprintf("%04X", unpack 'U', $_), @sorted;
45}
46
47# 1
48
49$collator->change(level => 1);
50
51# first ten kanji
52ok($collator->lt("\x{4E9C}", "\x{5516}"));
53ok($collator->lt("\x{5516}", "\x{5A03}"));
54ok($collator->lt("\x{5A03}", "\x{963F}"));
55ok($collator->lt("\x{963F}", "\x{54C0}"));
56ok($collator->lt("\x{54C0}", "\x{611B}"));
57ok($collator->lt("\x{611B}", "\x{6328}"));
58ok($collator->lt("\x{6328}", "\x{59F6}"));
59ok($collator->lt("\x{59F6}", "\x{9022}"));
60ok($collator->lt("\x{9022}", "\x{8475}"));
61
62# last five kanji and undef
63ok($collator->lt("\x{69C7}", "\x{9059}"));
64ok($collator->lt("\x{9059}", "\x{7464}"));
65ok($collator->lt("\x{7464}", "\x{51DC}"));
66ok($collator->lt("\x{51DC}", "\x{7199}"));
67ok($collator->lt("\x{7199}", "\x{4E02}")); # 4E02: UIdeo undef in JIS X 0208
68ok($collator->lt("\x{4E02}", "\x{3400}")); # 3400: Ext.A undef in JIS X 0208
69
70# Ext.B
71ok($collator->lt("\x{20000}", "\x{20001}"));
72ok($collator->lt("\x{20001}", "\x{20002}"));
73ok($collator->lt("\x{20002}", "\x{20003}"));
74ok($collator->lt("\x{20003}", "\x{20004}"));
75ok($collator->lt("\x{20004}", "\x{20005}"));
76
77# 21
78
79ok(hex_sort('4E00 4E8C 4E09 56DB 4E94 516D 4E03 516B 4E5D 5341'),
80            '4E00 4E5D 4E94 4E09 56DB 4E03 5341 4E8C 516B 516D');
81
82# 22
83
84$collator->change(overrideCJK => undef);
85
86ok($collator->lt("\x{4E00}", "\x{4E01}"));
87ok($collator->lt("\x{4E01}", "\x{4E02}"));
88ok($collator->lt("\x{4E02}", "\x{4E03}"));
89ok($collator->lt("\x{4E03}", "\x{4E04}"));
90ok($collator->lt("\x{4E04}", "\x{4E05}"));
91
92ok($collator->lt("\x{9F9B}", "\x{9F9C}"));
93ok($collator->lt("\x{9F9C}", "\x{9F9D}"));
94ok($collator->lt("\x{9F9D}", "\x{9F9E}"));
95ok($collator->lt("\x{9F9E}", "\x{9F9F}"));
96ok($collator->lt("\x{9F9F}", "\x{9FA0}"));
97
98# 32
99
100ok(hex_sort('4E00 4E8C 4E09 56DB 4E94 516D 4E03 516B 4E5D 5341'),
101            '4E00 4E03 4E09 4E5D 4E8C 4E94 516B 516D 5341 56DB');
102
103# 33
104