xref: /openbsd-src/gnu/usr.bin/perl/dist/Unicode-Normalize/t/test.t (revision 256a93a44f36679bee503f12e49566c2183f6181)
15759b3d2Safresh1
# Compile-time setup that only applies when $ENV{PERL_CORE} is set: step
# into a 't' directory if one exists, then replace @INC with a single
# relative library path ('::lib' on MacOS, '../lib' everywhere else).
BEGIN {
    if ($ENV{PERL_CORE}) {
        chdir 't' if -d 't';
        my $lib_dir = ($^O eq 'MacOS') ? '::lib' : '../lib';
        @INC = ($lib_dir);
    }
}
85759b3d2Safresh1
95759b3d2Safresh1#########################
105759b3d2Safresh1
115759b3d2Safresh1use strict;
125759b3d2Safresh1use warnings;
# Print the TAP plan at compile time.
BEGIN {
    $| = 1;    # autoflush the currently selected output handle
    print "1..72\n";
}

# File-wide test counter; a reference to it is handed to the helper on
# every call (presumably the helper advances it -- verify in the module).
my $count = 0;

# ok(...) -- forward all arguments to Unicode::Normalize::ok, preceded by a
# reference to the test counter.
# NOTE(review): this sub is compiled before the `use Unicode::Normalize`
# statement below, so any prototype declared on the helper is not yet
# visible here and @_ is passed as a plain list -- confirm before
# reordering these statements.
sub ok {
    return Unicode::Normalize::ok(\$count, @_);
}

use Unicode::Normalize;

# First test: the script got this far.
ok(1);
205759b3d2Safresh1
# _pack_U(LIST) -- thin wrapper that passes its arguments straight through
# to Unicode::Normalize::dot_t_pack_U and returns whatever that returns.
# Callers in this file pass numeric code points.
sub _pack_U {
    return Unicode::Normalize::dot_t_pack_U(@_);
}
# _unpack_U(STRING) -- thin wrapper that passes its arguments straight
# through to Unicode::Normalize::dot_t_unpack_U and returns whatever that
# returns. Callers in this file treat the result as a list of numbers.
sub _unpack_U {
    return Unicode::Normalize::dot_t_unpack_U(@_);
}
235759b3d2Safresh1
245759b3d2Safresh1#########################
255759b3d2Safresh1
# The empty string and a single ASCII letter must come back unchanged from
# each of the four normalization functions.
for my $text ("", "A") {
    ok(NFD($text),  $text);
    ok(NFC($text),  $text);
    ok(NFKD($text), $text);
    ok(NFKC($text), $text);
}

# 9
375759b3d2Safresh1
# Normalizing must not modify the variable that was passed in.
# Each row: [ function, original string, expected normalized string ].
# For every row the normalized result is checked first, then the variable
# that was passed is checked to still hold the original string.
for my $case (
    [ \&NFD,  "\x{FA19}", "\x{795E}" ],
    [ \&NFC,  "\x{FA1B}", "\x{798F}" ],
    [ \&NFKD, "\x{FA1E}", "\x{7FBD}" ],
    [ \&NFKC, "\x{FA26}", "\x{90FD}" ],
) {
    my ($normalize, $original, $expected) = @$case;
    my $source = $original;
    ok($normalize->($source), $expected);
    ok($source, $original);
}

# 17
565759b3d2Safresh1
# hexNFC("XXXX YYYY ...") -- read a whitespace-separated list of hexadecimal
# numbers, pack them with _pack_U, run the result through NFC, unpack it
# with _unpack_U, and return the numbers as upper-case hex (zero-padded to
# at least four digits) joined by single spaces.
sub hexNFC {
    my ($hex_list) = @_;
    my @code_points = map { hex $_ } split ' ', $hex_list;
    my $normalized  = NFC(_pack_U(@code_points));
    return join " ", map { sprintf("%04X", $_) } _unpack_U($normalized);
}
# hexNFD("XXXX YYYY ...") -- read a whitespace-separated list of hexadecimal
# numbers, pack them with _pack_U, run the result through NFD, unpack it
# with _unpack_U, and return the numbers as upper-case hex (zero-padded to
# at least four digits) joined by single spaces.
sub hexNFD {
    my ($hex_list) = @_;
    my @code_points = map { hex $_ } split ' ', $hex_list;
    my $normalized  = NFD(_pack_U(@code_points));
    return join " ", map { sprintf("%04X", $_) } _unpack_U($normalized);
}
655759b3d2Safresh1
# Each row: [ converter, input code points, expected code points ].
# Rows run in the order listed; blank lines only group related cases.
for my $case (
    [ \&hexNFD, "1E14 AC01", "0045 0304 0300 1100 1161 11A8" ],
    [ \&hexNFD, "AC00 AE00", "1100 1161 1100 1173 11AF" ],

    [ \&hexNFC, "0061 0315 0300 05AE 05C4 0062", "00E0 05AE 05C4 0315 0062" ],
    [ \&hexNFC, "00E0 05AE 05C4 0315 0062",      "00E0 05AE 05C4 0315 0062" ],
    [ \&hexNFC, "0061 05AE 0300 05C4 0315 0062", "00E0 05AE 05C4 0315 0062" ],
    [ \&hexNFC, "0045 0304 0300 AC00 11A8", "1E14 AC01" ],
    [ \&hexNFC, "1100 1161 1100 1173 11AF", "AC00 AE00" ],
    [ \&hexNFC, "1100 0300 1161 1173 11AF", "1100 0300 1161 1173 11AF" ],

    [ \&hexNFD, "0061 0315 0300 05AE 05C4 0062", "0061 05AE 0300 05C4 0315 0062" ],
    [ \&hexNFD, "00E0 05AE 05C4 0315 0062",      "0061 05AE 0300 05C4 0315 0062" ],
    [ \&hexNFD, "0061 05AE 0300 05C4 0315 0062", "0061 05AE 0300 05C4 0315 0062" ],
    [ \&hexNFC, "0061 05C4 0315 0300 05AE 0062", "0061 05AE 05C4 0300 0315 0062" ],
    [ \&hexNFC, "0061 05AE 05C4 0300 0315 0062", "0061 05AE 05C4 0300 0315 0062" ],
    [ \&hexNFD, "0061 05C4 0315 0300 05AE 0062", "0061 05AE 05C4 0300 0315 0062" ],
    [ \&hexNFD, "0061 05AE 05C4 0300 0315 0062", "0061 05AE 05C4 0300 0315 0062" ],
    [ \&hexNFC, "0000 0041 0000 0000", "0000 0041 0000 0000" ],
    [ \&hexNFD, "0000 0041 0000 0000", "0000 0041 0000 0000" ],

    [ \&hexNFC, "AC00 11A7", "AC00 11A7" ],
    [ \&hexNFC, "AC00 11A8", "AC01" ],
    [ \&hexNFC, "AC00 11A9", "AC02" ],
    [ \&hexNFC, "AC00 11C2", "AC1B" ],
    [ \&hexNFC, "AC00 11C3", "AC00 11C3" ],
) {
    my ($convert, $input, $expected) = @$case;
    ok($convert->($input), $expected);
}

# 39
935759b3d2Safresh1
# Each row: [ input code points, code points expected from hexNFC ].
for my $case (
    # Test cases from Public Review Issue #29: Normalization Issue
    # cf. http://www.unicode.org/review/pr-29.html
    [ "0B47 0300 0B3E", "0B47 0300 0B3E" ],
    [ "1100 0300 1161", "1100 0300 1161" ],
    [ "0B47 0B3E 0300", "0B4B 0300" ],
    [ "1100 1161 0300", "AC00 0300" ],
    [ "0B47 0300 0B3E 0327", "0B47 0300 0B3E 0327" ],
    [ "1100 0300 1161 0327", "1100 0300 1161 0327" ],

    [ "0300 0041", "0300 0041" ],
    [ "0300 0301 0041", "0300 0301 0041" ],
    [ "0301 0300 0041", "0301 0300 0041" ],
    [ "0000 0300 0000 0301", "0000 0300 0000 0301" ],
    [ "0000 0301 0000 0300", "0000 0301 0000 0300" ],

    [ "0327 0061 0300", "0327 00E0" ],
    [ "0301 0061 0300", "0301 00E0" ],
    [ "0315 0061 0300", "0315 00E0" ],
    [ "0000 0327 0061 0300", "0000 0327 00E0" ],
    [ "0000 0301 0061 0300", "0000 0301 00E0" ],
    [ "0000 0315 0061 0300", "0000 0315 00E0" ],
) {
    my ($input, $expected) = @$case;
    ok(hexNFC($input), $expected);
}

# 56
1175759b3d2Safresh1
# NFC() and NFKC() should be unary: the calls below are deliberately written
# without parentheses, so each one passes only if the function takes just
# the variable as its argument and the `eq` comparison is applied afterwards.
my $c_input    = _pack_U(0x41, 0x0302, 0x0301, 0x62);
my $c_expected = _pack_U(0x1EA4, 0x62);
ok( NFC  $c_input eq $c_expected );
ok( NFKC $c_input eq $c_expected );

# NFD() and NFKD() should be unary as well; same paren-less form on purpose.
my $d_input    = _pack_U(0xE0, 0xAC00);
my $d_expected = _pack_U(0x61, 0x0300, 0x1100, 0x1161);
ok( NFD  $d_input eq $d_expected );
ok( NFKD $d_input eq $d_expected );

# 60
1315759b3d2Safresh1
## Bug #53197: NFKC("\x{2000}") produces...

# Each row: [ input character, string expected from both NFKC and NFKD ].
for my $case (
    [ "\x{2002}", ' ' ],
    [ "\x{2000}", ' ' ],

    [ "\x{210C}", 'H' ],
    [ "\x{210D}", 'H' ],
) {
    my ($input, $expected) = @$case;
    ok(NFKC($input) eq $expected);
    ok(NFKD($input) eq $expected);
}

# U+F907 must come out as U+9F9C from all four functions.
for my $normalize (\&NFC, \&NFD, \&NFKC, \&NFKD) {
    ok($normalize->("\x{F907}") eq "\x{9F9C}");
}

# 72
1505759b3d2Safresh1
151