| |
| BEGIN { |
| unless ("A" eq pack('U', 0x41)) { |
| print "1..0 # Unicode::Normalize " . |
| "cannot stringify a Unicode code point\n"; |
| exit 0; |
| } |
| } |
| |
| BEGIN { |
| if ($ENV{PERL_CORE}) { |
| chdir('t') if -d 't'; |
| @INC = $^O eq 'MacOS' ? qw(::lib) : qw(../lib); |
| } |
| } |
| |
| ######################### |
| |
| use strict; |
| use warnings; |
| BEGIN { $| = 1; print "1..64\n"; } |
| my $count = 0; |
| sub ok ($;$) { |
| my $p = my $r = shift; |
| if (@_) { |
| my $x = shift; |
| $p = !defined $x ? !defined $r : !defined $r ? 0 : $r eq $x; |
| } |
| print $p ? "ok" : "not ok", ' ', ++$count, "\n"; |
| } |
| |
| use Unicode::Normalize qw(normalize); |
| |
| ok(1); |
| |
| sub _pack_U { Unicode::Normalize::pack_U(@_) } |
| sub _unpack_U { Unicode::Normalize::unpack_U(@_) } |
| |
| ######################### |
| |
| ok(normalize('D', ""), ""); |
| ok(normalize('C', ""), ""); |
| ok(normalize('KD',""), ""); |
| ok(normalize('KC',""), ""); |
| |
| ok(normalize('D', "A"), "A"); |
| ok(normalize('C', "A"), "A"); |
| ok(normalize('KD',"A"), "A"); |
| ok(normalize('KC',"A"), "A"); |
| |
| ok(normalize('NFD', ""), ""); |
| ok(normalize('NFC', ""), ""); |
| ok(normalize('NFKD',""), ""); |
| ok(normalize('NFKC',""), ""); |
| |
| ok(normalize('NFD', "A"), "A"); |
| ok(normalize('NFC', "A"), "A"); |
| ok(normalize('NFKD',"A"), "A"); |
| ok(normalize('NFKC',"A"), "A"); |
| |
| # 17 |
| |
| # don't modify the source |
| my $sNFD = "\x{FA19}"; |
| ok(normalize('NFD', $sNFD), "\x{795E}"); |
| ok($sNFD, "\x{FA19}"); |
| |
| my $sNFC = "\x{FA1B}"; |
| ok(normalize('NFC', $sNFC), "\x{798F}"); |
| ok($sNFC, "\x{FA1B}"); |
| |
| my $sNFKD = "\x{FA1E}"; |
| ok(normalize('NFKD', $sNFKD), "\x{7FBD}"); |
| ok($sNFKD, "\x{FA1E}"); |
| |
| my $sNFKC = "\x{FA26}"; |
| ok(normalize('NFKC', $sNFKC), "\x{90FD}"); |
| ok($sNFKC, "\x{FA26}"); |
| |
| # 25 |
| |
| sub hexNFC { |
| join " ", map sprintf("%04X", $_), |
| _unpack_U normalize 'C', _pack_U map hex, split ' ', shift; |
| } |
| sub hexNFD { |
| join " ", map sprintf("%04X", $_), |
| _unpack_U normalize 'D', _pack_U map hex, split ' ', shift; |
| } |
| |
| ok(hexNFD("1E14 AC01"), "0045 0304 0300 1100 1161 11A8"); |
| ok(hexNFD("AC00 AE00"), "1100 1161 1100 1173 11AF"); |
| |
| ok(hexNFC("0061 0315 0300 05AE 05C4 0062"), "00E0 05AE 05C4 0315 0062"); |
| ok(hexNFC("00E0 05AE 05C4 0315 0062"), "00E0 05AE 05C4 0315 0062"); |
| ok(hexNFC("0061 05AE 0300 05C4 0315 0062"), "00E0 05AE 05C4 0315 0062"); |
| ok(hexNFC("0045 0304 0300 AC00 11A8"), "1E14 AC01"); |
| ok(hexNFC("1100 1161 1100 1173 11AF"), "AC00 AE00"); |
| ok(hexNFC("1100 0300 1161 1173 11AF"), "1100 0300 1161 1173 11AF"); |
| |
| ok(hexNFD("0061 0315 0300 05AE 05C4 0062"), "0061 05AE 0300 05C4 0315 0062"); |
| ok(hexNFD("00E0 05AE 05C4 0315 0062"), "0061 05AE 0300 05C4 0315 0062"); |
| ok(hexNFD("0061 05AE 0300 05C4 0315 0062"), "0061 05AE 0300 05C4 0315 0062"); |
| ok(hexNFC("0061 05C4 0315 0300 05AE 0062"), "0061 05AE 05C4 0300 0315 0062"); |
| ok(hexNFC("0061 05AE 05C4 0300 0315 0062"), "0061 05AE 05C4 0300 0315 0062"); |
| ok(hexNFD("0061 05C4 0315 0300 05AE 0062"), "0061 05AE 05C4 0300 0315 0062"); |
| ok(hexNFD("0061 05AE 05C4 0300 0315 0062"), "0061 05AE 05C4 0300 0315 0062"); |
| ok(hexNFC("0000 0041 0000 0000"), "0000 0041 0000 0000"); |
| ok(hexNFD("0000 0041 0000 0000"), "0000 0041 0000 0000"); |
| |
| ok(hexNFC("AC00 11A7"), "AC00 11A7"); |
| ok(hexNFC("AC00 11A8"), "AC01"); |
| ok(hexNFC("AC00 11A9"), "AC02"); |
| ok(hexNFC("AC00 11C2"), "AC1B"); |
| ok(hexNFC("AC00 11C3"), "AC00 11C3"); |
| |
| # 47 |
| |
| # Test Cases from Public Review Issue #29: Normalization Issue |
| # cf. http://www.unicode.org/review/pr-29.html |
| ok(hexNFC("0B47 0300 0B3E"), "0B47 0300 0B3E"); |
| ok(hexNFC("1100 0300 1161"), "1100 0300 1161"); |
| ok(hexNFC("0B47 0B3E 0300"), "0B4B 0300"); |
| ok(hexNFC("1100 1161 0300"), "AC00 0300"); |
| ok(hexNFC("0B47 0300 0B3E 0327"), "0B47 0300 0B3E 0327"); |
| ok(hexNFC("1100 0300 1161 0327"), "1100 0300 1161 0327"); |
| |
| ok(hexNFC("0300 0041"), "0300 0041"); |
| ok(hexNFC("0300 0301 0041"), "0300 0301 0041"); |
| ok(hexNFC("0301 0300 0041"), "0301 0300 0041"); |
| ok(hexNFC("0000 0300 0000 0301"), "0000 0300 0000 0301"); |
| ok(hexNFC("0000 0301 0000 0300"), "0000 0301 0000 0300"); |
| |
| ok(hexNFC("0327 0061 0300"), "0327 00E0"); |
| ok(hexNFC("0301 0061 0300"), "0301 00E0"); |
| ok(hexNFC("0315 0061 0300"), "0315 00E0"); |
| ok(hexNFC("0000 0327 0061 0300"), "0000 0327 00E0"); |
| ok(hexNFC("0000 0301 0061 0300"), "0000 0301 00E0"); |
| ok(hexNFC("0000 0315 0061 0300"), "0000 0315 00E0"); |
| |
| # 64 |
| |