blob: 9157dde55cb4c6fc74a827624b80b49adae47909 [file] [log] [blame]
/* Test of compatibility decomposition of Unicode characters.
Copyright (C) 2009-2020 Free Software Foundation, Inc.
This program is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 3 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program. If not, see <https://www.gnu.org/licenses/>. */
/* Written by Bruno Haible <bruno@clisp.org>, 2009. */
#include <config.h>
#include "uninorm/decompose-internal.h"
#include "uninorm.h"
#include "macros.h"
int
main ()
{
ucs4_t decomposed[UC_DECOMPOSITION_MAX_LENGTH];
int ret;
/* SPACE */
ret = uc_compat_decomposition (0x0020, decomposed);
ASSERT (ret == -1);
/* LATIN CAPITAL LETTER A WITH DIAERESIS */
ret = uc_compat_decomposition (0x00C4, decomposed);
ASSERT (ret == 2);
ASSERT (decomposed[0] == 0x0041);
ASSERT (decomposed[1] == 0x0308);
/* LATIN CAPITAL LETTER A WITH DIAERESIS AND MACRON */
ret = uc_compat_decomposition (0x01DE, decomposed);
ASSERT (ret == 2);
ASSERT (decomposed[0] == 0x00C4);
ASSERT (decomposed[1] == 0x0304);
/* GREEK DIALYTIKA AND PERISPOMENI */
ret = uc_compat_decomposition (0x1FC1, decomposed);
ASSERT (ret == 2);
ASSERT (decomposed[0] == 0x00A8);
ASSERT (decomposed[1] == 0x0342);
/* SCRIPT SMALL L */
ret = uc_compat_decomposition (0x2113, decomposed);
ASSERT (ret == 1);
ASSERT (decomposed[0] == 0x006C);
/* NO-BREAK SPACE */
ret = uc_compat_decomposition (0x00A0, decomposed);
ASSERT (ret == 1);
ASSERT (decomposed[0] == 0x0020);
/* ARABIC LETTER VEH INITIAL FORM */
ret = uc_compat_decomposition (0xFB6C, decomposed);
ASSERT (ret == 1);
ASSERT (decomposed[0] == 0x06A4);
/* ARABIC LETTER VEH MEDIAL FORM */
ret = uc_compat_decomposition (0xFB6D, decomposed);
ASSERT (ret == 1);
ASSERT (decomposed[0] == 0x06A4);
/* ARABIC LETTER VEH FINAL FORM */
ret = uc_compat_decomposition (0xFB6B, decomposed);
ASSERT (ret == 1);
ASSERT (decomposed[0] == 0x06A4);
/* ARABIC LETTER VEH ISOLATED FORM */
ret = uc_compat_decomposition (0xFB6A, decomposed);
ASSERT (ret == 1);
ASSERT (decomposed[0] == 0x06A4);
/* CIRCLED NUMBER FIFTEEN */
ret = uc_compat_decomposition (0x246E, decomposed);
ASSERT (ret == 2);
ASSERT (decomposed[0] == 0x0031);
ASSERT (decomposed[1] == 0x0035);
/* TRADE MARK SIGN */
ret = uc_compat_decomposition (0x2122, decomposed);
ASSERT (ret == 2);
ASSERT (decomposed[0] == 0x0054);
ASSERT (decomposed[1] == 0x004D);
/* LATIN SUBSCRIPT SMALL LETTER I */
ret = uc_compat_decomposition (0x1D62, decomposed);
ASSERT (ret == 1);
ASSERT (decomposed[0] == 0x0069);
/* PRESENTATION FORM FOR VERTICAL LEFT PARENTHESIS */
ret = uc_compat_decomposition (0xFE35, decomposed);
ASSERT (ret == 1);
ASSERT (decomposed[0] == 0x0028);
/* FULLWIDTH LATIN CAPITAL LETTER A */
ret = uc_compat_decomposition (0xFF21, decomposed);
ASSERT (ret == 1);
ASSERT (decomposed[0] == 0x0041);
/* HALFWIDTH IDEOGRAPHIC COMMA */
ret = uc_compat_decomposition (0xFF64, decomposed);
ASSERT (ret == 1);
ASSERT (decomposed[0] == 0x3001);
/* SMALL IDEOGRAPHIC COMMA */
ret = uc_compat_decomposition (0xFE51, decomposed);
ASSERT (ret == 1);
ASSERT (decomposed[0] == 0x3001);
/* SQUARE MHZ */
ret = uc_compat_decomposition (0x3392, decomposed);
ASSERT (ret == 3);
ASSERT (decomposed[0] == 0x004D);
ASSERT (decomposed[1] == 0x0048);
ASSERT (decomposed[2] == 0x007A);
/* VULGAR FRACTION THREE EIGHTHS */
ret = uc_compat_decomposition (0x215C, decomposed);
ASSERT (ret == 3);
ASSERT (decomposed[0] == 0x0033);
ASSERT (decomposed[1] == 0x2044);
ASSERT (decomposed[2] == 0x0038);
/* MICRO SIGN */
ret = uc_compat_decomposition (0x00B5, decomposed);
ASSERT (ret == 1);
ASSERT (decomposed[0] == 0x03BC);
/* ARABIC LIGATURE SALLALLAHOU ALAYHE WASALLAM */
ret = uc_compat_decomposition (0xFDFA, decomposed);
ASSERT (ret == 18);
ASSERT (decomposed[0] == 0x0635);
ASSERT (decomposed[1] == 0x0644);
ASSERT (decomposed[2] == 0x0649);
ASSERT (decomposed[3] == 0x0020);
ASSERT (decomposed[4] == 0x0627);
ASSERT (decomposed[5] == 0x0644);
ASSERT (decomposed[6] == 0x0644);
ASSERT (decomposed[7] == 0x0647);
ASSERT (decomposed[8] == 0x0020);
ASSERT (decomposed[9] == 0x0639);
ASSERT (decomposed[10] == 0x0644);
ASSERT (decomposed[11] == 0x064A);
ASSERT (decomposed[12] == 0x0647);
ASSERT (decomposed[13] == 0x0020);
ASSERT (decomposed[14] == 0x0648);
ASSERT (decomposed[15] == 0x0633);
ASSERT (decomposed[16] == 0x0644);
ASSERT (decomposed[17] == 0x0645);
/* HANGUL SYLLABLE GEUL */
ret = uc_compat_decomposition (0xAE00, decomposed);
/* See the clarification at <https://www.unicode.org/versions/Unicode5.1.0/>,
section "Clarification of Hangul Jamo Handling". */
#if 1
ASSERT (ret == 2);
ASSERT (decomposed[0] == 0xADF8);
ASSERT (decomposed[1] == 0x11AF);
#else
ASSERT (ret == 3);
ASSERT (decomposed[0] == 0x1100);
ASSERT (decomposed[1] == 0x1173);
ASSERT (decomposed[2] == 0x11AF);
#endif
/* HANGUL SYLLABLE GEU */
ret = uc_compat_decomposition (0xADF8, decomposed);
ASSERT (ret == 2);
ASSERT (decomposed[0] == 0x1100);
ASSERT (decomposed[1] == 0x1173);
return 0;
}