/* Test of conversion of multibyte character to 32-bit wide character. Copyright (C) 2023-2024 Free Software Foundation, Inc. This program is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program. If not, see . */ /* Written by Bruno Haible , 2023. */ #include #include #include #include #include #include #include #include #include "macros.h" int main (int argc, char *argv[]) { /* The only locales in which mbrtoc32 may map a multibyte character to a sequence of two or more Unicode characters are those with BIG5-HKSCS encoding. See */ if (setlocale (LC_ALL, "zh_HK.BIG5-HKSCS") == NULL) { fprintf (stderr, "Skipping test: found no locale with BIG5-HKSCS encoding.\n"); return 77; } /* The problematic BIG5-HKSCS characters are: input maps to name ----- ------- ---- 0x88 0x62 U+00CA U+0304 LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND MACRON 0x88 0x64 U+00CA U+030C LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND CARON 0x88 0xA3 U+00EA U+0304 LATIN SMALL LETTER E WITH CIRCUMFLEX AND MACRON 0x88 0xA5 U+00EA U+030C LATIN SMALL LETTER E WITH CIRCUMFLEX AND CARON Test one of them. See . */ mbstate_t state; memset (&state, '\0', sizeof (mbstate_t)); char32_t c32 = (char32_t) 0xBADFACE; size_t ret = mbrtoc32 (&c32, "\210\142", 2, &state); /* It is OK if this conversion fails. */ if (ret != (size_t)(-1)) { /* mbrtoc32 being regular, means that STATE is in an initial state. */ ASSERT (mbsinit (&state)); ret = mbrtoc32 (&c32, "", 0, &state); /* mbrtoc32 being regular, means that it returns (size_t)(-2), not (size_t)(-3), here. */ ASSERT (ret == (size_t)(-2)); ret = mbrtoc32 (&c32, "", 1, &state); /* mbrtoc32 being regular, means that it returns the null 32-bit wide character, here, not any remnant from the previous multibyte character. */ ASSERT (ret == 0); ASSERT (c32 == 0); } return 0; }