glib: Update Unicode Character Database to version 12.0.0

Using commands:
   glib/gen-unicode-tables.pl -both 12.0.0 path/to/UCD
   tests/gen-casefold-txt.py 12.0.0 path/to/UCD/CaseFolding.txt \
     > tests/casefold.txt
   tests/gen-casemap-txt.py 12.0.0 path/to/UCD/UnicodeData.txt \
      path/to/UCD/SpecialCasing.txt > tests/casemap.txt
plus some manual additions of the new G_UNICODE_SCRIPT_* symbols to
glib/gunicode.h, glib/guniprop.c and glib/tests/unicode.c.

Using UCD release https://www.unicode.org/Public/zipped/12.0.0/UCD.zip.

Signed-off-by: Philip Withnall <withnall@endlessm.com>

Fixes: #1713
This commit is contained in:
Philip Withnall 2019-04-29 14:16:12 +01:00
parent 1c77c93e81
commit 87014c8e97
9 changed files with 3000 additions and 1597 deletions

View File

@ -803,8 +803,8 @@ static const guchar g_script_easy_table[8192] = {
G_UNICODE_SCRIPT_DEVANAGARI, G_UNICODE_SCRIPT_DEVANAGARI, G_UNICODE_SCRIPT_DEVANAGARI,
G_UNICODE_SCRIPT_DEVANAGARI, G_UNICODE_SCRIPT_DEVANAGARI, G_UNICODE_SCRIPT_DEVANAGARI,
G_UNICODE_SCRIPT_DEVANAGARI, G_UNICODE_SCRIPT_DEVANAGARI, G_UNICODE_SCRIPT_DEVANAGARI,
G_UNICODE_SCRIPT_INHERITED, G_UNICODE_SCRIPT_INHERITED, G_UNICODE_SCRIPT_DEVANAGARI,
G_UNICODE_SCRIPT_DEVANAGARI, G_UNICODE_SCRIPT_DEVANAGARI, G_UNICODE_SCRIPT_DEVANAGARI,
G_UNICODE_SCRIPT_INHERITED, G_UNICODE_SCRIPT_INHERITED, G_UNICODE_SCRIPT_INHERITED,
G_UNICODE_SCRIPT_INHERITED, G_UNICODE_SCRIPT_DEVANAGARI, G_UNICODE_SCRIPT_DEVANAGARI,
G_UNICODE_SCRIPT_DEVANAGARI, G_UNICODE_SCRIPT_DEVANAGARI, G_UNICODE_SCRIPT_DEVANAGARI,
G_UNICODE_SCRIPT_DEVANAGARI, G_UNICODE_SCRIPT_DEVANAGARI, G_UNICODE_SCRIPT_DEVANAGARI,
G_UNICODE_SCRIPT_DEVANAGARI, G_UNICODE_SCRIPT_DEVANAGARI, G_UNICODE_SCRIPT_DEVANAGARI,
@ -1071,7 +1071,7 @@ static const guchar g_script_easy_table[8192] = {
G_UNICODE_SCRIPT_TELUGU, G_UNICODE_SCRIPT_TELUGU, G_UNICODE_SCRIPT_TELUGU,
G_UNICODE_SCRIPT_TELUGU, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_TELUGU,
G_UNICODE_SCRIPT_TELUGU, G_UNICODE_SCRIPT_TELUGU, G_UNICODE_SCRIPT_TELUGU,
G_UNICODE_SCRIPT_TELUGU, G_UNICODE_SCRIPT_TELUGU, G_UNICODE_SCRIPT_TELUGU,
G_UNICODE_SCRIPT_TELUGU, G_UNICODE_SCRIPT_TELUGU, G_UNICODE_SCRIPT_KANNADA,
@ -1247,24 +1247,24 @@ static const guchar g_script_easy_table[8192] = {
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_LAO,
G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO, G_UNICODE_SCRIPT_LAO,
@ -2480,7 +2480,7 @@ static const guchar g_script_easy_table[8192] = {
G_UNICODE_SCRIPT_COMMON, G_UNICODE_SCRIPT_COMMON, G_UNICODE_SCRIPT_COMMON,
G_UNICODE_SCRIPT_COMMON, G_UNICODE_SCRIPT_COMMON, G_UNICODE_SCRIPT_INHERITED,
G_UNICODE_SCRIPT_COMMON, G_UNICODE_SCRIPT_COMMON, G_UNICODE_SCRIPT_COMMON,
G_UNICODE_SCRIPT_INHERITED, G_UNICODE_SCRIPT_INHERITED, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_INHERITED, G_UNICODE_SCRIPT_INHERITED, G_UNICODE_SCRIPT_COMMON,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_LATIN,
G_UNICODE_SCRIPT_LATIN, G_UNICODE_SCRIPT_LATIN, G_UNICODE_SCRIPT_LATIN,
@ -2774,8 +2774,7 @@ static const struct {
{ 0x2800, 256, G_UNICODE_SCRIPT_BRAILLE },
{ 0x2900, 628, G_UNICODE_SCRIPT_COMMON },
{ 0x2b76, 32, G_UNICODE_SCRIPT_COMMON },
{ 0x2b98, 49, G_UNICODE_SCRIPT_COMMON },
{ 0x2bca, 53, G_UNICODE_SCRIPT_COMMON },
{ 0x2b98, 104, G_UNICODE_SCRIPT_COMMON },
{ 0x2c00, 47, G_UNICODE_SCRIPT_GLAGOLITIC },
{ 0x2c30, 47, G_UNICODE_SCRIPT_GLAGOLITIC },
{ 0x2c60, 32, G_UNICODE_SCRIPT_LATIN },
@ -2797,7 +2796,7 @@ static const struct {
{ 0x2dd0, 7, G_UNICODE_SCRIPT_ETHIOPIC },
{ 0x2dd8, 7, G_UNICODE_SCRIPT_ETHIOPIC },
{ 0x2de0, 32, G_UNICODE_SCRIPT_CYRILLIC },
{ 0x2e00, 79, G_UNICODE_SCRIPT_COMMON },
{ 0x2e00, 80, G_UNICODE_SCRIPT_COMMON },
{ 0x2e80, 26, G_UNICODE_SCRIPT_HAN },
{ 0x2e9b, 89, G_UNICODE_SCRIPT_HAN },
{ 0x2f00, 214, G_UNICODE_SCRIPT_HAN },
@ -2846,7 +2845,8 @@ static const struct {
{ 0xa700, 34, G_UNICODE_SCRIPT_COMMON },
{ 0xa722, 102, G_UNICODE_SCRIPT_LATIN },
{ 0xa788, 3, G_UNICODE_SCRIPT_COMMON },
{ 0xa78b, 47, G_UNICODE_SCRIPT_LATIN },
{ 0xa78b, 53, G_UNICODE_SCRIPT_LATIN },
{ 0xa7c2, 5, G_UNICODE_SCRIPT_LATIN },
{ 0xa7f7, 9, G_UNICODE_SCRIPT_LATIN },
{ 0xa800, 44, G_UNICODE_SCRIPT_SYLOTI_NAGRI },
{ 0xa830, 10, G_UNICODE_SCRIPT_COMMON },
@ -2882,6 +2882,7 @@ static const struct {
{ 0xab5b, 1, G_UNICODE_SCRIPT_COMMON },
{ 0xab5c, 9, G_UNICODE_SCRIPT_LATIN },
{ 0xab65, 1, G_UNICODE_SCRIPT_GREEK },
{ 0xab66, 2, G_UNICODE_SCRIPT_LATIN },
{ 0xab70, 80, G_UNICODE_SCRIPT_CHEROKEE },
{ 0xabc0, 46, G_UNICODE_SCRIPT_MEETEI_MAYEK },
{ 0xabf0, 10, G_UNICODE_SCRIPT_MEETEI_MAYEK },
@ -3022,6 +3023,7 @@ static const struct {
{ 0x10e60, 31, G_UNICODE_SCRIPT_ARABIC },
{ 0x10f00, 40, G_UNICODE_SCRIPT_OLD_SOGDIAN },
{ 0x10f30, 42, G_UNICODE_SCRIPT_SOGDIAN },
{ 0x10fe0, 23, G_UNICODE_SCRIPT_ELYMAIC },
{ 0x11000, 78, G_UNICODE_SCRIPT_BRAHMI },
{ 0x11052, 30, G_UNICODE_SCRIPT_BRAHMI },
{ 0x1107f, 1, G_UNICODE_SCRIPT_BRAHMI },
@ -3062,7 +3064,7 @@ static const struct {
{ 0x11370, 5, G_UNICODE_SCRIPT_GRANTHA },
{ 0x11400, 90, G_UNICODE_SCRIPT_NEWA },
{ 0x1145b, 1, G_UNICODE_SCRIPT_NEWA },
{ 0x1145d, 2, G_UNICODE_SCRIPT_NEWA },
{ 0x1145d, 3, G_UNICODE_SCRIPT_NEWA },
{ 0x11480, 72, G_UNICODE_SCRIPT_TIRHUTA },
{ 0x114d0, 10, G_UNICODE_SCRIPT_TIRHUTA },
{ 0x11580, 54, G_UNICODE_SCRIPT_SIDDHAM },
@ -3070,7 +3072,7 @@ static const struct {
{ 0x11600, 69, G_UNICODE_SCRIPT_MODI },
{ 0x11650, 10, G_UNICODE_SCRIPT_MODI },
{ 0x11660, 13, G_UNICODE_SCRIPT_MONGOLIAN },
{ 0x11680, 56, G_UNICODE_SCRIPT_TAKRI },
{ 0x11680, 57, G_UNICODE_SCRIPT_TAKRI },
{ 0x116c0, 10, G_UNICODE_SCRIPT_TAKRI },
{ 0x11700, 27, G_UNICODE_SCRIPT_AHOM },
{ 0x1171d, 15, G_UNICODE_SCRIPT_AHOM },
@ -3078,9 +3080,11 @@ static const struct {
{ 0x11800, 60, G_UNICODE_SCRIPT_DOGRA },
{ 0x118a0, 83, G_UNICODE_SCRIPT_WARANG_CITI },
{ 0x118ff, 1, G_UNICODE_SCRIPT_WARANG_CITI },
{ 0x119a0, 8, G_UNICODE_SCRIPT_NANDINAGARI },
{ 0x119aa, 46, G_UNICODE_SCRIPT_NANDINAGARI },
{ 0x119da, 11, G_UNICODE_SCRIPT_NANDINAGARI },
{ 0x11a00, 72, G_UNICODE_SCRIPT_ZANABAZAR_SQUARE },
{ 0x11a50, 52, G_UNICODE_SCRIPT_SOYOMBO },
{ 0x11a86, 29, G_UNICODE_SCRIPT_SOYOMBO },
{ 0x11a50, 83, G_UNICODE_SCRIPT_SOYOMBO },
{ 0x11ac0, 57, G_UNICODE_SCRIPT_PAU_CIN_HAU },
{ 0x11c00, 9, G_UNICODE_SCRIPT_BHAIKSUKI },
{ 0x11c0a, 45, G_UNICODE_SCRIPT_BHAIKSUKI },
@ -3103,11 +3107,14 @@ static const struct {
{ 0x11d93, 6, G_UNICODE_SCRIPT_GUNJALA_GONDI },
{ 0x11da0, 10, G_UNICODE_SCRIPT_GUNJALA_GONDI },
{ 0x11ee0, 25, G_UNICODE_SCRIPT_MAKASAR },
{ 0x11fc0, 50, G_UNICODE_SCRIPT_TAMIL },
{ 0x11fff, 1, G_UNICODE_SCRIPT_TAMIL },
{ 0x12000, 922, G_UNICODE_SCRIPT_CUNEIFORM },
{ 0x12400, 111, G_UNICODE_SCRIPT_CUNEIFORM },
{ 0x12470, 5, G_UNICODE_SCRIPT_CUNEIFORM },
{ 0x12480, 196, G_UNICODE_SCRIPT_CUNEIFORM },
{ 0x13000, 1071, G_UNICODE_SCRIPT_EGYPTIAN_HIEROGLYPHS },
{ 0x13430, 9, G_UNICODE_SCRIPT_EGYPTIAN_HIEROGLYPHS },
{ 0x14400, 583, G_UNICODE_SCRIPT_ANATOLIAN_HIEROGLYPHS },
{ 0x16800, 569, G_UNICODE_SCRIPT_BAMUM },
{ 0x16a40, 31, G_UNICODE_SCRIPT_MRO },
@ -3121,15 +3128,18 @@ static const struct {
{ 0x16b63, 21, G_UNICODE_SCRIPT_PAHAWH_HMONG },
{ 0x16b7d, 19, G_UNICODE_SCRIPT_PAHAWH_HMONG },
{ 0x16e40, 91, G_UNICODE_SCRIPT_MEDEFAIDRIN },
{ 0x16f00, 69, G_UNICODE_SCRIPT_MIAO },
{ 0x16f50, 47, G_UNICODE_SCRIPT_MIAO },
{ 0x16f00, 75, G_UNICODE_SCRIPT_MIAO },
{ 0x16f4f, 57, G_UNICODE_SCRIPT_MIAO },
{ 0x16f8f, 17, G_UNICODE_SCRIPT_MIAO },
{ 0x16fe0, 1, G_UNICODE_SCRIPT_TANGUT },
{ 0x16fe1, 1, G_UNICODE_SCRIPT_NUSHU },
{ 0x17000, 6130, G_UNICODE_SCRIPT_TANGUT },
{ 0x16fe2, 2, G_UNICODE_SCRIPT_COMMON },
{ 0x17000, 6136, G_UNICODE_SCRIPT_TANGUT },
{ 0x18800, 755, G_UNICODE_SCRIPT_TANGUT },
{ 0x1b000, 1, G_UNICODE_SCRIPT_KATAKANA },
{ 0x1b001, 286, G_UNICODE_SCRIPT_HIRAGANA },
{ 0x1b150, 3, G_UNICODE_SCRIPT_HIRAGANA },
{ 0x1b164, 4, G_UNICODE_SCRIPT_KATAKANA },
{ 0x1b170, 396, G_UNICODE_SCRIPT_NUSHU },
{ 0x1bc00, 107, G_UNICODE_SCRIPT_DUPLOYAN },
{ 0x1bc70, 13, G_UNICODE_SCRIPT_DUPLOYAN },
@ -3181,12 +3191,19 @@ static const struct {
{ 0x1e01b, 7, G_UNICODE_SCRIPT_GLAGOLITIC },
{ 0x1e023, 2, G_UNICODE_SCRIPT_GLAGOLITIC },
{ 0x1e026, 5, G_UNICODE_SCRIPT_GLAGOLITIC },
{ 0x1e100, 45, G_UNICODE_SCRIPT_NYIAKENG_PUACHUE_HMONG },
{ 0x1e130, 14, G_UNICODE_SCRIPT_NYIAKENG_PUACHUE_HMONG },
{ 0x1e140, 10, G_UNICODE_SCRIPT_NYIAKENG_PUACHUE_HMONG },
{ 0x1e14e, 2, G_UNICODE_SCRIPT_NYIAKENG_PUACHUE_HMONG },
{ 0x1e2c0, 58, G_UNICODE_SCRIPT_WANCHO },
{ 0x1e2ff, 1, G_UNICODE_SCRIPT_WANCHO },
{ 0x1e800, 197, G_UNICODE_SCRIPT_MENDE_KIKAKUI },
{ 0x1e8c7, 16, G_UNICODE_SCRIPT_MENDE_KIKAKUI },
{ 0x1e900, 75, G_UNICODE_SCRIPT_ADLAM },
{ 0x1e900, 76, G_UNICODE_SCRIPT_ADLAM },
{ 0x1e950, 10, G_UNICODE_SCRIPT_ADLAM },
{ 0x1e95e, 2, G_UNICODE_SCRIPT_ADLAM },
{ 0x1ec71, 68, G_UNICODE_SCRIPT_COMMON },
{ 0x1ed01, 61, G_UNICODE_SCRIPT_COMMON },
{ 0x1ee00, 4, G_UNICODE_SCRIPT_ARABIC },
{ 0x1ee05, 27, G_UNICODE_SCRIPT_ARABIC },
{ 0x1ee21, 2, G_UNICODE_SCRIPT_ARABIC },
@ -3228,7 +3245,7 @@ static const struct {
{ 0x1f0c1, 15, G_UNICODE_SCRIPT_COMMON },
{ 0x1f0d1, 37, G_UNICODE_SCRIPT_COMMON },
{ 0x1f100, 13, G_UNICODE_SCRIPT_COMMON },
{ 0x1f110, 92, G_UNICODE_SCRIPT_COMMON },
{ 0x1f110, 93, G_UNICODE_SCRIPT_COMMON },
{ 0x1f170, 61, G_UNICODE_SCRIPT_COMMON },
{ 0x1f1e6, 26, G_UNICODE_SCRIPT_COMMON },
{ 0x1f200, 1, G_UNICODE_SCRIPT_HIRAGANA },
@ -3237,26 +3254,29 @@ static const struct {
{ 0x1f240, 9, G_UNICODE_SCRIPT_COMMON },
{ 0x1f250, 2, G_UNICODE_SCRIPT_COMMON },
{ 0x1f260, 6, G_UNICODE_SCRIPT_COMMON },
{ 0x1f300, 981, G_UNICODE_SCRIPT_COMMON },
{ 0x1f300, 982, G_UNICODE_SCRIPT_COMMON },
{ 0x1f6e0, 13, G_UNICODE_SCRIPT_COMMON },
{ 0x1f6f0, 10, G_UNICODE_SCRIPT_COMMON },
{ 0x1f6f0, 11, G_UNICODE_SCRIPT_COMMON },
{ 0x1f700, 116, G_UNICODE_SCRIPT_COMMON },
{ 0x1f780, 89, G_UNICODE_SCRIPT_COMMON },
{ 0x1f7e0, 12, G_UNICODE_SCRIPT_COMMON },
{ 0x1f800, 12, G_UNICODE_SCRIPT_COMMON },
{ 0x1f810, 56, G_UNICODE_SCRIPT_COMMON },
{ 0x1f850, 10, G_UNICODE_SCRIPT_COMMON },
{ 0x1f860, 40, G_UNICODE_SCRIPT_COMMON },
{ 0x1f890, 30, G_UNICODE_SCRIPT_COMMON },
{ 0x1f900, 12, G_UNICODE_SCRIPT_COMMON },
{ 0x1f910, 47, G_UNICODE_SCRIPT_COMMON },
{ 0x1f940, 49, G_UNICODE_SCRIPT_COMMON },
{ 0x1f90d, 101, G_UNICODE_SCRIPT_COMMON },
{ 0x1f973, 4, G_UNICODE_SCRIPT_COMMON },
{ 0x1f97a, 1, G_UNICODE_SCRIPT_COMMON },
{ 0x1f97c, 39, G_UNICODE_SCRIPT_COMMON },
{ 0x1f9b0, 10, G_UNICODE_SCRIPT_COMMON },
{ 0x1f9c0, 3, G_UNICODE_SCRIPT_COMMON },
{ 0x1f9d0, 48, G_UNICODE_SCRIPT_COMMON },
{ 0x1f97a, 41, G_UNICODE_SCRIPT_COMMON },
{ 0x1f9a5, 6, G_UNICODE_SCRIPT_COMMON },
{ 0x1f9ae, 29, G_UNICODE_SCRIPT_COMMON },
{ 0x1f9cd, 135, G_UNICODE_SCRIPT_COMMON },
{ 0x1fa60, 14, G_UNICODE_SCRIPT_COMMON },
{ 0x1fa70, 4, G_UNICODE_SCRIPT_COMMON },
{ 0x1fa78, 3, G_UNICODE_SCRIPT_COMMON },
{ 0x1fa80, 3, G_UNICODE_SCRIPT_COMMON },
{ 0x1fa90, 6, G_UNICODE_SCRIPT_COMMON },
{ 0x20000, 42711, G_UNICODE_SCRIPT_HAN },
{ 0x2a700, 4149, G_UNICODE_SCRIPT_HAN },
{ 0x2b740, 222, G_UNICODE_SCRIPT_HAN },

File diff suppressed because it is too large Load Diff

File diff suppressed because it is too large Load Diff

View File

@ -607,7 +607,13 @@ typedef enum
G_UNICODE_SCRIPT_MAKASAR, /* Maka */
G_UNICODE_SCRIPT_MEDEFAIDRIN, /* Medf */
G_UNICODE_SCRIPT_OLD_SOGDIAN, /* Sogo */
G_UNICODE_SCRIPT_SOGDIAN /* Sogd */
G_UNICODE_SCRIPT_SOGDIAN, /* Sogd */
/* Unicode 12.0 additions */
G_UNICODE_SCRIPT_ELYMAIC, /* Elym */
G_UNICODE_SCRIPT_NANDINAGARI, /* Nand */
G_UNICODE_SCRIPT_NYIAKENG_PUACHUE_HMONG, /* Hmnp */
G_UNICODE_SCRIPT_WANCHO /* Wcho */
} GUnicodeScript;
GLIB_AVAILABLE_IN_ALL

File diff suppressed because it is too large Load Diff

View File

@ -1449,6 +1449,12 @@ static const guint32 iso15924_tags[] =
PACK ('M','e','d','f'), /* G_UNICODE_SCRIPT_MEDEFAIDRIN */
PACK ('S','o','g','o'), /* G_UNICODE_SCRIPT_OLD_SOGDIAN */
PACK ('S','o','g','d'), /* G_UNICODE_SCRIPT_SOGDIAN */
/* Unicode 12.0 additions */
PACK ('E','l','y','m'), /* G_UNICODE_SCRIPT_ELYMAIC */
PACK ('N','a','n','d'), /* G_UNICODE_SCRIPT_NANDINAGARI */
PACK ('H','m','n','p'), /* G_UNICODE_SCRIPT_NYIAKENG_PUACHUE_HMONG */
PACK ('W','c','h','o'), /* G_UNICODE_SCRIPT_WANCHO */
#undef PACK
};

View File

@ -304,6 +304,10 @@ test_unichar_script (void)
{ G_UNICODE_SCRIPT_MEDEFAIDRIN, 0x16E40 },
{ G_UNICODE_SCRIPT_OLD_SOGDIAN, 0x10F00 },
{ G_UNICODE_SCRIPT_SOGDIAN, 0x10F30 },
{ G_UNICODE_SCRIPT_ELYMAIC, 0x10FE0 },
{ G_UNICODE_SCRIPT_NANDINAGARI, 0x119A0 },
{ G_UNICODE_SCRIPT_NYIAKENG_PUACHUE_HMONG, 0x1E100 },
{ G_UNICODE_SCRIPT_WANCHO, 0x1E2C0 },
};
for (i = 0; i < G_N_ELEMENTS (examples); i++)
g_assert_cmpint (g_unichar_get_script (examples[i].c), ==, examples[i].script);
@ -911,6 +915,12 @@ test_iso15924 (void)
{ G_UNICODE_SCRIPT_MEDEFAIDRIN, "Medf" },
{ G_UNICODE_SCRIPT_OLD_SOGDIAN, "Sogo" },
{ G_UNICODE_SCRIPT_SOGDIAN, "Sogd" },
/* Unicode 12.0 additions */
{ G_UNICODE_SCRIPT_ELYMAIC, "Elym" },
{ G_UNICODE_SCRIPT_NANDINAGARI, "Nand" },
{ G_UNICODE_SCRIPT_NYIAKENG_PUACHUE_HMONG, "Hmnp" },
{ G_UNICODE_SCRIPT_WANCHO, "Wcho" },
};
guint i;

View File

@ -1,4 +1,4 @@
# Test cases generated from Unicode 11.0.0 data
# Test cases generated from Unicode 12.0.0 data
# by gen-casefold-txt.py. Do not edit.
#
# Some special hand crafted tests
@ -1144,6 +1144,13 @@ Z z
Ꞷ ꞷ
Ꞹ ꞹ
Ꞻ ꞻ
Ꞽ ꞽ
Ꞿ ꞿ
Ꟃ ꟃ
Ꞔ ꞔ
Ʂ ʂ
Ᶎ ᶎ

View File

@ -1,4 +1,4 @@
# Test cases generated from Unicode 11.0.0 data
# Test cases generated from Unicode 12.0.0 data
# by gen-casemap-txt.py. Do not edit.
#
# Some special hand crafted tests
@ -541,7 +541,7 @@ lt_LT.UTF-8 Į́ į̇́ Į́ Į́ # LATIN CAPITAL LETTER I WITH OGONEK (with ac
ɿ ɿ # 27F
ʀ ʀ Ʀ Ʀ # 280
ʁ ʁ # 281
ʂ ʂ # 282
ʂ ʂ # 282
ʃ ʃ Ʃ Ʃ # 283
ʄ ʄ # 284
ʅ ʅ # 285
@ -1398,7 +1398,7 @@ lt_LT.UTF-8 Į́ į̇́ Į́ Į́ # LATIN CAPITAL LETTER I WITH OGONEK (with ac
ᶋ ᶋ # 1D8B
# 1D8C
ᶍ ᶍ # 1D8D
ᶎ ᶎ # 1D8E
ᶎ ᶎ # 1D8E
ᶏ ᶏ # 1D8F
ᶐ ᶐ # 1D90
ᶑ ᶑ # 1D91
@ -2383,7 +2383,7 @@ lt_LT.UTF-8 Į́ į̇́ Į́ Į́ # LATIN CAPITAL LETTER I WITH OGONEK (with ac
ꞑ ꞑ Ꞑ Ꞑ # A791
Ꞓ ꞓ Ꞓ # A792
ꞓ ꞓ Ꞓ Ꞓ # A793
ꞔ ꞔ # A794
ꞔ ꞔ # A794
ꞕ ꞕ # A795
Ꞗ ꞗ Ꞗ # A796
ꞗ ꞗ Ꞗ Ꞗ # A797
@ -2421,6 +2421,17 @@ lt_LT.UTF-8 Į́ į̇́ Į́ Į́ # LATIN CAPITAL LETTER I WITH OGONEK (with ac
ꞷ ꞷ Ꞷ Ꞷ # A7B7
Ꞹ ꞹ Ꞹ # A7B8
ꞹ ꞹ Ꞹ Ꞹ # A7B9
Ꞻ ꞻ Ꞻ # A7BA
ꞻ ꞻ Ꞻ Ꞻ # A7BB
Ꞽ ꞽ Ꞽ # A7BC
ꞽ ꞽ Ꞽ Ꞽ # A7BD
Ꞿ ꞿ Ꞿ # A7BE
ꞿ ꞿ Ꞿ Ꞿ # A7BF
Ꟃ ꟃ Ꟃ # A7C2
ꟃ ꟃ Ꟃ Ꟃ # A7C3
Ꞔ ꞔ Ꞔ # A7C4
Ʂ ʂ Ʂ # A7C5
Ᶎ ᶎ Ᶎ # A7C6
ꟺ ꟺ # A7FA
ꬰ ꬰ # AB30
ꬱ ꬱ # AB31
@ -2471,6 +2482,8 @@ lt_LT.UTF-8 Į́ į̇́ Į́ Į́ # LATIN CAPITAL LETTER I WITH OGONEK (with ac
ꭣ ꭣ # AB63
ꭤ ꭤ # AB64
ꭥ ꭥ # AB65
ꭦ ꭦ # AB66
ꭧ ꭧ # AB67
ꭰ ꭰ # AB70
ꭱ ꭱ # AB71
ꭲ ꭲ # AB72