unicode: Update to Unicode 9.0.0

https://bugzilla.gnome.org/show_bug.cgi?id=771591
This commit is contained in:
Rico Tzschichholz 2016-09-17 15:57:10 +02:00
parent c7f4699735
commit ba18667bb4
7 changed files with 3575 additions and 2382 deletions

View File

@ -751,14 +751,9 @@ static const guchar g_script_easy_table[8192] = {
G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC,
G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC,
G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC,
G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC,
G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
@ -771,6 +766,11 @@ static const guchar g_script_easy_table[8192] = {
G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC,
G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC,
G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC,
G_UNICODE_SCRIPT_COMMON, G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC,
G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC,
G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC,
G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC,
G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC,
G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC,
G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC,
G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC, G_UNICODE_SCRIPT_ARABIC,
@ -1074,7 +1074,7 @@ static const guchar g_script_easy_table[8192] = {
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_TELUGU, G_UNICODE_SCRIPT_TELUGU, G_UNICODE_SCRIPT_TELUGU,
G_UNICODE_SCRIPT_TELUGU, G_UNICODE_SCRIPT_TELUGU, G_UNICODE_SCRIPT_TELUGU,
G_UNICODE_SCRIPT_TELUGU, G_UNICODE_SCRIPT_TELUGU, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_TELUGU, G_UNICODE_SCRIPT_TELUGU, G_UNICODE_SCRIPT_KANNADA,
G_UNICODE_SCRIPT_KANNADA, G_UNICODE_SCRIPT_KANNADA, G_UNICODE_SCRIPT_KANNADA,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_KANNADA, G_UNICODE_SCRIPT_KANNADA,
G_UNICODE_SCRIPT_KANNADA, G_UNICODE_SCRIPT_KANNADA, G_UNICODE_SCRIPT_KANNADA,
@ -1143,12 +1143,12 @@ static const guchar g_script_easy_table[8192] = {
G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_MALAYALAM,
G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM,
G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM,
G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM,
G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM,
G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM,
G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM,
G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM,
@ -1156,8 +1156,8 @@ static const guchar g_script_easy_table[8192] = {
G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM,
G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM,
G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM,
G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_MALAYALAM,
G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM,
G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM,
G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM,
G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM, G_UNICODE_SCRIPT_MALAYALAM,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_SINHALA,
@ -2440,9 +2440,9 @@ static const guchar g_script_easy_table[8192] = {
G_UNICODE_SCRIPT_OL_CHIKI, G_UNICODE_SCRIPT_OL_CHIKI, G_UNICODE_SCRIPT_OL_CHIKI,
G_UNICODE_SCRIPT_OL_CHIKI, G_UNICODE_SCRIPT_OL_CHIKI, G_UNICODE_SCRIPT_OL_CHIKI,
G_UNICODE_SCRIPT_OL_CHIKI, G_UNICODE_SCRIPT_OL_CHIKI, G_UNICODE_SCRIPT_OL_CHIKI,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_CYRILLIC, G_UNICODE_SCRIPT_CYRILLIC, G_UNICODE_SCRIPT_CYRILLIC,
G_UNICODE_SCRIPT_CYRILLIC, G_UNICODE_SCRIPT_CYRILLIC, G_UNICODE_SCRIPT_CYRILLIC,
G_UNICODE_SCRIPT_CYRILLIC, G_UNICODE_SCRIPT_CYRILLIC, G_UNICODE_SCRIPT_CYRILLIC,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
@ -2566,7 +2566,7 @@ static const guchar g_script_easy_table[8192] = {
G_UNICODE_SCRIPT_INHERITED, G_UNICODE_SCRIPT_INHERITED, G_UNICODE_SCRIPT_INHERITED,
G_UNICODE_SCRIPT_INHERITED, G_UNICODE_SCRIPT_INHERITED, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_INHERITED,
G_UNICODE_SCRIPT_UNKNOWN, G_UNICODE_SCRIPT_INHERITED, G_UNICODE_SCRIPT_INHERITED,
G_UNICODE_SCRIPT_INHERITED, G_UNICODE_SCRIPT_INHERITED, G_UNICODE_SCRIPT_INHERITED,
G_UNICODE_SCRIPT_LATIN, G_UNICODE_SCRIPT_LATIN, G_UNICODE_SCRIPT_LATIN,
G_UNICODE_SCRIPT_LATIN, G_UNICODE_SCRIPT_LATIN, G_UNICODE_SCRIPT_LATIN,
@ -2768,7 +2768,7 @@ static const struct {
{ 0x214f, 17, G_UNICODE_SCRIPT_COMMON },
{ 0x2160, 41, G_UNICODE_SCRIPT_LATIN },
{ 0x2189, 3, G_UNICODE_SCRIPT_COMMON },
{ 0x2190, 619, G_UNICODE_SCRIPT_COMMON },
{ 0x2190, 623, G_UNICODE_SCRIPT_COMMON },
{ 0x2400, 39, G_UNICODE_SCRIPT_COMMON },
{ 0x2440, 11, G_UNICODE_SCRIPT_COMMON },
{ 0x2460, 928, G_UNICODE_SCRIPT_COMMON },
@ -2800,7 +2800,7 @@ static const struct {
{ 0x2dd0, 7, G_UNICODE_SCRIPT_ETHIOPIC },
{ 0x2dd8, 7, G_UNICODE_SCRIPT_ETHIOPIC },
{ 0x2de0, 32, G_UNICODE_SCRIPT_CYRILLIC },
{ 0x2e00, 67, G_UNICODE_SCRIPT_COMMON },
{ 0x2e00, 69, G_UNICODE_SCRIPT_COMMON },
{ 0x2e80, 26, G_UNICODE_SCRIPT_HAN },
{ 0x2e9b, 89, G_UNICODE_SCRIPT_HAN },
{ 0x2f00, 214, G_UNICODE_SCRIPT_HAN },
@ -2849,13 +2849,13 @@ static const struct {
{ 0xa700, 34, G_UNICODE_SCRIPT_COMMON },
{ 0xa722, 102, G_UNICODE_SCRIPT_LATIN },
{ 0xa788, 3, G_UNICODE_SCRIPT_COMMON },
{ 0xa78b, 35, G_UNICODE_SCRIPT_LATIN },
{ 0xa78b, 36, G_UNICODE_SCRIPT_LATIN },
{ 0xa7b0, 8, G_UNICODE_SCRIPT_LATIN },
{ 0xa7f7, 9, G_UNICODE_SCRIPT_LATIN },
{ 0xa800, 44, G_UNICODE_SCRIPT_SYLOTI_NAGRI },
{ 0xa830, 10, G_UNICODE_SCRIPT_COMMON },
{ 0xa840, 56, G_UNICODE_SCRIPT_PHAGS_PA },
{ 0xa880, 69, G_UNICODE_SCRIPT_SAURASHTRA },
{ 0xa880, 70, G_UNICODE_SCRIPT_SAURASHTRA },
{ 0xa8ce, 12, G_UNICODE_SCRIPT_SAURASHTRA },
{ 0xa8e0, 30, G_UNICODE_SCRIPT_DEVANAGARI },
{ 0xa900, 46, G_UNICODE_SCRIPT_KAYAH_LI },
@ -2945,7 +2945,7 @@ static const struct {
{ 0x10100, 3, G_UNICODE_SCRIPT_COMMON },
{ 0x10107, 45, G_UNICODE_SCRIPT_COMMON },
{ 0x10137, 9, G_UNICODE_SCRIPT_COMMON },
{ 0x10140, 77, G_UNICODE_SCRIPT_GREEK },
{ 0x10140, 79, G_UNICODE_SCRIPT_GREEK },
{ 0x10190, 12, G_UNICODE_SCRIPT_COMMON },
{ 0x101a0, 1, G_UNICODE_SCRIPT_GREEK },
{ 0x101d0, 45, G_UNICODE_SCRIPT_COMMON },
@ -2965,6 +2965,8 @@ static const struct {
{ 0x10450, 48, G_UNICODE_SCRIPT_SHAVIAN },
{ 0x10480, 30, G_UNICODE_SCRIPT_OSMANYA },
{ 0x104a0, 10, G_UNICODE_SCRIPT_OSMANYA },
{ 0x104b0, 36, G_UNICODE_SCRIPT_OSAGE },
{ 0x104d8, 36, G_UNICODE_SCRIPT_OSAGE },
{ 0x10500, 40, G_UNICODE_SCRIPT_ELBASAN },
{ 0x10530, 52, G_UNICODE_SCRIPT_CAUCASIAN_ALBANIAN },
{ 0x1056f, 1, G_UNICODE_SCRIPT_CAUCASIAN_ALBANIAN },
@ -3032,7 +3034,7 @@ static const struct {
{ 0x111d0, 16, G_UNICODE_SCRIPT_SHARADA },
{ 0x111e1, 20, G_UNICODE_SCRIPT_SINHALA },
{ 0x11200, 18, G_UNICODE_SCRIPT_KHOJKI },
{ 0x11213, 43, G_UNICODE_SCRIPT_KHOJKI },
{ 0x11213, 44, G_UNICODE_SCRIPT_KHOJKI },
{ 0x11280, 7, G_UNICODE_SCRIPT_MULTANI },
{ 0x11288, 1, G_UNICODE_SCRIPT_MULTANI },
{ 0x1128a, 4, G_UNICODE_SCRIPT_MULTANI },
@ -3055,12 +3057,16 @@ static const struct {
{ 0x1135d, 7, G_UNICODE_SCRIPT_GRANTHA },
{ 0x11366, 7, G_UNICODE_SCRIPT_GRANTHA },
{ 0x11370, 5, G_UNICODE_SCRIPT_GRANTHA },
{ 0x11400, 90, G_UNICODE_SCRIPT_NEWA },
{ 0x1145b, 1, G_UNICODE_SCRIPT_NEWA },
{ 0x1145d, 1, G_UNICODE_SCRIPT_NEWA },
{ 0x11480, 72, G_UNICODE_SCRIPT_TIRHUTA },
{ 0x114d0, 10, G_UNICODE_SCRIPT_TIRHUTA },
{ 0x11580, 54, G_UNICODE_SCRIPT_SIDDHAM },
{ 0x115b8, 38, G_UNICODE_SCRIPT_SIDDHAM },
{ 0x11600, 69, G_UNICODE_SCRIPT_MODI },
{ 0x11650, 10, G_UNICODE_SCRIPT_MODI },
{ 0x11660, 13, G_UNICODE_SCRIPT_MONGOLIAN },
{ 0x11680, 56, G_UNICODE_SCRIPT_TAKRI },
{ 0x116c0, 10, G_UNICODE_SCRIPT_TAKRI },
{ 0x11700, 26, G_UNICODE_SCRIPT_AHOM },
@ -3069,6 +3075,13 @@ static const struct {
{ 0x118a0, 83, G_UNICODE_SCRIPT_WARANG_CITI },
{ 0x118ff, 1, G_UNICODE_SCRIPT_WARANG_CITI },
{ 0x11ac0, 57, G_UNICODE_SCRIPT_PAU_CIN_HAU },
{ 0x11c00, 9, G_UNICODE_SCRIPT_BHAIKSUKI },
{ 0x11c0a, 45, G_UNICODE_SCRIPT_BHAIKSUKI },
{ 0x11c38, 14, G_UNICODE_SCRIPT_BHAIKSUKI },
{ 0x11c50, 29, G_UNICODE_SCRIPT_BHAIKSUKI },
{ 0x11c70, 32, G_UNICODE_SCRIPT_MARCHEN },
{ 0x11c92, 22, G_UNICODE_SCRIPT_MARCHEN },
{ 0x11ca9, 14, G_UNICODE_SCRIPT_MARCHEN },
{ 0x12000, 922, G_UNICODE_SCRIPT_CUNEIFORM },
{ 0x12400, 111, G_UNICODE_SCRIPT_CUNEIFORM },
{ 0x12470, 5, G_UNICODE_SCRIPT_CUNEIFORM },
@ -3089,6 +3102,9 @@ static const struct {
{ 0x16f00, 69, G_UNICODE_SCRIPT_MIAO },
{ 0x16f50, 47, G_UNICODE_SCRIPT_MIAO },
{ 0x16f8f, 17, G_UNICODE_SCRIPT_MIAO },
{ 0x16fe0, 1, G_UNICODE_SCRIPT_TANGUT },
{ 0x17000, 6125, G_UNICODE_SCRIPT_TANGUT },
{ 0x18800, 755, G_UNICODE_SCRIPT_TANGUT },
{ 0x1b000, 1, G_UNICODE_SCRIPT_KATAKANA },
{ 0x1b001, 1, G_UNICODE_SCRIPT_HIRAGANA },
{ 0x1bc00, 107, G_UNICODE_SCRIPT_DUPLOYAN },
@ -3135,8 +3151,16 @@ static const struct {
{ 0x1d800, 652, G_UNICODE_SCRIPT_SIGNWRITING },
{ 0x1da9b, 5, G_UNICODE_SCRIPT_SIGNWRITING },
{ 0x1daa1, 15, G_UNICODE_SCRIPT_SIGNWRITING },
{ 0x1e000, 7, G_UNICODE_SCRIPT_GLAGOLITIC },
{ 0x1e008, 17, G_UNICODE_SCRIPT_GLAGOLITIC },
{ 0x1e01b, 7, G_UNICODE_SCRIPT_GLAGOLITIC },
{ 0x1e023, 2, G_UNICODE_SCRIPT_GLAGOLITIC },
{ 0x1e026, 5, G_UNICODE_SCRIPT_GLAGOLITIC },
{ 0x1e800, 197, G_UNICODE_SCRIPT_MENDE_KIKAKUI },
{ 0x1e8c7, 16, G_UNICODE_SCRIPT_MENDE_KIKAKUI },
{ 0x1e900, 75, G_UNICODE_SCRIPT_ADLAM },
{ 0x1e950, 10, G_UNICODE_SCRIPT_ADLAM },
{ 0x1e95e, 2, G_UNICODE_SCRIPT_ADLAM },
{ 0x1ee00, 4, G_UNICODE_SCRIPT_ARABIC },
{ 0x1ee05, 27, G_UNICODE_SCRIPT_ARABIC },
{ 0x1ee21, 2, G_UNICODE_SCRIPT_ARABIC },
@ -3180,18 +3204,16 @@ static const struct {
{ 0x1f100, 13, G_UNICODE_SCRIPT_COMMON },
{ 0x1f110, 31, G_UNICODE_SCRIPT_COMMON },
{ 0x1f130, 60, G_UNICODE_SCRIPT_COMMON },
{ 0x1f170, 43, G_UNICODE_SCRIPT_COMMON },
{ 0x1f170, 61, G_UNICODE_SCRIPT_COMMON },
{ 0x1f1e6, 26, G_UNICODE_SCRIPT_COMMON },
{ 0x1f200, 1, G_UNICODE_SCRIPT_HIRAGANA },
{ 0x1f201, 2, G_UNICODE_SCRIPT_COMMON },
{ 0x1f210, 43, G_UNICODE_SCRIPT_COMMON },
{ 0x1f210, 44, G_UNICODE_SCRIPT_COMMON },
{ 0x1f240, 9, G_UNICODE_SCRIPT_COMMON },
{ 0x1f250, 2, G_UNICODE_SCRIPT_COMMON },
{ 0x1f300, 634, G_UNICODE_SCRIPT_COMMON },
{ 0x1f57b, 41, G_UNICODE_SCRIPT_COMMON },
{ 0x1f5a5, 300, G_UNICODE_SCRIPT_COMMON },
{ 0x1f300, 979, G_UNICODE_SCRIPT_COMMON },
{ 0x1f6e0, 13, G_UNICODE_SCRIPT_COMMON },
{ 0x1f6f0, 4, G_UNICODE_SCRIPT_COMMON },
{ 0x1f6f0, 7, G_UNICODE_SCRIPT_COMMON },
{ 0x1f700, 116, G_UNICODE_SCRIPT_COMMON },
{ 0x1f780, 85, G_UNICODE_SCRIPT_COMMON },
{ 0x1f800, 12, G_UNICODE_SCRIPT_COMMON },
@ -3199,8 +3221,13 @@ static const struct {
{ 0x1f850, 10, G_UNICODE_SCRIPT_COMMON },
{ 0x1f860, 40, G_UNICODE_SCRIPT_COMMON },
{ 0x1f890, 30, G_UNICODE_SCRIPT_COMMON },
{ 0x1f910, 9, G_UNICODE_SCRIPT_COMMON },
{ 0x1f980, 5, G_UNICODE_SCRIPT_COMMON },
{ 0x1f910, 15, G_UNICODE_SCRIPT_COMMON },
{ 0x1f920, 8, G_UNICODE_SCRIPT_COMMON },
{ 0x1f930, 1, G_UNICODE_SCRIPT_COMMON },
{ 0x1f933, 12, G_UNICODE_SCRIPT_COMMON },
{ 0x1f940, 12, G_UNICODE_SCRIPT_COMMON },
{ 0x1f950, 15, G_UNICODE_SCRIPT_COMMON },
{ 0x1f980, 18, G_UNICODE_SCRIPT_COMMON },
{ 0x1f9c0, 1, G_UNICODE_SCRIPT_COMMON },
{ 0x20000, 42711, G_UNICODE_SCRIPT_HAN },
{ 0x2a700, 4149, G_UNICODE_SCRIPT_HAN },

File diff suppressed because it is too large Load Diff

File diff suppressed because it is too large Load Diff

View File

@ -201,6 +201,9 @@ typedef enum
* @G_UNICODE_BREAK_CONDITIONAL_JAPANESE_STARTER: Conditional Japanese Starter (CJ). Since: 2.32
* @G_UNICODE_BREAK_HEBREW_LETTER: Hebrew Letter (HL). Since: 2.32
* @G_UNICODE_BREAK_REGIONAL_INDICATOR: Regional Indicator (RI). Since: 2.36
* @G_UNICODE_BREAK_EMOJI_BASE: Emoji Base (EB). Since: 2.50
* @G_UNICODE_BREAK_EMOJI_MODIFIER: Emoji Modifier (EM). Since: 2.50
* @G_UNICODE_BREAK_ZERO_WIDTH_JOINER: Zero Width Joiner (ZWJ). Since: 2.50
*
* These are the possible line break classifications.
*
@ -250,7 +253,10 @@ typedef enum
G_UNICODE_BREAK_CLOSE_PARANTHESIS,
G_UNICODE_BREAK_CONDITIONAL_JAPANESE_STARTER,
G_UNICODE_BREAK_HEBREW_LETTER,
G_UNICODE_BREAK_REGIONAL_INDICATOR
G_UNICODE_BREAK_REGIONAL_INDICATOR,
G_UNICODE_BREAK_EMOJI_BASE,
G_UNICODE_BREAK_EMOJI_MODIFIER,
G_UNICODE_BREAK_ZERO_WIDTH_JOINER
} GUnicodeBreakType;
/**
@ -400,6 +406,12 @@ typedef enum
* @G_UNICODE_SCRIPT_MULTANI: Multani. Since: 2.48
* @G_UNICODE_SCRIPT_OLD_HUNGARIAN: Old Hungarian. Since: 2.48
* @G_UNICODE_SCRIPT_SIGNWRITING: Signwriting. Since: 2.48
* @G_UNICODE_SCRIPT_ADLAM: Adlam. Since: 2.50
* @G_UNICODE_SCRIPT_BHAIKSUKI: Bhaiksuki. Since: 2.50
* @G_UNICODE_SCRIPT_MARCHEN: Marchen. Since: 2.50
* @G_UNICODE_SCRIPT_NEWA: Newa. Since: 2.50
* @G_UNICODE_SCRIPT_OSAGE: Osage. Since: 2.50
* @G_UNICODE_SCRIPT_TANGUT: Tangut. Since: 2.50
*
* The #GUnicodeScript enumeration identifies different writing
* systems. The values correspond to the names as defined in the
@ -564,7 +576,15 @@ typedef enum
G_UNICODE_SCRIPT_HATRAN, /* Hatr */
G_UNICODE_SCRIPT_MULTANI, /* Mult */
G_UNICODE_SCRIPT_OLD_HUNGARIAN, /* Hung */
G_UNICODE_SCRIPT_SIGNWRITING /* Sgnw */
G_UNICODE_SCRIPT_SIGNWRITING, /* Sgnw */
/* Unicode 9.0 additions */
G_UNICODE_SCRIPT_ADLAM, /* Adlm */
G_UNICODE_SCRIPT_BHAIKSUKI, /* Bhks */
G_UNICODE_SCRIPT_MARCHEN, /* Marc */
G_UNICODE_SCRIPT_NEWA, /* Newa */
G_UNICODE_SCRIPT_OSAGE, /* Osge */
G_UNICODE_SCRIPT_TANGUT /* Tang */
} GUnicodeScript;
GLIB_AVAILABLE_IN_ALL

File diff suppressed because it is too large Load Diff

View File

@ -1421,6 +1421,14 @@ static const guint32 iso15924_tags[] =
PACK ('M','u','l','t'), /* G_UNICODE_SCRIPT_MULTANI */
PACK ('H','u','n','g'), /* G_UNICODE_SCRIPT_OLD_HUNGARIAN */
PACK ('S','g','n','w'), /* G_UNICODE_SCRIPT_SIGNWRITING */
/* Unicode 9.0 additions */
PACK ('O','s','g','e'), /* G_UNICODE_SCRIPT_OSAGE */
PACK ('N','e','w','a'), /* G_UNICODE_SCRIPT_NEWA */
PACK ('B','h','k','s'), /* G_UNICODE_SCRIPT_BHAIKSUKI */
PACK ('M','a','r','c'), /* G_UNICODE_SCRIPT_MARCHEN */
PACK ('T','a','n','g'), /* G_UNICODE_SCRIPT_TANGUT */
PACK ('A','d','l','m'), /* G_UNICODE_SCRIPT_ADLAM */
#undef PACK
};

View File

@ -131,7 +131,10 @@ test_unichar_break_type (void)
{ G_UNICODE_BREAK_HANGUL_LVT_SYLLABLE, 0xAC01 },
{ G_UNICODE_BREAK_CONDITIONAL_JAPANESE_STARTER, 0x3041 },
{ G_UNICODE_BREAK_HEBREW_LETTER, 0x05D0 },
{ G_UNICODE_BREAK_REGIONAL_INDICATOR, 0x1F1F6 }
{ G_UNICODE_BREAK_REGIONAL_INDICATOR, 0x1F1F6 },
{ G_UNICODE_BREAK_EMOJI_BASE, 0x1F466 },
{ G_UNICODE_BREAK_EMOJI_MODIFIER, 0x1F3FB },
{ G_UNICODE_BREAK_ZERO_WIDTH_JOINER, 0x200D },
};
for (i = 0; i < G_N_ELEMENTS (examples); i++)
@ -284,6 +287,12 @@ test_unichar_script (void)
{ G_UNICODE_SCRIPT_CUNEIFORM, 0x12480 },
{ G_UNICODE_SCRIPT_ANATOLIAN_HIEROGLYPHS, 0x14400 },
{ G_UNICODE_SCRIPT_SIGNWRITING, 0x1D800 },
{ G_UNICODE_SCRIPT_ADLAM, 0x1E900 },
{ G_UNICODE_SCRIPT_BHAIKSUKI, 0x11C00 },
{ G_UNICODE_SCRIPT_MARCHEN, 0x11C70 },
{ G_UNICODE_SCRIPT_NEWA, 0x11400 },
{ G_UNICODE_SCRIPT_OSAGE, 0x104B0 },
{ G_UNICODE_SCRIPT_TANGUT, 0x16FE0 },
};
for (i = 0; i < G_N_ELEMENTS (examples); i++)
g_assert_cmpint (g_unichar_get_script (examples[i].c), ==, examples[i].script);
@ -868,6 +877,14 @@ test_iso15924 (void)
{ G_UNICODE_SCRIPT_MULTANI, "Mult" },
{ G_UNICODE_SCRIPT_OLD_HUNGARIAN, "Hung" },
{ G_UNICODE_SCRIPT_SIGNWRITING, "Sgnw" },
/* Unicode 9.0 additions */
{ G_UNICODE_SCRIPT_ADLAM, "Adlm" },
{ G_UNICODE_SCRIPT_BHAIKSUKI, "Bhks" },
{ G_UNICODE_SCRIPT_MARCHEN, "Marc" },
{ G_UNICODE_SCRIPT_NEWA, "Newa" },
{ G_UNICODE_SCRIPT_OSAGE, "Osge" },
{ G_UNICODE_SCRIPT_TANGUT, "Tang" },
};
guint i;