| 1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030 |
- /*
- * Copyright © 2011 Codethink Limited
- * Copyright © 2011 Google, Inc.
- *
- * This is part of HarfBuzz, a text shaping library.
- *
- * Permission is hereby granted, without written agreement and without
- * license or royalty fees, to use, copy, modify, and distribute this
- * software and its documentation for any purpose, provided that the
- * above copyright notice and the following two paragraphs appear in
- * all copies of this software.
- *
- * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
- * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
- * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
- * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
- * DAMAGE.
- *
- * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
- * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
- * FITNESS FOR A PARTICULAR PURPOSE. THE SOFTWARE PROVIDED HEREUNDER IS
- * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
- * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
- *
- * Codethink Author(s): Ryan Lortie
- * Google Author(s): Behdad Esfahbod
- */
- #include "hb-test.h"
- /* Unit tests for hb-unicode.h */
- /* Unit tests for hb-glib.h */
- /* Unit tests for hb-icu.h */
- #ifdef HAVE_GLIB
- #include <hb-glib.h>
- #endif
- #ifdef HAVE_ICU
- #include <hb-icu.h>
- #endif
- /* Some useful stuff */
- #define MAGIC0 0x12345678
- #define MAGIC1 0x76543210
- typedef struct {
- int value;
- gboolean freed;
- } data_t;
- static void free_up (void *p)
- {
- data_t *data = (data_t *) p;
- g_assert (data->value == MAGIC0 || data->value == MAGIC1);
- g_assert (!data->freed);
- data->freed = TRUE;
- }
- static hb_script_t
- simple_get_script (hb_unicode_funcs_t *ufuncs,
- hb_codepoint_t codepoint,
- void *user_data)
- {
- data_t *data = (data_t *) user_data;
- g_assert (hb_unicode_funcs_get_parent (ufuncs) != NULL);
- g_assert_cmphex (data->value, ==, MAGIC0);
- g_assert (!data->freed);
- if ('a' <= codepoint && codepoint <= 'z')
- return HB_SCRIPT_LATIN;
- else
- return HB_SCRIPT_UNKNOWN;
- }
- static hb_script_t
- a_is_for_arabic_get_script (hb_unicode_funcs_t *ufuncs,
- hb_codepoint_t codepoint,
- void *user_data)
- {
- data_t *data = (data_t *) user_data;
- g_assert (hb_unicode_funcs_get_parent (ufuncs) != NULL);
- g_assert_cmphex (data->value, ==, MAGIC1);
- g_assert (!data->freed);
- if (codepoint == 'a') {
- return HB_SCRIPT_ARABIC;
- } else {
- hb_unicode_funcs_t *parent = hb_unicode_funcs_get_parent (ufuncs);
- return hb_unicode_script (parent, codepoint);
- }
- }
- /* Check all properties */
- /* Some of the following tables where adapted from glib/glib/tests/utf8-misc.c.
- * The license is compatible. */
- typedef struct {
- hb_codepoint_t unicode;
- unsigned int value;
- } test_pair_t;
- static const test_pair_t combining_class_tests[] =
- {
- { 0x0020, 0 },
- { 0x0334, 1 },
- { 0x093C, 7 },
- { 0x3099, 8 },
- { 0x094D, 9 },
- { 0x05B0, 10 },
- { 0x05B1, 11 },
- { 0x05B2, 12 },
- { 0x05B3, 13 },
- { 0x05B4, 14 },
- { 0x05B5, 15 },
- { 0x05B6, 16 },
- { 0x05B7, 17 },
- { 0x05B8, 18 },
- { 0x05B9, 19 },
- { 0x05BB, 20 },
- { 0x05BC, 21 },
- { 0x05BD, 22 },
- { 0x05BF, 23 },
- { 0x05C1, 24 },
- { 0x05C2, 25 },
- { 0xFB1E, 26 },
- { 0x064B, 27 },
- { 0x064C, 28 },
- { 0x064D, 29 },
- /* ... */
- { 0x05AE, 228 },
- { 0x0300, 230 },
- { 0x302C, 232 },
- { 0x0362, 233 },
- { 0x0360, 234 },
- { 0x0345, 240 },
- { 0x111111, 0 }
- };
- static const test_pair_t combining_class_tests_more[] =
- {
- /* Unicode-5.1 character additions */
- { 0x1DCD, 234 },
- /* Unicode-5.2 character additions */
- { 0xA8E0, 230 },
- /* Unicode-6.0 character additions */
- { 0x135D, 230 },
- /* Unicode-6.1 character additions */
- { 0xA674, 230 },
- /* Unicode-7.0 character additions */
- { 0x1AB0, 230 },
- /* Unicode-8.0 character additions */
- { 0xA69E, 230 },
- /* Unicode-9.0 character additions */
- { 0x1E000, 230 },
- /* Unicode-10.0 character additions */
- { 0x1DF6, 232 },
- /* Unicode-11.0 character additions */
- { 0x07FD, 220 },
- /* Unicode-12.0 character additions */
- { 0x0EBA, 9 },
- /* Unicode-13.0 character additions */
- { 0x1ABF, 220 },
- /* Unicode-14.0 character additions */
- { 0x1DFA, 218 },
- /* Unicode-15.0 character additions */
- { 0x10EFD, 220 },
- /* Unicode-16.0 character additions */
- { 0x0897, 230 },
- { 0x111111, 0 }
- };
- static const test_pair_t general_category_tests[] =
- {
- { 0x000D, HB_UNICODE_GENERAL_CATEGORY_CONTROL },
- { 0x200E, HB_UNICODE_GENERAL_CATEGORY_FORMAT },
- { 0x0378, HB_UNICODE_GENERAL_CATEGORY_UNASSIGNED },
- { 0xE000, HB_UNICODE_GENERAL_CATEGORY_PRIVATE_USE },
- { 0xD800, HB_UNICODE_GENERAL_CATEGORY_SURROGATE },
- { 0x0061, HB_UNICODE_GENERAL_CATEGORY_LOWERCASE_LETTER },
- { 0x02B0, HB_UNICODE_GENERAL_CATEGORY_MODIFIER_LETTER },
- { 0x3400, HB_UNICODE_GENERAL_CATEGORY_OTHER_LETTER },
- { 0x01C5, HB_UNICODE_GENERAL_CATEGORY_TITLECASE_LETTER },
- { 0xFF21, HB_UNICODE_GENERAL_CATEGORY_UPPERCASE_LETTER },
- { 0x0903, HB_UNICODE_GENERAL_CATEGORY_SPACING_MARK },
- { 0x20DD, HB_UNICODE_GENERAL_CATEGORY_ENCLOSING_MARK },
- { 0xA806, HB_UNICODE_GENERAL_CATEGORY_NON_SPACING_MARK },
- { 0xFF10, HB_UNICODE_GENERAL_CATEGORY_DECIMAL_NUMBER },
- { 0x16EE, HB_UNICODE_GENERAL_CATEGORY_LETTER_NUMBER },
- { 0x17F0, HB_UNICODE_GENERAL_CATEGORY_OTHER_NUMBER },
- { 0x005F, HB_UNICODE_GENERAL_CATEGORY_CONNECT_PUNCTUATION },
- { 0x058A, HB_UNICODE_GENERAL_CATEGORY_DASH_PUNCTUATION },
- { 0x0F3B, HB_UNICODE_GENERAL_CATEGORY_CLOSE_PUNCTUATION },
- { 0x2019, HB_UNICODE_GENERAL_CATEGORY_FINAL_PUNCTUATION },
- { 0x2018, HB_UNICODE_GENERAL_CATEGORY_INITIAL_PUNCTUATION },
- { 0x2016, HB_UNICODE_GENERAL_CATEGORY_OTHER_PUNCTUATION },
- { 0x0F3A, HB_UNICODE_GENERAL_CATEGORY_OPEN_PUNCTUATION },
- { 0x20A0, HB_UNICODE_GENERAL_CATEGORY_CURRENCY_SYMBOL },
- { 0x309B, HB_UNICODE_GENERAL_CATEGORY_MODIFIER_SYMBOL },
- { 0xFB29, HB_UNICODE_GENERAL_CATEGORY_MATH_SYMBOL },
- { 0x00A6, HB_UNICODE_GENERAL_CATEGORY_OTHER_SYMBOL },
- { 0x2028, HB_UNICODE_GENERAL_CATEGORY_LINE_SEPARATOR },
- { 0x2029, HB_UNICODE_GENERAL_CATEGORY_PARAGRAPH_SEPARATOR },
- { 0x202F, HB_UNICODE_GENERAL_CATEGORY_SPACE_SEPARATOR },
- { 0x111111, HB_UNICODE_GENERAL_CATEGORY_UNASSIGNED }
- };
- static const test_pair_t general_category_tests_more[] =
- {
- /* Unicode-5.2 character additions */
- { 0x1F131, HB_UNICODE_GENERAL_CATEGORY_OTHER_SYMBOL },
- /* Unicode-6.0 character additions */
- { 0x0620, HB_UNICODE_GENERAL_CATEGORY_OTHER_LETTER },
- /* Unicode-6.1 character additions */
- { 0x058F, HB_UNICODE_GENERAL_CATEGORY_CURRENCY_SYMBOL },
- /* Unicode-6.2 character additions */
- { 0x20BA, HB_UNICODE_GENERAL_CATEGORY_CURRENCY_SYMBOL },
- /* Unicode-6.3 character additions */
- { 0x061C, HB_UNICODE_GENERAL_CATEGORY_FORMAT },
- /* Unicode-7.0 character additions */
- { 0x058D, HB_UNICODE_GENERAL_CATEGORY_OTHER_SYMBOL },
- /* Unicode-8.0 character additions */
- { 0x08E3, HB_UNICODE_GENERAL_CATEGORY_NON_SPACING_MARK },
- /* Unicode-9.0 character additions */
- { 0x08D4, HB_UNICODE_GENERAL_CATEGORY_NON_SPACING_MARK },
- /* Unicode-10.0 character additions */
- { 0x09FD, HB_UNICODE_GENERAL_CATEGORY_OTHER_PUNCTUATION },
- /* Unicode-11.0 character additions */
- { 0x0560, HB_UNICODE_GENERAL_CATEGORY_LOWERCASE_LETTER },
- /* Unicode-12.0 character additions */
- { 0x0C77, HB_UNICODE_GENERAL_CATEGORY_OTHER_PUNCTUATION },
- /* Unicode-12.1 character additions */
- { 0x32FF, HB_UNICODE_GENERAL_CATEGORY_OTHER_SYMBOL },
- /* Unicode-13.0 character additions */
- { 0x08BE, HB_UNICODE_GENERAL_CATEGORY_OTHER_LETTER },
- /* Unicode-14.0 character additions */
- { 0x20C0, HB_UNICODE_GENERAL_CATEGORY_CURRENCY_SYMBOL },
- /* Unicode-15.0 character additions */
- { 0x0CF3, HB_UNICODE_GENERAL_CATEGORY_SPACING_MARK },
- /* Unicode-15.1 character additions */
- { 0x31EF, HB_UNICODE_GENERAL_CATEGORY_OTHER_SYMBOL },
- /* Unicode-16.0 character additions */
- { 0x10D6E, HB_UNICODE_GENERAL_CATEGORY_DASH_PUNCTUATION },
- { 0x111111, HB_UNICODE_GENERAL_CATEGORY_UNASSIGNED }
- };
- static const test_pair_t mirroring_tests[] =
- {
- /* Some characters that do NOT mirror */
- { 0x0020, 0x0020 },
- { 0x0041, 0x0041 },
- { 0x00F0, 0x00F0 },
- { 0x27CC, 0x27CC },
- { 0xE01EF, 0xE01EF },
- { 0x1D7C3, 0x1D7C3 },
- { 0x100000, 0x100000 },
- /* Some characters that do mirror */
- { 0x0029, 0x0028 },
- { 0x0028, 0x0029 },
- { 0x003E, 0x003C },
- { 0x003C, 0x003E },
- { 0x005D, 0x005B },
- { 0x005B, 0x005D },
- { 0x007D, 0x007B },
- { 0x007B, 0x007D },
- { 0x00BB, 0x00AB },
- { 0x00AB, 0x00BB },
- { 0x226B, 0x226A },
- { 0x226A, 0x226B },
- { 0x22F1, 0x22F0 },
- { 0x22F0, 0x22F1 },
- { 0xFF60, 0xFF5F },
- { 0xFF5F, 0xFF60 },
- { 0xFF63, 0xFF62 },
- { 0xFF62, 0xFF63 },
- { 0x111111, 0x111111 },
- };
- static const test_pair_t mirroring_tests_more[] =
- {
- /* Unicode-6.1 character additions */
- { 0x27CB, 0x27CD },
- /* Unicode-11.0 character additions */
- { 0x2BFE, 0x221F },
- { 0x111111, 0x111111 }
- };
- static const test_pair_t script_tests[] =
- {
- { 0x002A, HB_SCRIPT_COMMON },
- { 0x0670, HB_SCRIPT_INHERITED },
- { 0x060D, HB_SCRIPT_ARABIC },
- { 0x0559, HB_SCRIPT_ARMENIAN },
- { 0x09CD, HB_SCRIPT_BENGALI },
- { 0x31B6, HB_SCRIPT_BOPOMOFO },
- { 0x13A2, HB_SCRIPT_CHEROKEE },
- { 0x2CFD, HB_SCRIPT_COPTIC },
- { 0x0482, HB_SCRIPT_CYRILLIC },
- { 0x10401, HB_SCRIPT_DESERET },
- { 0x094D, HB_SCRIPT_DEVANAGARI },
- { 0x1258, HB_SCRIPT_ETHIOPIC },
- { 0x10FC, HB_SCRIPT_GEORGIAN },
- { 0x10341, HB_SCRIPT_GOTHIC },
- { 0x0375, HB_SCRIPT_GREEK },
- { 0x0A83, HB_SCRIPT_GUJARATI },
- { 0x0A3C, HB_SCRIPT_GURMUKHI },
- { 0x3005, HB_SCRIPT_HAN },
- { 0x1100, HB_SCRIPT_HANGUL },
- { 0x05BF, HB_SCRIPT_HEBREW },
- { 0x309F, HB_SCRIPT_HIRAGANA },
- { 0x0CBC, HB_SCRIPT_KANNADA },
- { 0x30FF, HB_SCRIPT_KATAKANA },
- { 0x17DD, HB_SCRIPT_KHMER },
- { 0x0EDD, HB_SCRIPT_LAO },
- { 0x0061, HB_SCRIPT_LATIN },
- { 0x0D3D, HB_SCRIPT_MALAYALAM },
- { 0x1843, HB_SCRIPT_MONGOLIAN },
- { 0x1031, HB_SCRIPT_MYANMAR },
- { 0x169C, HB_SCRIPT_OGHAM },
- { 0x10322, HB_SCRIPT_OLD_ITALIC },
- { 0x0B3C, HB_SCRIPT_ORIYA },
- { 0x16EF, HB_SCRIPT_RUNIC },
- { 0x0DBD, HB_SCRIPT_SINHALA },
- { 0x0711, HB_SCRIPT_SYRIAC },
- { 0x0B82, HB_SCRIPT_TAMIL },
- { 0x0C03, HB_SCRIPT_TELUGU },
- { 0x07B1, HB_SCRIPT_THAANA },
- { 0x0E31, HB_SCRIPT_THAI },
- { 0x0FD4, HB_SCRIPT_TIBETAN },
- { 0x1401, HB_SCRIPT_CANADIAN_SYLLABICS },
- { 0xA015, HB_SCRIPT_YI },
- { 0x1700, HB_SCRIPT_TAGALOG },
- { 0x1720, HB_SCRIPT_HANUNOO },
- { 0x1740, HB_SCRIPT_BUHID },
- { 0x1760, HB_SCRIPT_TAGBANWA },
- /* Unicode-4.0 additions */
- { 0x2800, HB_SCRIPT_BRAILLE },
- { 0x10808, HB_SCRIPT_CYPRIOT },
- { 0x1932, HB_SCRIPT_LIMBU },
- { 0x10480, HB_SCRIPT_OSMANYA },
- { 0x10450, HB_SCRIPT_SHAVIAN },
- { 0x10000, HB_SCRIPT_LINEAR_B },
- { 0x1950, HB_SCRIPT_TAI_LE },
- { 0x1039F, HB_SCRIPT_UGARITIC },
- /* Unicode-4.1 additions */
- { 0x1980, HB_SCRIPT_NEW_TAI_LUE },
- { 0x1A1F, HB_SCRIPT_BUGINESE },
- { 0x2C00, HB_SCRIPT_GLAGOLITIC },
- { 0x2D6F, HB_SCRIPT_TIFINAGH },
- { 0xA800, HB_SCRIPT_SYLOTI_NAGRI },
- { 0x103D0, HB_SCRIPT_OLD_PERSIAN },
- { 0x10A3F, HB_SCRIPT_KHAROSHTHI },
- /* Unicode-5.0 additions */
- { 0x0378, HB_SCRIPT_UNKNOWN },
- { 0x1B04, HB_SCRIPT_BALINESE },
- { 0x12000, HB_SCRIPT_CUNEIFORM },
- { 0x10900, HB_SCRIPT_PHOENICIAN },
- { 0xA840, HB_SCRIPT_PHAGS_PA },
- { 0x07C0, HB_SCRIPT_NKO },
- /* Unicode-5.1 additions */
- { 0xA900, HB_SCRIPT_KAYAH_LI },
- { 0x1C00, HB_SCRIPT_LEPCHA },
- { 0xA930, HB_SCRIPT_REJANG },
- { 0x1B80, HB_SCRIPT_SUNDANESE },
- { 0xA880, HB_SCRIPT_SAURASHTRA },
- { 0xAA00, HB_SCRIPT_CHAM },
- { 0x1C50, HB_SCRIPT_OL_CHIKI },
- { 0xA500, HB_SCRIPT_VAI },
- { 0x102A0, HB_SCRIPT_CARIAN },
- { 0x10280, HB_SCRIPT_LYCIAN },
- { 0x1093F, HB_SCRIPT_LYDIAN },
- { 0x111111, HB_SCRIPT_UNKNOWN }
- };
- static const test_pair_t script_tests_more[] =
- {
- /* Unicode-5.2 additions */
- { 0x10B00, HB_SCRIPT_AVESTAN },
- { 0xA6A0, HB_SCRIPT_BAMUM },
- { 0x1400, HB_SCRIPT_CANADIAN_SYLLABICS },
- { 0x13000, HB_SCRIPT_EGYPTIAN_HIEROGLYPHS },
- { 0x10840, HB_SCRIPT_IMPERIAL_ARAMAIC },
- { 0x1CED, HB_SCRIPT_INHERITED },
- { 0x10B60, HB_SCRIPT_INSCRIPTIONAL_PAHLAVI },
- { 0x10B40, HB_SCRIPT_INSCRIPTIONAL_PARTHIAN },
- { 0xA980, HB_SCRIPT_JAVANESE },
- { 0x11082, HB_SCRIPT_KAITHI },
- { 0xA4D0, HB_SCRIPT_LISU },
- { 0xABE5, HB_SCRIPT_MEETEI_MAYEK },
- { 0x10A60, HB_SCRIPT_OLD_SOUTH_ARABIAN },
- { 0x10C00, HB_SCRIPT_OLD_TURKIC },
- { 0x0800, HB_SCRIPT_SAMARITAN },
- { 0x1A20, HB_SCRIPT_TAI_THAM },
- { 0xAA80, HB_SCRIPT_TAI_VIET },
- /* Unicode-6.0 additions */
- { 0x1BC0, HB_SCRIPT_BATAK },
- { 0x11000, HB_SCRIPT_BRAHMI },
- { 0x0840, HB_SCRIPT_MANDAIC },
- /* Unicode-6.1 additions */
- { 0x10980, HB_SCRIPT_MEROITIC_HIEROGLYPHS },
- { 0x109A0, HB_SCRIPT_MEROITIC_CURSIVE },
- { 0x110D0, HB_SCRIPT_SORA_SOMPENG },
- { 0x11100, HB_SCRIPT_CHAKMA },
- { 0x11180, HB_SCRIPT_SHARADA },
- { 0x11680, HB_SCRIPT_TAKRI },
- { 0x16F00, HB_SCRIPT_MIAO },
- /* Unicode-6.2 additions */
- { 0x20BA, HB_SCRIPT_COMMON },
- /* Unicode-6.3 additions */
- { 0x2066, HB_SCRIPT_COMMON },
- /* Unicode-7.0 additions */
- { 0x10350, HB_SCRIPT_OLD_PERMIC },
- { 0x10500, HB_SCRIPT_ELBASAN },
- { 0x10530, HB_SCRIPT_CAUCASIAN_ALBANIAN },
- { 0x10600, HB_SCRIPT_LINEAR_A },
- { 0x10860, HB_SCRIPT_PALMYRENE },
- { 0x10880, HB_SCRIPT_NABATAEAN },
- { 0x10A80, HB_SCRIPT_OLD_NORTH_ARABIAN },
- { 0x10AC0, HB_SCRIPT_MANICHAEAN },
- { 0x10B80, HB_SCRIPT_PSALTER_PAHLAVI },
- { 0x11150, HB_SCRIPT_MAHAJANI },
- { 0x11200, HB_SCRIPT_KHOJKI },
- { 0x112B0, HB_SCRIPT_KHUDAWADI },
- { 0x11300, HB_SCRIPT_GRANTHA },
- { 0x11480, HB_SCRIPT_TIRHUTA },
- { 0x11580, HB_SCRIPT_SIDDHAM },
- { 0x11600, HB_SCRIPT_MODI },
- { 0x118A0, HB_SCRIPT_WARANG_CITI },
- { 0x11AC0, HB_SCRIPT_PAU_CIN_HAU },
- { 0x16A40, HB_SCRIPT_MRO },
- { 0x16AD0, HB_SCRIPT_BASSA_VAH },
- { 0x16B00, HB_SCRIPT_PAHAWH_HMONG },
- { 0x1BC00, HB_SCRIPT_DUPLOYAN },
- { 0x1E800, HB_SCRIPT_MENDE_KIKAKUI },
- /* Unicode-8.0 additions */
- { 0x108E0, HB_SCRIPT_HATRAN },
- { 0x10C80, HB_SCRIPT_OLD_HUNGARIAN },
- { 0x11280, HB_SCRIPT_MULTANI },
- { 0x11700, HB_SCRIPT_AHOM },
- { 0x14400, HB_SCRIPT_ANATOLIAN_HIEROGLYPHS },
- { 0x1D800, HB_SCRIPT_SIGNWRITING },
- /* Unicode-9.0 additions */
- { 0x104B0, HB_SCRIPT_OSAGE },
- { 0x11400, HB_SCRIPT_NEWA },
- { 0x11C00, HB_SCRIPT_BHAIKSUKI },
- { 0x11C70, HB_SCRIPT_MARCHEN },
- { 0x17000, HB_SCRIPT_TANGUT },
- { 0x1E900, HB_SCRIPT_ADLAM },
- /* Unicode-10.0 additions */
- { 0x11A00, HB_SCRIPT_ZANABAZAR_SQUARE },
- { 0x11A50, HB_SCRIPT_SOYOMBO },
- { 0x11D00, HB_SCRIPT_MASARAM_GONDI },
- { 0x1B170, HB_SCRIPT_NUSHU },
- /* Unicode-11.0 additions */
- { 0x10D00, HB_SCRIPT_HANIFI_ROHINGYA },
- { 0x10F00, HB_SCRIPT_OLD_SOGDIAN },
- { 0x10F30, HB_SCRIPT_SOGDIAN },
- { 0x11800, HB_SCRIPT_DOGRA },
- { 0x11D60, HB_SCRIPT_GUNJALA_GONDI },
- { 0x11EE0, HB_SCRIPT_MAKASAR },
- { 0x16E40, HB_SCRIPT_MEDEFAIDRIN },
- /* Unicode-12.0 additions */
- { 0x10FE0, HB_SCRIPT_ELYMAIC },
- { 0x119A0, HB_SCRIPT_NANDINAGARI },
- { 0x1E100, HB_SCRIPT_NYIAKENG_PUACHUE_HMONG },
- { 0x1E2C0, HB_SCRIPT_WANCHO },
- /* Unicode-12.1 additions */
- { 0x32FF, HB_SCRIPT_COMMON },
- /* Unicode-13.0 additions */
- { 0x10E80, HB_SCRIPT_YEZIDI },
- { 0x10FB0, HB_SCRIPT_CHORASMIAN },
- { 0x11900, HB_SCRIPT_DIVES_AKURU },
- { 0x18B00, HB_SCRIPT_KHITAN_SMALL_SCRIPT },
- /* Unicode-14.0 additions */
- { 0x10570, HB_SCRIPT_VITHKUQI },
- { 0x10F70, HB_SCRIPT_OLD_UYGHUR },
- { 0x12F90, HB_SCRIPT_CYPRO_MINOAN },
- { 0x16A70, HB_SCRIPT_TANGSA },
- { 0x1E290, HB_SCRIPT_TOTO },
- /* Unicode-15.0 additions */
- { 0x11F00, HB_SCRIPT_KAWI },
- { 0x1E4D0, HB_SCRIPT_NAG_MUNDARI },
- /* Unicode-16.0 additions */
- { 0x105C0, HB_SCRIPT_TODHRI },
- { 0x10D40, HB_SCRIPT_GARAY },
- { 0x11380, HB_SCRIPT_TULU_TIGALARI },
- { 0x11BC0, HB_SCRIPT_SUNUWAR },
- { 0x16100, HB_SCRIPT_GURUNG_KHEMA },
- { 0x16D40, HB_SCRIPT_KIRAT_RAI },
- { 0x1E5D0, HB_SCRIPT_OL_ONAL },
- { 0x111111, HB_SCRIPT_UNKNOWN }
- };
- typedef unsigned int (*get_func_t) (hb_unicode_funcs_t *ufuncs,
- hb_codepoint_t unicode,
- void *user_data);
- typedef unsigned int (*func_setter_func_t) (hb_unicode_funcs_t *ufuncs,
- get_func_t func,
- void *user_data,
- hb_destroy_func_t destroy);
- typedef unsigned int (*getter_func_t) (hb_unicode_funcs_t *ufuncs,
- hb_codepoint_t unicode);
- typedef struct {
- const char *name;
- func_setter_func_t func_setter;
- getter_func_t getter;
- const test_pair_t *tests;
- unsigned int num_tests;
- const test_pair_t *tests_more;
- unsigned int num_tests_more;
- unsigned int default_value;
- } property_t;
- #define RETURNS_UNICODE_ITSELF ((unsigned int) -1)
- #define PROPERTY(name, DEFAULT) \
- { \
- #name, \
- (func_setter_func_t) hb_unicode_funcs_set_##name##_func, \
- (getter_func_t) hb_unicode_##name, \
- name##_tests, \
- G_N_ELEMENTS (name##_tests), \
- name##_tests_more, \
- G_N_ELEMENTS (name##_tests_more), \
- DEFAULT \
- }
- #pragma GCC diagnostic push
- #pragma GCC diagnostic ignored "-Wcast-function-type"
- static const property_t properties[] =
- {
- PROPERTY (combining_class, 0),
- PROPERTY (general_category, (unsigned int) HB_UNICODE_GENERAL_CATEGORY_OTHER_LETTER),
- PROPERTY (mirroring, RETURNS_UNICODE_ITSELF),
- PROPERTY (script, (unsigned int) HB_SCRIPT_UNKNOWN)
- };
- #pragma GCC diagnostic pop
- #undef PROPERTY
- static void
- test_unicode_properties (gconstpointer user_data, hb_bool_t lenient)
- {
- hb_unicode_funcs_t *uf = (hb_unicode_funcs_t *) user_data;
- unsigned int i, j;
- gboolean failed = TRUE;
- g_assert (hb_unicode_funcs_is_immutable (uf));
- g_assert (hb_unicode_funcs_get_parent (uf));
- for (i = 0; i < G_N_ELEMENTS (properties); i++) {
- const property_t *p = &properties[i];
- const test_pair_t *tests;
- g_test_message ("Testing property %s", p->name);
- tests = p->tests;
- for (j = 0; j < p->num_tests; j++) {
- g_test_message ("Test %s #%d: U+%04X", p->name, j, tests[j].unicode);
- g_assert_cmphex (p->getter (uf, tests[j].unicode), ==, tests[j].value);
- }
- /* These tests are from Unicode 5.2 onward and older glib/ICU
- * don't get them right. Just warn instead of assert. */
- tests = p->tests_more;
- for (j = 0; j < p->num_tests_more; j++) {
- g_test_message ("Test %s more #%d: U+%04X", p->name, j, tests[j].unicode);
- if (lenient) {
- if (p->getter (uf, tests[j].unicode) != tests[j].value) {
- g_test_message ("Soft fail: Received %x, expected %x", p->getter (uf, tests[j].unicode), tests[j].value);
- failed = TRUE;
- }
- }
- else
- g_assert_cmphex (p->getter (uf, tests[j].unicode), ==, tests[j].value);
- }
- }
- if (failed)
- g_test_message ("Some property tests failed. You probably have an old version of one of the libraries used.");
- }
- static void
- test_unicode_properties_lenient (gconstpointer user_data)
- {
- test_unicode_properties (user_data, TRUE);
- }
- static void
- test_unicode_properties_strict (gconstpointer user_data)
- {
- test_unicode_properties (user_data, FALSE);
- }
- static hb_codepoint_t
- default_value (hb_codepoint_t _default_value, hb_codepoint_t unicode)
- {
- return _default_value == RETURNS_UNICODE_ITSELF ? unicode : _default_value;
- }
- static void
- _test_unicode_properties_nil (hb_unicode_funcs_t *uf)
- {
- unsigned int i, j;
- for (i = 0; i < G_N_ELEMENTS (properties); i++) {
- const property_t *p = &properties[i];
- const test_pair_t *tests;
- g_test_message ("Testing property %s", p->name);
- tests = p->tests;
- for (j = 0; j < p->num_tests; j++) {
- g_test_message ("Test %s #%d: U+%04X", p->name, j, tests[j].unicode);
- g_assert_cmphex (p->getter (uf, tests[j].unicode), ==, default_value (p->default_value, tests[j].unicode));
- }
- tests = p->tests_more;
- for (j = 0; j < p->num_tests_more; j++) {
- g_test_message ("Test %s more #%d: U+%04X", p->name, j, tests[j].unicode);
- g_assert_cmphex (p->getter (uf, tests[j].unicode), ==, default_value (p->default_value, tests[j].unicode));
- }
- }
- }
- static void
- test_unicode_properties_nil (void)
- {
- hb_unicode_funcs_t *uf = hb_unicode_funcs_create (NULL);
- g_assert (!hb_unicode_funcs_is_immutable (uf));
- _test_unicode_properties_nil (uf);
- hb_unicode_funcs_destroy (uf);
- }
- static void
- test_unicode_properties_empty (void)
- {
- hb_unicode_funcs_t *uf = hb_unicode_funcs_get_empty ();
- g_assert (uf);
- g_assert (hb_unicode_funcs_is_immutable (uf));
- _test_unicode_properties_nil (uf);
- }
- static void
- test_unicode_chainup (void)
- {
- hb_unicode_funcs_t *uf, *uf2;
- /* Chain-up to nil */
- uf = hb_unicode_funcs_create (NULL);
- g_assert (!hb_unicode_funcs_is_immutable (uf));
- uf2 = hb_unicode_funcs_create (uf);
- g_assert (hb_unicode_funcs_is_immutable (uf));
- hb_unicode_funcs_destroy (uf);
- g_assert (!hb_unicode_funcs_is_immutable (uf2));
- _test_unicode_properties_nil (uf2);
- hb_unicode_funcs_destroy (uf2);
- /* Chain-up to default */
- uf = hb_unicode_funcs_create (hb_unicode_funcs_get_default ());
- g_assert (!hb_unicode_funcs_is_immutable (uf));
- uf2 = hb_unicode_funcs_create (uf);
- g_assert (hb_unicode_funcs_is_immutable (uf));
- hb_unicode_funcs_destroy (uf);
- g_assert (!hb_unicode_funcs_is_immutable (uf2));
- hb_unicode_funcs_make_immutable (uf2);
- test_unicode_properties_strict (uf2);
- hb_unicode_funcs_destroy (uf2);
- }
- static void
- test_unicode_setters (void)
- {
- hb_unicode_funcs_t *uf;
- unsigned int i;
- /* This is cruel: we use script-returning functions to test all properties,
- * but it works. */
- for (i = 0; i < G_N_ELEMENTS (properties); i++) {
- const property_t *p = &properties[i];
- data_t data[2] = {{MAGIC0, FALSE}, {MAGIC1, FALSE}};
- g_test_message ("Testing property %s", p->name);
- uf = hb_unicode_funcs_create (NULL);
- g_assert (!hb_unicode_funcs_is_immutable (uf));
- p->func_setter (uf, (get_func_t) simple_get_script, &data[0], free_up);
- g_assert_cmphex (p->getter (uf, 'a'), ==, HB_SCRIPT_LATIN);
- g_assert_cmphex (p->getter (uf, '0'), ==, HB_SCRIPT_UNKNOWN);
- p->func_setter (uf, (get_func_t) NULL, NULL, NULL);
- g_assert (data[0].freed && !data[1].freed);
- g_assert (!hb_unicode_funcs_is_immutable (uf));
- hb_unicode_funcs_make_immutable (uf);
- g_assert (hb_unicode_funcs_is_immutable (uf));
- /* Since uf is immutable now, the following setter should do nothing. */
- p->func_setter (uf, (get_func_t) a_is_for_arabic_get_script, &data[1], free_up);
- g_assert (data[0].freed && data[1].freed);
- hb_unicode_funcs_destroy (uf);
- g_assert (data[0].freed && data[1].freed);
- }
- }
- typedef struct {
- data_t data[2];
- } data_fixture_t;
- static void
- data_fixture_init (data_fixture_t *f, gconstpointer user_data HB_UNUSED)
- {
- f->data[0].value = MAGIC0;
- f->data[1].value = MAGIC1;
- }
- static void
- data_fixture_finish (data_fixture_t *f HB_UNUSED, gconstpointer user_data HB_UNUSED)
- {
- }
- static void
- test_unicode_subclassing_nil (data_fixture_t *f, gconstpointer user_data HB_UNUSED)
- {
- hb_unicode_funcs_t *uf, *aa;
- uf = hb_unicode_funcs_create (NULL);
- aa = hb_unicode_funcs_create (uf);
- hb_unicode_funcs_destroy (uf);
- hb_unicode_funcs_set_script_func (aa, a_is_for_arabic_get_script,
- &f->data[1], free_up);
- g_assert_cmphex (hb_unicode_script (aa, 'a'), ==, HB_SCRIPT_ARABIC);
- g_assert_cmphex (hb_unicode_script (aa, 'b'), ==, HB_SCRIPT_UNKNOWN);
- g_assert (!f->data[0].freed && !f->data[1].freed);
- hb_unicode_funcs_destroy (aa);
- g_assert (!f->data[0].freed && f->data[1].freed);
- }
- static void
- test_unicode_subclassing_default (data_fixture_t *f, gconstpointer user_data HB_UNUSED)
- {
- hb_unicode_funcs_t *uf, *aa;
- uf = hb_unicode_funcs_get_default ();
- aa = hb_unicode_funcs_create (uf);
- hb_unicode_funcs_set_script_func (aa, a_is_for_arabic_get_script,
- &f->data[1], free_up);
- g_assert_cmphex (hb_unicode_script (aa, 'a'), ==, HB_SCRIPT_ARABIC);
- g_assert_cmphex (hb_unicode_script (aa, 'b'), ==, HB_SCRIPT_LATIN);
- g_assert (!f->data[0].freed && !f->data[1].freed);
- hb_unicode_funcs_destroy (aa);
- g_assert (!f->data[0].freed && f->data[1].freed);
- }
- static void
- test_unicode_subclassing_deep (data_fixture_t *f, gconstpointer user_data HB_UNUSED)
- {
- hb_unicode_funcs_t *uf, *aa;
- uf = hb_unicode_funcs_create (NULL);
- hb_unicode_funcs_set_script_func (uf, simple_get_script,
- &f->data[0], free_up);
- aa = hb_unicode_funcs_create (uf);
- hb_unicode_funcs_destroy (uf);
- /* make sure the 'uf' didn't get freed, since 'aa' holds a ref */
- g_assert (!f->data[0].freed);
- hb_unicode_funcs_set_script_func (aa, a_is_for_arabic_get_script,
- &f->data[1], free_up);
- g_assert_cmphex (hb_unicode_script (aa, 'a'), ==, HB_SCRIPT_ARABIC);
- g_assert_cmphex (hb_unicode_script (aa, 'b'), ==, HB_SCRIPT_LATIN);
- g_assert_cmphex (hb_unicode_script (aa, '0'), ==, HB_SCRIPT_UNKNOWN);
- g_assert (!f->data[0].freed && !f->data[1].freed);
- hb_unicode_funcs_destroy (aa);
- g_assert (f->data[0].freed && f->data[1].freed);
- }
- static hb_script_t
- script_roundtrip_default (hb_script_t script)
- {
- return hb_script_from_iso15924_tag (hb_script_to_iso15924_tag (script));
- }
- #ifdef HAVE_GLIB
- static hb_script_t
- script_roundtrip_glib (hb_script_t script)
- {
- return hb_glib_script_to_script (hb_glib_script_from_script (script));
- }
- #endif
- #ifdef HAVE_ICU
- static hb_script_t
- script_roundtrip_icu (hb_script_t script)
- {
- return hb_icu_script_to_script (hb_icu_script_from_script (script));
- }
- #endif
- static void
- test_unicode_script_roundtrip (gconstpointer user_data)
- {
- typedef hb_script_t (*roundtrip_func_t) (hb_script_t);
- roundtrip_func_t roundtrip_func = (roundtrip_func_t) user_data;
- unsigned int i;
- gboolean failed = FALSE;
- for (i = 0; i < G_N_ELEMENTS (script_tests); i++) {
- const test_pair_t *test = &script_tests[i];
- hb_script_t script = test->value;
- g_test_message ("Test script roundtrip #%d: %x", i, script);
- g_assert_cmphex (script, ==, roundtrip_func (script));
- }
- for (i = 0; i < G_N_ELEMENTS (script_tests_more); i++) {
- const test_pair_t *test = &script_tests_more[i];
- hb_script_t script = test->value;
- g_test_message ("Test script roundtrip more #%d: %x", i, script);
- if (script != roundtrip_func (script)) {
- g_test_message ("Soft fail: Received %x, expected %x", roundtrip_func (script), script);
- failed = TRUE;
- }
- }
- g_assert_cmphex (HB_SCRIPT_INVALID, ==, roundtrip_func (HB_SCRIPT_INVALID));
- if (failed)
- g_test_message ("Some script roundtrip tests failed. You probably have an old version of one of the libraries used.");
- }
- static void
- test_unicode_normalization (gconstpointer user_data)
- {
- hb_unicode_funcs_t *uf = (hb_unicode_funcs_t *) user_data;
- gunichar a, b, ab;
- /* Test compose() */
- /* Not composable */
- g_assert (!hb_unicode_compose (uf, 0x0041, 0x0042, &ab) && ab == 0);
- g_assert (!hb_unicode_compose (uf, 0x0041, 0, &ab) && ab == 0);
- g_assert (!hb_unicode_compose (uf, 0x0066, 0x0069, &ab) && ab == 0);
- /* Singletons should not compose */
- g_assert (!hb_unicode_compose (uf, 0x212B, 0, &ab) && ab == 0);
- g_assert (!hb_unicode_compose (uf, 0x00C5, 0, &ab) && ab == 0);
- g_assert (!hb_unicode_compose (uf, 0x2126, 0, &ab) && ab == 0);
- g_assert (!hb_unicode_compose (uf, 0x03A9, 0, &ab) && ab == 0);
- /* Non-starter pairs should not compose */
- g_assert (!hb_unicode_compose (uf, 0x0308, 0x0301, &ab) && ab == 0); /* !0x0344 */
- g_assert (!hb_unicode_compose (uf, 0x0F71, 0x0F72, &ab) && ab == 0); /* !0x0F73 */
- /* Pairs */
- g_assert (hb_unicode_compose (uf, 0x0041, 0x030A, &ab) && ab == 0x00C5);
- g_assert (hb_unicode_compose (uf, 0x006F, 0x0302, &ab) && ab == 0x00F4);
- g_assert (hb_unicode_compose (uf, 0x1E63, 0x0307, &ab) && ab == 0x1E69);
- g_assert (hb_unicode_compose (uf, 0x0073, 0x0323, &ab) && ab == 0x1E63);
- g_assert (hb_unicode_compose (uf, 0x0064, 0x0307, &ab) && ab == 0x1E0B);
- g_assert (hb_unicode_compose (uf, 0x0064, 0x0323, &ab) && ab == 0x1E0D);
- /* Hangul */
- g_assert (hb_unicode_compose (uf, 0xD4CC, 0x11B6, &ab) && ab == 0xD4DB);
- g_assert (hb_unicode_compose (uf, 0x1111, 0x1171, &ab) && ab == 0xD4CC);
- g_assert (hb_unicode_compose (uf, 0xCE20, 0x11B8, &ab) && ab == 0xCE31);
- g_assert (hb_unicode_compose (uf, 0x110E, 0x1173, &ab) && ab == 0xCE20);
- g_assert (!hb_unicode_compose (uf, 0xAC00, 0x11A7, &ab));
- g_assert (hb_unicode_compose (uf, 0xAC00, 0x11A8, &ab) && ab == 0xAC01);
- g_assert (!hb_unicode_compose (uf, 0xAC01, 0x11A8, &ab));
- /* Test decompose() */
- /* Not decomposable */
- g_assert (!hb_unicode_decompose (uf, 0x0041, &a, &b) && a == 0x0041 && b == 0);
- g_assert (!hb_unicode_decompose (uf, 0xFB01, &a, &b) && a == 0xFB01 && b == 0);
- g_assert (!hb_unicode_decompose (uf, 0x1F1EF, &a, &b) && a == 0x1F1EF && b == 0);
- /* Singletons */
- g_assert (hb_unicode_decompose (uf, 0x212B, &a, &b) && a == 0x00C5 && b == 0);
- g_assert (hb_unicode_decompose (uf, 0x2126, &a, &b) && a == 0x03A9 && b == 0);
- /* Non-starter pairs decompose, but not compose */
- g_assert (hb_unicode_decompose (uf, 0x0344, &a, &b) && a == 0x0308 && b == 0x0301);
- g_assert (hb_unicode_decompose (uf, 0x0F73, &a, &b) && a == 0x0F71 && b == 0x0F72);
- /* Pairs */
- g_assert (hb_unicode_decompose (uf, 0x00C5, &a, &b) && a == 0x0041 && b == 0x030A);
- g_assert (hb_unicode_decompose (uf, 0x00F4, &a, &b) && a == 0x006F && b == 0x0302);
- g_assert (hb_unicode_decompose (uf, 0x1E69, &a, &b) && a == 0x1E63 && b == 0x0307);
- g_assert (hb_unicode_decompose (uf, 0x1E63, &a, &b) && a == 0x0073 && b == 0x0323);
- g_assert (hb_unicode_decompose (uf, 0x1E0B, &a, &b) && a == 0x0064 && b == 0x0307);
- g_assert (hb_unicode_decompose (uf, 0x1E0D, &a, &b) && a == 0x0064 && b == 0x0323);
- /* Hangul */
- g_assert (hb_unicode_decompose (uf, 0xD4DB, &a, &b) && a == 0xD4CC && b == 0x11B6);
- g_assert (hb_unicode_decompose (uf, 0xD4CC, &a, &b) && a == 0x1111 && b == 0x1171);
- g_assert (hb_unicode_decompose (uf, 0xCE31, &a, &b) && a == 0xCE20 && b == 0x11B8);
- g_assert (hb_unicode_decompose (uf, 0xCE20, &a, &b) && a == 0x110E && b == 0x1173);
- }
- int
- main (int argc, char **argv)
- {
- hb_test_init (&argc, &argv);
- hb_test_add (test_unicode_properties_nil);
- hb_test_add (test_unicode_properties_empty);
- hb_test_add_data_flavor (hb_unicode_funcs_get_default (), "default", test_unicode_properties_strict);
- hb_test_add_data_flavor (hb_unicode_funcs_get_default (), "default", test_unicode_normalization);
- hb_test_add_data_flavor ((gconstpointer) script_roundtrip_default, "default", test_unicode_script_roundtrip);
- #ifdef HAVE_GLIB
- hb_test_add_data_flavor (hb_glib_get_unicode_funcs (), "glib", test_unicode_properties_lenient);
- hb_test_add_data_flavor (hb_glib_get_unicode_funcs (), "glib", test_unicode_normalization);
- hb_test_add_data_flavor ((gconstpointer) script_roundtrip_glib, "glib", test_unicode_script_roundtrip);
- #endif
- #ifdef HAVE_ICU
- hb_test_add_data_flavor (hb_icu_get_unicode_funcs (), "icu", test_unicode_properties_lenient);
- hb_test_add_data_flavor (hb_icu_get_unicode_funcs (), "icu", test_unicode_normalization);
- hb_test_add_data_flavor ((gconstpointer) script_roundtrip_icu, "icu", test_unicode_script_roundtrip);
- #endif
- hb_test_add (test_unicode_chainup);
- hb_test_add (test_unicode_setters);
- hb_test_add_fixture (data_fixture, NULL, test_unicode_subclassing_nil);
- hb_test_add_fixture (data_fixture, NULL, test_unicode_subclassing_default);
- hb_test_add_fixture (data_fixture, NULL, test_unicode_subclassing_deep);
- return hb_test_run ();
- }
|