Ignore:
Timestamp:
Sep 7, 2016, 11:56:08 AM (3 years ago)
Author:
cameron
Message:

Updates for Unicode 9.0

File:
1 edited

Legend:

Unmodified
Added
Removed
  • icGREP/icgrep-devel/icgrep/UCD/PropertyValueAliases.h

    r4742 r5145  
    22#define PROPERTYVALUEALIASES_H
    33/*
    4  *  Copyright (c) 2015 International Characters, Inc.
     4 *  Copyright (c) 2016 International Characters, Inc.
    55 *  This software is licensed to the public under the Open Software License 3.0.
    66 *  icgrep is a trademark of International Characters, Inc.
     
    5050    namespace SCX_ns {
    5151        enum value_t {
    52             Aghb, Ahom, Arab, Armi, Armn, Avst, Bali, Bamu, Bass, Batk,
    53             Beng, Bopo, Brah, Brai, Bugi, Buhd, Cakm, Cans, Cari, Cham,
    54             Cher, Copt, Cprt, Cyrl, Deva, Dsrt, Dupl, Egyp, Elba, Ethi,
    55             Geor, Glag, Goth, Gran, Grek, Gujr, Guru, Hang, Hani, Hano,
    56             Hatr, Hebr, Hira, Hluw, Hmng, Hrkt, Hung, Ital, Java, Kali,
    57             Kana, Khar, Khmr, Khoj, Knda, Kthi, Lana, Laoo, Latn, Lepc,
    58             Limb, Lina, Linb, Lisu, Lyci, Lydi, Mahj, Mand, Mani, Mend,
    59             Merc, Mero, Mlym, Modi, Mong, Mroo, Mtei, Mult, Mymr, Narb,
    60             Nbat, Nkoo, Ogam, Olck, Orkh, Orya, Osma, Palm, Pauc, Perm,
    61             Phag, Phli, Phlp, Phnx, Plrd, Prti, Rjng, Runr, Samr, Sarb,
    62             Saur, Sgnw, Shaw, Shrd, Sidd, Sind, Sinh, Sora, Sund, Sylo,
    63             Syrc, Tagb, Takr, Tale, Talu, Taml, Tavt, Telu, Tfng, Tglg,
    64             Thaa, Thai, Tibt, Tirh, Ugar, Vaii, Wara, Xpeo, Xsux, Yiii,
    65             Zinh, Zyyy, Zzzz};
    66         const static std::vector<std::string> enum_names = {
    67             "Aghb", "Ahom", "Arab", "Armi", "Armn", "Avst", "Bali", "Bamu",
    68             "Bass", "Batk", "Beng", "Bopo", "Brah", "Brai", "Bugi", "Buhd",
    69             "Cakm", "Cans", "Cari", "Cham", "Cher", "Copt", "Cprt", "Cyrl",
    70             "Deva", "Dsrt", "Dupl", "Egyp", "Elba", "Ethi", "Geor", "Glag",
    71             "Goth", "Gran", "Grek", "Gujr", "Guru", "Hang", "Hani", "Hano",
    72             "Hatr", "Hebr", "Hira", "Hluw", "Hmng", "Hrkt", "Hung", "Ital",
    73             "Java", "Kali", "Kana", "Khar", "Khmr", "Khoj", "Knda", "Kthi",
    74             "Lana", "Laoo", "Latn", "Lepc", "Limb", "Lina", "Linb", "Lisu",
    75             "Lyci", "Lydi", "Mahj", "Mand", "Mani", "Mend", "Merc", "Mero",
    76             "Mlym", "Modi", "Mong", "Mroo", "Mtei", "Mult", "Mymr", "Narb",
    77             "Nbat", "Nkoo", "Ogam", "Olck", "Orkh", "Orya", "Osma", "Palm",
    78             "Pauc", "Perm", "Phag", "Phli", "Phlp", "Phnx", "Plrd", "Prti",
    79             "Rjng", "Runr", "Samr", "Sarb", "Saur", "Sgnw", "Shaw", "Shrd",
    80             "Sidd", "Sind", "Sinh", "Sora", "Sund", "Sylo", "Syrc", "Tagb",
    81             "Takr", "Tale", "Talu", "Taml", "Tavt", "Telu", "Tfng", "Tglg",
    82             "Thaa", "Thai", "Tibt", "Tirh", "Ugar", "Vaii", "Wara", "Xpeo",
    83             "Xsux", "Yiii", "Zinh", "Zyyy", "Zzzz"};
    84         const static std::vector<std::string> value_names = {
    85             "Caucasian_Albanian", "Ahom", "Arabic", "Imperial_Aramaic",
    86             "Armenian", "Avestan", "Balinese", "Bamum", "Bassa_Vah",
    87             "Batak", "Bengali", "Bopomofo", "Brahmi", "Braille", "Buginese",
    88             "Buhid", "Chakma", "Canadian_Aboriginal", "Carian", "Cham",
    89             "Cherokee", "Coptic", "Cypriot", "Cyrillic", "Devanagari",
    90             "Deseret", "Duployan", "Egyptian_Hieroglyphs", "Elbasan",
    91             "Ethiopic", "Georgian", "Glagolitic", "Gothic", "Grantha",
    92             "Greek", "Gujarati", "Gurmukhi", "Hangul", "Han", "Hanunoo",
    93             "Hatran", "Hebrew", "Hiragana", "Anatolian_Hieroglyphs",
    94             "Pahawh_Hmong", "Katakana_Or_Hiragana", "Old_Hungarian",
    95             "Old_Italic", "Javanese", "Kayah_Li", "Katakana", "Kharoshthi",
    96             "Khmer", "Khojki", "Kannada", "Kaithi", "Tai_Tham", "Lao",
    97             "Latin", "Lepcha", "Limbu", "Linear_A", "Linear_B", "Lisu",
    98             "Lycian", "Lydian", "Mahajani", "Mandaic", "Manichaean",
     52            Adlm, Aghb, Ahom, Arab, Armi, Armn, Avst, Bali, Bamu, Bass,
     53            Batk, Beng, Bhks, Bopo, Brah, Brai, Bugi, Buhd, Cakm, Cans,
     54            Cari, Cham, Cher, Copt, Cprt, Cyrl, Deva, Dsrt, Dupl, Egyp,
     55            Elba, Ethi, Geor, Glag, Goth, Gran, Grek, Gujr, Guru, Hang,
     56            Hani, Hano, Hatr, Hebr, Hira, Hluw, Hmng, Hrkt, Hung, Ital,
     57            Java, Kali, Kana, Khar, Khmr, Khoj, Knda, Kthi, Lana, Laoo,
     58            Latn, Lepc, Limb, Lina, Linb, Lisu, Lyci, Lydi, Mahj, Mand,
     59            Mani, Marc, Mend, Merc, Mero, Mlym, Modi, Mong, Mroo, Mtei,
     60            Mult, Mymr, Narb, Nbat, Newa, Nkoo, Ogam, Olck, Orkh, Orya,
     61            Osge, Osma, Palm, Pauc, Perm, Phag, Phli, Phlp, Phnx, Plrd,
     62            Prti, Rjng, Runr, Samr, Sarb, Saur, Sgnw, Shaw, Shrd, Sidd,
     63            Sind, Sinh, Sora, Sund, Sylo, Syrc, Tagb, Takr, Tale, Talu,
     64            Taml, Tang, Tavt, Telu, Tfng, Tglg, Thaa, Thai, Tibt, Tirh,
     65            Ugar, Vaii, Wara, Xpeo, Xsux, Yiii, Zinh, Zyyy, Zzzz};
     66        const static std::vector<std::string> enum_names = {
     67            "Adlm", "Aghb", "Ahom", "Arab", "Armi", "Armn", "Avst", "Bali",
     68            "Bamu", "Bass", "Batk", "Beng", "Bhks", "Bopo", "Brah", "Brai",
     69            "Bugi", "Buhd", "Cakm", "Cans", "Cari", "Cham", "Cher", "Copt",
     70            "Cprt", "Cyrl", "Deva", "Dsrt", "Dupl", "Egyp", "Elba", "Ethi",
     71            "Geor", "Glag", "Goth", "Gran", "Grek", "Gujr", "Guru", "Hang",
     72            "Hani", "Hano", "Hatr", "Hebr", "Hira", "Hluw", "Hmng", "Hrkt",
     73            "Hung", "Ital", "Java", "Kali", "Kana", "Khar", "Khmr", "Khoj",
     74            "Knda", "Kthi", "Lana", "Laoo", "Latn", "Lepc", "Limb", "Lina",
     75            "Linb", "Lisu", "Lyci", "Lydi", "Mahj", "Mand", "Mani", "Marc",
     76            "Mend", "Merc", "Mero", "Mlym", "Modi", "Mong", "Mroo", "Mtei",
     77            "Mult", "Mymr", "Narb", "Nbat", "Newa", "Nkoo", "Ogam", "Olck",
     78            "Orkh", "Orya", "Osge", "Osma", "Palm", "Pauc", "Perm", "Phag",
     79            "Phli", "Phlp", "Phnx", "Plrd", "Prti", "Rjng", "Runr", "Samr",
     80            "Sarb", "Saur", "Sgnw", "Shaw", "Shrd", "Sidd", "Sind", "Sinh",
     81            "Sora", "Sund", "Sylo", "Syrc", "Tagb", "Takr", "Tale", "Talu",
     82            "Taml", "Tang", "Tavt", "Telu", "Tfng", "Tglg", "Thaa", "Thai",
     83            "Tibt", "Tirh", "Ugar", "Vaii", "Wara", "Xpeo", "Xsux", "Yiii",
     84            "Zinh", "Zyyy", "Zzzz"};
     85        const static std::vector<std::string> value_names = {
     86            "Adlam", "Caucasian_Albanian", "Ahom", "Arabic",
     87            "Imperial_Aramaic", "Armenian", "Avestan", "Balinese", "Bamum",
     88            "Bassa_Vah", "Batak", "Bengali", "Bhaiksuki", "Bopomofo",
     89            "Brahmi", "Braille", "Buginese", "Buhid", "Chakma",
     90            "Canadian_Aboriginal", "Carian", "Cham", "Cherokee", "Coptic",
     91            "Cypriot", "Cyrillic", "Devanagari", "Deseret", "Duployan",
     92            "Egyptian_Hieroglyphs", "Elbasan", "Ethiopic", "Georgian",
     93            "Glagolitic", "Gothic", "Grantha", "Greek", "Gujarati",
     94            "Gurmukhi", "Hangul", "Han", "Hanunoo", "Hatran", "Hebrew",
     95            "Hiragana", "Anatolian_Hieroglyphs", "Pahawh_Hmong",
     96            "Katakana_Or_Hiragana", "Old_Hungarian", "Old_Italic",
     97            "Javanese", "Kayah_Li", "Katakana", "Kharoshthi", "Khmer",
     98            "Khojki", "Kannada", "Kaithi", "Tai_Tham", "Lao", "Latin",
     99            "Lepcha", "Limbu", "Linear_A", "Linear_B", "Lisu", "Lycian",
     100            "Lydian", "Mahajani", "Mandaic", "Manichaean", "Marchen",
    99101            "Mende_Kikakui", "Meroitic_Cursive", "Meroitic_Hieroglyphs",
    100102            "Malayalam", "Modi", "Mongolian", "Mro", "Meetei_Mayek",
    101             "Multani", "Myanmar", "Old_North_Arabian", "Nabataean", "Nko",
    102             "Ogham", "Ol_Chiki", "Old_Turkic", "Oriya", "Osmanya",
    103             "Palmyrene", "Pau_Cin_Hau", "Old_Permic", "Phags_Pa",
     103            "Multani", "Myanmar", "Old_North_Arabian", "Nabataean", "Newa",
     104            "Nko", "Ogham", "Ol_Chiki", "Old_Turkic", "Oriya", "Osage",
     105            "Osmanya", "Palmyrene", "Pau_Cin_Hau", "Old_Permic", "Phags_Pa",
    104106            "Inscriptional_Pahlavi", "Psalter_Pahlavi", "Phoenician",
    105107            "Miao", "Inscriptional_Parthian", "Rejang", "Runic",
     
    107109            "Shavian", "Sharada", "Siddham", "Khudawadi", "Sinhala",
    108110            "Sora_Sompeng", "Sundanese", "Syloti_Nagri", "Syriac",
    109             "Tagbanwa", "Takri", "Tai_Le", "New_Tai_Lue", "Tamil",
     111            "Tagbanwa", "Takri", "Tai_Le", "New_Tai_Lue", "Tamil", "Tangut",
    110112            "Tai_Viet", "Telugu", "Tifinagh", "Tagalog", "Thaana", "Thai",
    111113            "Tibetan", "Tirhuta", "Ugaritic", "Vai", "Warang_Citi",
     
    119121        enum value_t {
    120122            V1_1, V2_0, V2_1, V3_0, V3_1, V3_2, V4_0, V4_1, V5_0, V5_1,
    121             V5_2, V6_0, V6_1, V6_2, V6_3, V7_0, V8_0, Unassigned};
     123            V5_2, V6_0, V6_1, V6_2, V6_3, V7_0, V8_0, V9_0, Unassigned};
    122124        const static std::vector<std::string> enum_names = {
    123125            "V1_1", "V2_0", "V2_1", "V3_0", "V3_1", "V3_2", "V4_0", "V4_1",
    124126            "V5_0", "V5_1", "V5_2", "V6_0", "V6_1", "V6_2", "V6_3", "V7_0",
    125             "V8_0", "Unassigned"};
     127            "V8_0", "V9_0", "Unassigned"};
    126128        const static std::vector<std::string> value_names = {
    127129            "V1_1", "V2_0", "V2_1", "V3_0", "V3_1", "V3_2", "V4_0", "V4_1",
    128130            "V5_0", "V5_1", "V5_2", "V6_0", "V6_1", "V6_2", "V6_3", "V7_0",
    129             "V8_0", "Unassigned"};
     131            "V8_0", "V9_0", "Unassigned"};
    130132        static std::unordered_map<std::string, int> aliases_only_map {{
    131133            {"1.1", AGE_ns::V1_1}, {"2.0", AGE_ns::V2_0},
     
    137139            {"6.1", AGE_ns::V6_1}, {"6.2", AGE_ns::V6_2},
    138140            {"6.3", AGE_ns::V6_3}, {"7.0", AGE_ns::V7_0},
    139             {"8.0", AGE_ns::V8_0}, {"na", AGE_ns::Unassigned}}};
     141            {"8.0", AGE_ns::V8_0}, {"9.0", AGE_ns::V9_0},
     142            {"na", AGE_ns::Unassigned}}};
    140143    }
    141144
    142145    namespace BLK_ns {
    143146        enum value_t {
    144             Aegean_Numbers, Ahom, Alchemical, Alphabetic_PF,
     147            Adlam, Aegean_Numbers, Ahom, Alchemical, Alphabetic_PF,
    145148            Anatolian_Hieroglyphs, Ancient_Greek_Music,
    146149            Ancient_Greek_Numbers, Ancient_Symbols, Arabic, Arabic_Ext_A,
    147150            Arabic_Math, Arabic_PF_A, Arabic_PF_B, Arabic_Sup, Armenian,
    148151            Arrows, ASCII, Avestan, Balinese, Bamum, Bamum_Sup, Bassa_Vah,
    149             Batak, Bengali, Block_Elements, Bopomofo, Bopomofo_Ext,
    150             Box_Drawing, Brahmi, Braille, Buginese, Buhid, Byzantine_Music,
    151             Carian, Caucasian_Albanian, Chakma, Cham, Cherokee,
    152             Cherokee_Sup, CJK, CJK_Compat, CJK_Compat_Forms,
     152            Batak, Bengali, Bhaiksuki, Block_Elements, Bopomofo,
     153            Bopomofo_Ext, Box_Drawing, Brahmi, Braille, Buginese, Buhid,
     154            Byzantine_Music, Carian, Caucasian_Albanian, Chakma, Cham,
     155            Cherokee, Cherokee_Sup, CJK, CJK_Compat, CJK_Compat_Forms,
    153156            CJK_Compat_Ideographs, CJK_Compat_Ideographs_Sup, CJK_Ext_A,
    154157            CJK_Ext_B, CJK_Ext_C, CJK_Ext_D, CJK_Ext_E, CJK_Radicals_Sup,
     
    156159            Coptic_Epact_Numbers, Counting_Rod, Cuneiform,
    157160            Cuneiform_Numbers, Currency_Symbols, Cypriot_Syllabary,
    158             Cyrillic, Cyrillic_Ext_A, Cyrillic_Ext_B, Cyrillic_Sup, Deseret,
    159             Devanagari, Devanagari_Ext, Diacriticals, Diacriticals_Ext,
    160             Diacriticals_For_Symbols, Diacriticals_Sup, Dingbats, Domino,
    161             Duployan, Early_Dynastic_Cuneiform, Egyptian_Hieroglyphs,
    162             Elbasan, Emoticons, Enclosed_Alphanum, Enclosed_Alphanum_Sup,
    163             Enclosed_CJK, Enclosed_Ideographic_Sup, Ethiopic, Ethiopic_Ext,
    164             Ethiopic_Ext_A, Ethiopic_Sup, Geometric_Shapes,
    165             Geometric_Shapes_Ext, Georgian, Georgian_Sup, Glagolitic,
    166             Gothic, Grantha, Greek, Greek_Ext, Gujarati, Gurmukhi,
    167             Half_And_Full_Forms, Half_Marks, Hangul, Hanunoo, Hatran,
    168             Hebrew, High_PU_Surrogates, High_Surrogates, Hiragana, IDC,
    169             Imperial_Aramaic, Indic_Number_Forms, Inscriptional_Pahlavi,
     161            Cyrillic, Cyrillic_Ext_A, Cyrillic_Ext_B, Cyrillic_Ext_C,
     162            Cyrillic_Sup, Deseret, Devanagari, Devanagari_Ext, Diacriticals,
     163            Diacriticals_Ext, Diacriticals_For_Symbols, Diacriticals_Sup,
     164            Dingbats, Domino, Duployan, Early_Dynastic_Cuneiform,
     165            Egyptian_Hieroglyphs, Elbasan, Emoticons, Enclosed_Alphanum,
     166            Enclosed_Alphanum_Sup, Enclosed_CJK, Enclosed_Ideographic_Sup,
     167            Ethiopic, Ethiopic_Ext, Ethiopic_Ext_A, Ethiopic_Sup,
     168            Geometric_Shapes, Geometric_Shapes_Ext, Georgian, Georgian_Sup,
     169            Glagolitic, Glagolitic_Sup, Gothic, Grantha, Greek, Greek_Ext,
     170            Gujarati, Gurmukhi, Half_And_Full_Forms, Half_Marks, Hangul,
     171            Hanunoo, Hatran, Hebrew, High_PU_Surrogates, High_Surrogates,
     172            Hiragana, IDC, Ideographic_Symbols, Imperial_Aramaic,
     173            Indic_Number_Forms, Inscriptional_Pahlavi,
    170174            Inscriptional_Parthian, IPA_Ext, Jamo, Jamo_Ext_A, Jamo_Ext_B,
    171175            Javanese, Kaithi, Kana_Sup, Kanbun, Kangxi, Kannada, Katakana,
     
    176180            Linear_B_Ideograms, Linear_B_Syllabary, Lisu, Low_Surrogates,
    177181            Lycian, Lydian, Mahajani, Mahjong, Malayalam, Mandaic,
    178             Manichaean, Math_Alphanum, Math_Operators, Meetei_Mayek,
    179             Meetei_Mayek_Ext, Mende_Kikakui, Meroitic_Cursive,
     182            Manichaean, Marchen, Math_Alphanum, Math_Operators,
     183            Meetei_Mayek, Meetei_Mayek_Ext, Mende_Kikakui, Meroitic_Cursive,
    180184            Meroitic_Hieroglyphs, Miao, Misc_Arrows, Misc_Math_Symbols_A,
    181185            Misc_Math_Symbols_B, Misc_Pictographs, Misc_Symbols,
    182186            Misc_Technical, Modi, Modifier_Letters, Modifier_Tone_Letters,
    183             Mongolian, Mro, Multani, Music, Myanmar, Myanmar_Ext_A,
    184             Myanmar_Ext_B, Nabataean, NB, New_Tai_Lue, NKo, Number_Forms,
    185             OCR, Ogham, Ol_Chiki, Old_Hungarian, Old_Italic,
    186             Old_North_Arabian, Old_Permic, Old_Persian, Old_South_Arabian,
    187             Old_Turkic, Oriya, Ornamental_Dingbats, Osmanya, Pahawh_Hmong,
    188             Palmyrene, Pau_Cin_Hau, Phags_Pa, Phaistos, Phoenician,
    189             Phonetic_Ext, Phonetic_Ext_Sup, Playing_Cards, Psalter_Pahlavi,
    190             PUA, Punctuation, Rejang, Rumi, Runic, Samaritan, Saurashtra,
    191             Sharada, Shavian, Shorthand_Format_Controls, Siddham, Sinhala,
     187            Mongolian, Mongolian_Sup, Mro, Multani, Music, Myanmar,
     188            Myanmar_Ext_A, Myanmar_Ext_B, Nabataean, NB, New_Tai_Lue, Newa,
     189            NKo, Number_Forms, OCR, Ogham, Ol_Chiki, Old_Hungarian,
     190            Old_Italic, Old_North_Arabian, Old_Permic, Old_Persian,
     191            Old_South_Arabian, Old_Turkic, Oriya, Ornamental_Dingbats,
     192            Osage, Osmanya, Pahawh_Hmong, Palmyrene, Pau_Cin_Hau, Phags_Pa,
     193            Phaistos, Phoenician, Phonetic_Ext, Phonetic_Ext_Sup,
     194            Playing_Cards, Psalter_Pahlavi, PUA, Punctuation, Rejang, Rumi,
     195            Runic, Samaritan, Saurashtra, Sharada, Shavian,
     196            Shorthand_Format_Controls, Siddham, Sinhala,
    192197            Sinhala_Archaic_Numbers, Small_Forms, Sora_Sompeng, Specials,
    193198            Sundanese, Sundanese_Sup, Sup_Arrows_A, Sup_Arrows_B,
     
    196201            Sutton_SignWriting, Syloti_Nagri, Syriac, Tagalog, Tagbanwa,
    197202            Tags, Tai_Le, Tai_Tham, Tai_Viet, Tai_Xuan_Jing, Takri, Tamil,
    198             Telugu, Thaana, Thai, Tibetan, Tifinagh, Tirhuta,
    199             Transport_And_Map, UCAS, UCAS_Ext, Ugaritic, Vai, Vedic_Ext,
    200             Vertical_Forms, VS, VS_Sup, Warang_Citi, Yi_Radicals,
    201             Yi_Syllables, Yijing};
    202         const static std::vector<std::string> enum_names = {
    203             "Aegean_Numbers", "Ahom", "Alchemical", "Alphabetic_PF",
    204             "Anatolian_Hieroglyphs", "Ancient_Greek_Music",
     203            Tangut, Tangut_Components, Telugu, Thaana, Thai, Tibetan,
     204            Tifinagh, Tirhuta, Transport_And_Map, UCAS, UCAS_Ext, Ugaritic,
     205            Vai, Vedic_Ext, Vertical_Forms, VS, VS_Sup, Warang_Citi,
     206            Yi_Radicals, Yi_Syllables, Yijing};
     207        const static std::vector<std::string> enum_names = {
     208            "Adlam", "Aegean_Numbers", "Ahom", "Alchemical",
     209            "Alphabetic_PF", "Anatolian_Hieroglyphs", "Ancient_Greek_Music",
    205210            "Ancient_Greek_Numbers", "Ancient_Symbols", "Arabic",
    206211            "Arabic_Ext_A", "Arabic_Math", "Arabic_PF_A", "Arabic_PF_B",
    207212            "Arabic_Sup", "Armenian", "Arrows", "ASCII", "Avestan",
    208213            "Balinese", "Bamum", "Bamum_Sup", "Bassa_Vah", "Batak",
    209             "Bengali", "Block_Elements", "Bopomofo", "Bopomofo_Ext",
    210             "Box_Drawing", "Brahmi", "Braille", "Buginese", "Buhid",
    211             "Byzantine_Music", "Carian", "Caucasian_Albanian", "Chakma",
    212             "Cham", "Cherokee", "Cherokee_Sup", "CJK", "CJK_Compat",
    213             "CJK_Compat_Forms", "CJK_Compat_Ideographs",
     214            "Bengali", "Bhaiksuki", "Block_Elements", "Bopomofo",
     215            "Bopomofo_Ext", "Box_Drawing", "Brahmi", "Braille", "Buginese",
     216            "Buhid", "Byzantine_Music", "Carian", "Caucasian_Albanian",
     217            "Chakma", "Cham", "Cherokee", "Cherokee_Sup", "CJK",
     218            "CJK_Compat", "CJK_Compat_Forms", "CJK_Compat_Ideographs",
    214219            "CJK_Compat_Ideographs_Sup", "CJK_Ext_A", "CJK_Ext_B",
    215220            "CJK_Ext_C", "CJK_Ext_D", "CJK_Ext_E", "CJK_Radicals_Sup",
     
    217222            "Coptic", "Coptic_Epact_Numbers", "Counting_Rod", "Cuneiform",
    218223            "Cuneiform_Numbers", "Currency_Symbols", "Cypriot_Syllabary",
    219             "Cyrillic", "Cyrillic_Ext_A", "Cyrillic_Ext_B", "Cyrillic_Sup",
    220             "Deseret", "Devanagari", "Devanagari_Ext", "Diacriticals",
    221             "Diacriticals_Ext", "Diacriticals_For_Symbols",
    222             "Diacriticals_Sup", "Dingbats", "Domino", "Duployan",
    223             "Early_Dynastic_Cuneiform", "Egyptian_Hieroglyphs", "Elbasan",
    224             "Emoticons", "Enclosed_Alphanum", "Enclosed_Alphanum_Sup",
    225             "Enclosed_CJK", "Enclosed_Ideographic_Sup", "Ethiopic",
    226             "Ethiopic_Ext", "Ethiopic_Ext_A", "Ethiopic_Sup",
    227             "Geometric_Shapes", "Geometric_Shapes_Ext", "Georgian",
    228             "Georgian_Sup", "Glagolitic", "Gothic", "Grantha", "Greek",
     224            "Cyrillic", "Cyrillic_Ext_A", "Cyrillic_Ext_B",
     225            "Cyrillic_Ext_C", "Cyrillic_Sup", "Deseret", "Devanagari",
     226            "Devanagari_Ext", "Diacriticals", "Diacriticals_Ext",
     227            "Diacriticals_For_Symbols", "Diacriticals_Sup", "Dingbats",
     228            "Domino", "Duployan", "Early_Dynastic_Cuneiform",
     229            "Egyptian_Hieroglyphs", "Elbasan", "Emoticons",
     230            "Enclosed_Alphanum", "Enclosed_Alphanum_Sup", "Enclosed_CJK",
     231            "Enclosed_Ideographic_Sup", "Ethiopic", "Ethiopic_Ext",
     232            "Ethiopic_Ext_A", "Ethiopic_Sup", "Geometric_Shapes",
     233            "Geometric_Shapes_Ext", "Georgian", "Georgian_Sup",
     234            "Glagolitic", "Glagolitic_Sup", "Gothic", "Grantha", "Greek",
    229235            "Greek_Ext", "Gujarati", "Gurmukhi", "Half_And_Full_Forms",
    230236            "Half_Marks", "Hangul", "Hanunoo", "Hatran", "Hebrew",
    231237            "High_PU_Surrogates", "High_Surrogates", "Hiragana", "IDC",
    232             "Imperial_Aramaic", "Indic_Number_Forms",
     238            "Ideographic_Symbols", "Imperial_Aramaic", "Indic_Number_Forms",
    233239            "Inscriptional_Pahlavi", "Inscriptional_Parthian", "IPA_Ext",
    234240            "Jamo", "Jamo_Ext_A", "Jamo_Ext_B", "Javanese", "Kaithi",
     
    241247            "Linear_B_Syllabary", "Lisu", "Low_Surrogates", "Lycian",
    242248            "Lydian", "Mahajani", "Mahjong", "Malayalam", "Mandaic",
    243             "Manichaean", "Math_Alphanum", "Math_Operators", "Meetei_Mayek",
    244             "Meetei_Mayek_Ext", "Mende_Kikakui", "Meroitic_Cursive",
    245             "Meroitic_Hieroglyphs", "Miao", "Misc_Arrows",
    246             "Misc_Math_Symbols_A", "Misc_Math_Symbols_B",
     249            "Manichaean", "Marchen", "Math_Alphanum", "Math_Operators",
     250            "Meetei_Mayek", "Meetei_Mayek_Ext", "Mende_Kikakui",
     251            "Meroitic_Cursive", "Meroitic_Hieroglyphs", "Miao",
     252            "Misc_Arrows", "Misc_Math_Symbols_A", "Misc_Math_Symbols_B",
    247253            "Misc_Pictographs", "Misc_Symbols", "Misc_Technical", "Modi",
    248             "Modifier_Letters", "Modifier_Tone_Letters", "Mongolian", "Mro",
    249             "Multani", "Music", "Myanmar", "Myanmar_Ext_A", "Myanmar_Ext_B",
    250             "Nabataean", "NB", "New_Tai_Lue", "NKo", "Number_Forms", "OCR",
    251             "Ogham", "Ol_Chiki", "Old_Hungarian", "Old_Italic",
    252             "Old_North_Arabian", "Old_Permic", "Old_Persian",
    253             "Old_South_Arabian", "Old_Turkic", "Oriya",
    254             "Ornamental_Dingbats", "Osmanya", "Pahawh_Hmong", "Palmyrene",
    255             "Pau_Cin_Hau", "Phags_Pa", "Phaistos", "Phoenician",
    256             "Phonetic_Ext", "Phonetic_Ext_Sup", "Playing_Cards",
    257             "Psalter_Pahlavi", "PUA", "Punctuation", "Rejang", "Rumi",
    258             "Runic", "Samaritan", "Saurashtra", "Sharada", "Shavian",
    259             "Shorthand_Format_Controls", "Siddham", "Sinhala",
     254            "Modifier_Letters", "Modifier_Tone_Letters", "Mongolian",
     255            "Mongolian_Sup", "Mro", "Multani", "Music", "Myanmar",
     256            "Myanmar_Ext_A", "Myanmar_Ext_B", "Nabataean", "NB",
     257            "New_Tai_Lue", "Newa", "NKo", "Number_Forms", "OCR", "Ogham",
     258            "Ol_Chiki", "Old_Hungarian", "Old_Italic", "Old_North_Arabian",
     259            "Old_Permic", "Old_Persian", "Old_South_Arabian", "Old_Turkic",
     260            "Oriya", "Ornamental_Dingbats", "Osage", "Osmanya",
     261            "Pahawh_Hmong", "Palmyrene", "Pau_Cin_Hau", "Phags_Pa",
     262            "Phaistos", "Phoenician", "Phonetic_Ext", "Phonetic_Ext_Sup",
     263            "Playing_Cards", "Psalter_Pahlavi", "PUA", "Punctuation",
     264            "Rejang", "Rumi", "Runic", "Samaritan", "Saurashtra", "Sharada",
     265            "Shavian", "Shorthand_Format_Controls", "Siddham", "Sinhala",
    260266            "Sinhala_Archaic_Numbers", "Small_Forms", "Sora_Sompeng",
    261267            "Specials", "Sundanese", "Sundanese_Sup", "Sup_Arrows_A",
     
    265271            "Sutton_SignWriting", "Syloti_Nagri", "Syriac", "Tagalog",
    266272            "Tagbanwa", "Tags", "Tai_Le", "Tai_Tham", "Tai_Viet",
    267             "Tai_Xuan_Jing", "Takri", "Tamil", "Telugu", "Thaana", "Thai",
    268             "Tibetan", "Tifinagh", "Tirhuta", "Transport_And_Map", "UCAS",
    269             "UCAS_Ext", "Ugaritic", "Vai", "Vedic_Ext", "Vertical_Forms",
    270             "VS", "VS_Sup", "Warang_Citi", "Yi_Radicals", "Yi_Syllables",
     273            "Tai_Xuan_Jing", "Takri", "Tamil", "Tangut",
     274            "Tangut_Components", "Telugu", "Thaana", "Thai", "Tibetan",
     275            "Tifinagh", "Tirhuta", "Transport_And_Map", "UCAS", "UCAS_Ext",
     276            "Ugaritic", "Vai", "Vedic_Ext", "Vertical_Forms", "VS",
     277            "VS_Sup", "Warang_Citi", "Yi_Radicals", "Yi_Syllables",
    271278            "Yijing"};
    272279        const static std::vector<std::string> value_names = {
    273             "Aegean_Numbers", "Ahom", "Alchemical_Symbols",
     280            "Adlam", "Aegean_Numbers", "Ahom", "Alchemical_Symbols",
    274281            "Alphabetic_Presentation_Forms", "Anatolian_Hieroglyphs",
    275282            "Ancient_Greek_Musical_Notation", "Ancient_Greek_Numbers",
     
    279286            "Arabic_Supplement", "Armenian", "Arrows", "Basic_Latin",
    280287            "Avestan", "Balinese", "Bamum", "Bamum_Supplement", "Bassa_Vah",
    281             "Batak", "Bengali", "Block_Elements", "Bopomofo",
     288            "Batak", "Bengali", "Bhaiksuki", "Block_Elements", "Bopomofo",
    282289            "Bopomofo_Extended", "Box_Drawing", "Brahmi",
    283290            "Braille_Patterns", "Buginese", "Buhid",
     
    297304            "Cuneiform_Numbers_And_Punctuation", "Currency_Symbols",
    298305            "Cypriot_Syllabary", "Cyrillic", "Cyrillic_Extended_A",
    299             "Cyrillic_Extended_B", "Cyrillic_Supplement", "Deseret",
    300             "Devanagari", "Devanagari_Extended",
    301             "Combining_Diacritical_Marks",
     306            "Cyrillic_Extended_B", "Cyrillic_Extended_C",
     307            "Cyrillic_Supplement", "Deseret", "Devanagari",
     308            "Devanagari_Extended", "Combining_Diacritical_Marks",
    302309            "Combining_Diacritical_Marks_Extended",
    303310            "Combining_Diacritical_Marks_For_Symbols",
     
    311318            "Ethiopic_Supplement", "Geometric_Shapes",
    312319            "Geometric_Shapes_Extended", "Georgian", "Georgian_Supplement",
    313             "Glagolitic", "Gothic", "Grantha", "Greek_And_Coptic",
    314             "Greek_Extended", "Gujarati", "Gurmukhi",
     320            "Glagolitic", "Glagolitic_Supplement", "Gothic", "Grantha",
     321            "Greek_And_Coptic", "Greek_Extended", "Gujarati", "Gurmukhi",
    315322            "Halfwidth_And_Fullwidth_Forms", "Combining_Half_Marks",
    316323            "Hangul_Syllables", "Hanunoo", "Hatran", "Hebrew",
    317324            "High_Private_Use_Surrogates", "High_Surrogates", "Hiragana",
    318             "Ideographic_Description_Characters", "Imperial_Aramaic",
     325            "Ideographic_Description_Characters",
     326            "Ideographic_Symbols_And_Punctuation", "Imperial_Aramaic",
    319327            "Common_Indic_Number_Forms", "Inscriptional_Pahlavi",
    320328            "Inscriptional_Parthian", "IPA_Extensions", "Hangul_Jamo",
     
    330338            "Low_Surrogates", "Lycian", "Lydian", "Mahajani",
    331339            "Mahjong_Tiles", "Malayalam", "Mandaic", "Manichaean",
    332             "Mathematical_Alphanumeric_Symbols", "Mathematical_Operators",
    333             "Meetei_Mayek", "Meetei_Mayek_Extensions", "Mende_Kikakui",
    334             "Meroitic_Cursive", "Meroitic_Hieroglyphs", "Miao",
     340            "Marchen", "Mathematical_Alphanumeric_Symbols",
     341            "Mathematical_Operators", "Meetei_Mayek",
     342            "Meetei_Mayek_Extensions", "Mende_Kikakui", "Meroitic_Cursive",
     343            "Meroitic_Hieroglyphs", "Miao",
    335344            "Miscellaneous_Symbols_And_Arrows",
    336345            "Miscellaneous_Mathematical_Symbols_A",
     
    339348            "Miscellaneous_Symbols", "Miscellaneous_Technical", "Modi",
    340349            "Spacing_Modifier_Letters", "Modifier_Tone_Letters",
    341             "Mongolian", "Mro", "Multani", "Musical_Symbols", "Myanmar",
    342             "Myanmar_Extended_A", "Myanmar_Extended_B", "Nabataean",
    343             "No_Block", "New_Tai_Lue", "NKo", "Number_Forms",
    344             "Optical_Character_Recognition", "Ogham", "Ol_Chiki",
    345             "Old_Hungarian", "Old_Italic", "Old_North_Arabian",
    346             "Old_Permic", "Old_Persian", "Old_South_Arabian", "Old_Turkic",
    347             "Oriya", "Ornamental_Dingbats", "Osmanya", "Pahawh_Hmong",
     350            "Mongolian", "Mongolian_Supplement", "Mro", "Multani",
     351            "Musical_Symbols", "Myanmar", "Myanmar_Extended_A",
     352            "Myanmar_Extended_B", "Nabataean", "No_Block", "New_Tai_Lue",
     353            "Newa", "NKo", "Number_Forms", "Optical_Character_Recognition",
     354            "Ogham", "Ol_Chiki", "Old_Hungarian", "Old_Italic",
     355            "Old_North_Arabian", "Old_Permic", "Old_Persian",
     356            "Old_South_Arabian", "Old_Turkic", "Oriya",
     357            "Ornamental_Dingbats", "Osage", "Osmanya", "Pahawh_Hmong",
    348358            "Palmyrene", "Pau_Cin_Hau", "Phags_Pa", "Phaistos_Disc",
    349359            "Phoenician", "Phonetic_Extensions",
     
    363373            "Syloti_Nagri", "Syriac", "Tagalog", "Tagbanwa", "Tags",
    364374            "Tai_Le", "Tai_Tham", "Tai_Viet", "Tai_Xuan_Jing_Symbols",
    365             "Takri", "Tamil", "Telugu", "Thaana", "Thai", "Tibetan",
    366             "Tifinagh", "Tirhuta", "Transport_And_Map_Symbols",
     375            "Takri", "Tamil", "Tangut", "Tangut_Components", "Telugu",
     376            "Thaana", "Thai", "Tibetan", "Tifinagh", "Tirhuta",
     377            "Transport_And_Map_Symbols",
    367378            "Unified_Canadian_Aboriginal_Syllabics",
    368379            "Unified_Canadian_Aboriginal_Syllabics_Extended", "Ugaritic",
     
    380391    namespace SC_ns {
    381392        enum value_t {
    382             Aghb, Ahom, Arab, Armi, Armn, Avst, Bali, Bamu, Bass, Batk,
    383             Beng, Bopo, Brah, Brai, Bugi, Buhd, Cakm, Cans, Cari, Cham,
    384             Cher, Copt, Cprt, Cyrl, Deva, Dsrt, Dupl, Egyp, Elba, Ethi,
    385             Geor, Glag, Goth, Gran, Grek, Gujr, Guru, Hang, Hani, Hano,
    386             Hatr, Hebr, Hira, Hluw, Hmng, Hrkt, Hung, Ital, Java, Kali,
    387             Kana, Khar, Khmr, Khoj, Knda, Kthi, Lana, Laoo, Latn, Lepc,
    388             Limb, Lina, Linb, Lisu, Lyci, Lydi, Mahj, Mand, Mani, Mend,
    389             Merc, Mero, Mlym, Modi, Mong, Mroo, Mtei, Mult, Mymr, Narb,
    390             Nbat, Nkoo, Ogam, Olck, Orkh, Orya, Osma, Palm, Pauc, Perm,
    391             Phag, Phli, Phlp, Phnx, Plrd, Prti, Rjng, Runr, Samr, Sarb,
    392             Saur, Sgnw, Shaw, Shrd, Sidd, Sind, Sinh, Sora, Sund, Sylo,
    393             Syrc, Tagb, Takr, Tale, Talu, Taml, Tavt, Telu, Tfng, Tglg,
    394             Thaa, Thai, Tibt, Tirh, Ugar, Vaii, Wara, Xpeo, Xsux, Yiii,
    395             Zinh, Zyyy, Zzzz};
    396         const static std::vector<std::string> enum_names = {
    397             "Aghb", "Ahom", "Arab", "Armi", "Armn", "Avst", "Bali", "Bamu",
    398             "Bass", "Batk", "Beng", "Bopo", "Brah", "Brai", "Bugi", "Buhd",
    399             "Cakm", "Cans", "Cari", "Cham", "Cher", "Copt", "Cprt", "Cyrl",
    400             "Deva", "Dsrt", "Dupl", "Egyp", "Elba", "Ethi", "Geor", "Glag",
    401             "Goth", "Gran", "Grek", "Gujr", "Guru", "Hang", "Hani", "Hano",
    402             "Hatr", "Hebr", "Hira", "Hluw", "Hmng", "Hrkt", "Hung", "Ital",
    403             "Java", "Kali", "Kana", "Khar", "Khmr", "Khoj", "Knda", "Kthi",
    404             "Lana", "Laoo", "Latn", "Lepc", "Limb", "Lina", "Linb", "Lisu",
    405             "Lyci", "Lydi", "Mahj", "Mand", "Mani", "Mend", "Merc", "Mero",
    406             "Mlym", "Modi", "Mong", "Mroo", "Mtei", "Mult", "Mymr", "Narb",
    407             "Nbat", "Nkoo", "Ogam", "Olck", "Orkh", "Orya", "Osma", "Palm",
    408             "Pauc", "Perm", "Phag", "Phli", "Phlp", "Phnx", "Plrd", "Prti",
    409             "Rjng", "Runr", "Samr", "Sarb", "Saur", "Sgnw", "Shaw", "Shrd",
    410             "Sidd", "Sind", "Sinh", "Sora", "Sund", "Sylo", "Syrc", "Tagb",
    411             "Takr", "Tale", "Talu", "Taml", "Tavt", "Telu", "Tfng", "Tglg",
    412             "Thaa", "Thai", "Tibt", "Tirh", "Ugar", "Vaii", "Wara", "Xpeo",
    413             "Xsux", "Yiii", "Zinh", "Zyyy", "Zzzz"};
    414         const static std::vector<std::string> value_names = {
    415             "Caucasian_Albanian", "Ahom", "Arabic", "Imperial_Aramaic",
    416             "Armenian", "Avestan", "Balinese", "Bamum", "Bassa_Vah",
    417             "Batak", "Bengali", "Bopomofo", "Brahmi", "Braille", "Buginese",
    418             "Buhid", "Chakma", "Canadian_Aboriginal", "Carian", "Cham",
    419             "Cherokee", "Coptic", "Cypriot", "Cyrillic", "Devanagari",
    420             "Deseret", "Duployan", "Egyptian_Hieroglyphs", "Elbasan",
    421             "Ethiopic", "Georgian", "Glagolitic", "Gothic", "Grantha",
    422             "Greek", "Gujarati", "Gurmukhi", "Hangul", "Han", "Hanunoo",
    423             "Hatran", "Hebrew", "Hiragana", "Anatolian_Hieroglyphs",
    424             "Pahawh_Hmong", "Katakana_Or_Hiragana", "Old_Hungarian",
    425             "Old_Italic", "Javanese", "Kayah_Li", "Katakana", "Kharoshthi",
    426             "Khmer", "Khojki", "Kannada", "Kaithi", "Tai_Tham", "Lao",
    427             "Latin", "Lepcha", "Limbu", "Linear_A", "Linear_B", "Lisu",
    428             "Lycian", "Lydian", "Mahajani", "Mandaic", "Manichaean",
     393            Adlm, Aghb, Ahom, Arab, Armi, Armn, Avst, Bali, Bamu, Bass,
     394            Batk, Beng, Bhks, Bopo, Brah, Brai, Bugi, Buhd, Cakm, Cans,
     395            Cari, Cham, Cher, Copt, Cprt, Cyrl, Deva, Dsrt, Dupl, Egyp,
     396            Elba, Ethi, Geor, Glag, Goth, Gran, Grek, Gujr, Guru, Hang,
     397            Hani, Hano, Hatr, Hebr, Hira, Hluw, Hmng, Hrkt, Hung, Ital,
     398            Java, Kali, Kana, Khar, Khmr, Khoj, Knda, Kthi, Lana, Laoo,
     399            Latn, Lepc, Limb, Lina, Linb, Lisu, Lyci, Lydi, Mahj, Mand,
     400            Mani, Marc, Mend, Merc, Mero, Mlym, Modi, Mong, Mroo, Mtei,
     401            Mult, Mymr, Narb, Nbat, Newa, Nkoo, Ogam, Olck, Orkh, Orya,
     402            Osge, Osma, Palm, Pauc, Perm, Phag, Phli, Phlp, Phnx, Plrd,
     403            Prti, Rjng, Runr, Samr, Sarb, Saur, Sgnw, Shaw, Shrd, Sidd,
     404            Sind, Sinh, Sora, Sund, Sylo, Syrc, Tagb, Takr, Tale, Talu,
     405            Taml, Tang, Tavt, Telu, Tfng, Tglg, Thaa, Thai, Tibt, Tirh,
     406            Ugar, Vaii, Wara, Xpeo, Xsux, Yiii, Zinh, Zyyy, Zzzz};
     407        const static std::vector<std::string> enum_names = {
     408            "Adlm", "Aghb", "Ahom", "Arab", "Armi", "Armn", "Avst", "Bali",
     409            "Bamu", "Bass", "Batk", "Beng", "Bhks", "Bopo", "Brah", "Brai",
     410            "Bugi", "Buhd", "Cakm", "Cans", "Cari", "Cham", "Cher", "Copt",
     411            "Cprt", "Cyrl", "Deva", "Dsrt", "Dupl", "Egyp", "Elba", "Ethi",
     412            "Geor", "Glag", "Goth", "Gran", "Grek", "Gujr", "Guru", "Hang",
     413            "Hani", "Hano", "Hatr", "Hebr", "Hira", "Hluw", "Hmng", "Hrkt",
     414            "Hung", "Ital", "Java", "Kali", "Kana", "Khar", "Khmr", "Khoj",
     415            "Knda", "Kthi", "Lana", "Laoo", "Latn", "Lepc", "Limb", "Lina",
     416            "Linb", "Lisu", "Lyci", "Lydi", "Mahj", "Mand", "Mani", "Marc",
     417            "Mend", "Merc", "Mero", "Mlym", "Modi", "Mong", "Mroo", "Mtei",
     418            "Mult", "Mymr", "Narb", "Nbat", "Newa", "Nkoo", "Ogam", "Olck",
     419            "Orkh", "Orya", "Osge", "Osma", "Palm", "Pauc", "Perm", "Phag",
     420            "Phli", "Phlp", "Phnx", "Plrd", "Prti", "Rjng", "Runr", "Samr",
     421            "Sarb", "Saur", "Sgnw", "Shaw", "Shrd", "Sidd", "Sind", "Sinh",
     422            "Sora", "Sund", "Sylo", "Syrc", "Tagb", "Takr", "Tale", "Talu",
     423            "Taml", "Tang", "Tavt", "Telu", "Tfng", "Tglg", "Thaa", "Thai",
     424            "Tibt", "Tirh", "Ugar", "Vaii", "Wara", "Xpeo", "Xsux", "Yiii",
     425            "Zinh", "Zyyy", "Zzzz"};
     426        const static std::vector<std::string> value_names = {
     427            "Adlam", "Caucasian_Albanian", "Ahom", "Arabic",
     428            "Imperial_Aramaic", "Armenian", "Avestan", "Balinese", "Bamum",
     429            "Bassa_Vah", "Batak", "Bengali", "Bhaiksuki", "Bopomofo",
     430            "Brahmi", "Braille", "Buginese", "Buhid", "Chakma",
     431            "Canadian_Aboriginal", "Carian", "Cham", "Cherokee", "Coptic",
     432            "Cypriot", "Cyrillic", "Devanagari", "Deseret", "Duployan",
     433            "Egyptian_Hieroglyphs", "Elbasan", "Ethiopic", "Georgian",
     434            "Glagolitic", "Gothic", "Grantha", "Greek", "Gujarati",
     435            "Gurmukhi", "Hangul", "Han", "Hanunoo", "Hatran", "Hebrew",
     436            "Hiragana", "Anatolian_Hieroglyphs", "Pahawh_Hmong",
     437            "Katakana_Or_Hiragana", "Old_Hungarian", "Old_Italic",
     438            "Javanese", "Kayah_Li", "Katakana", "Kharoshthi", "Khmer",
     439            "Khojki", "Kannada", "Kaithi", "Tai_Tham", "Lao", "Latin",
     440            "Lepcha", "Limbu", "Linear_A", "Linear_B", "Lisu", "Lycian",
     441            "Lydian", "Mahajani", "Mandaic", "Manichaean", "Marchen",
    429442            "Mende_Kikakui", "Meroitic_Cursive", "Meroitic_Hieroglyphs",
    430443            "Malayalam", "Modi", "Mongolian", "Mro", "Meetei_Mayek",
    431             "Multani", "Myanmar", "Old_North_Arabian", "Nabataean", "Nko",
    432             "Ogham", "Ol_Chiki", "Old_Turkic", "Oriya", "Osmanya",
    433             "Palmyrene", "Pau_Cin_Hau", "Old_Permic", "Phags_Pa",
     444            "Multani", "Myanmar", "Old_North_Arabian", "Nabataean", "Newa",
     445            "Nko", "Ogham", "Ol_Chiki", "Old_Turkic", "Oriya", "Osage",
     446            "Osmanya", "Palmyrene", "Pau_Cin_Hau", "Old_Permic", "Phags_Pa",
    434447            "Inscriptional_Pahlavi", "Psalter_Pahlavi", "Phoenician",
    435448            "Miao", "Inscriptional_Parthian", "Rejang", "Runic",
     
    437450            "Shavian", "Sharada", "Siddham", "Khudawadi", "Sinhala",
    438451            "Sora_Sompeng", "Sundanese", "Syloti_Nagri", "Syriac",
    439             "Tagbanwa", "Takri", "Tai_Le", "New_Tai_Lue", "Tamil",
     452            "Tagbanwa", "Takri", "Tai_Le", "New_Tai_Lue", "Tamil", "Tangut",
    440453            "Tai_Viet", "Telugu", "Tifinagh", "Tagalog", "Thaana", "Thai",
    441454            "Tibetan", "Tirhuta", "Ugaritic", "Vai", "Warang_Citi",
     
    599612    namespace GCB_ns {
    600613        enum value_t {
    601             CN, CR, EX, L, LF, LV, LVT, PP, RI, SM, T, V, XX};
    602         const static std::vector<std::string> enum_names = {
    603             "CN", "CR", "EX", "L", "LF", "LV", "LVT", "PP", "RI", "SM", "T",
    604             "V", "XX"};
    605         const static std::vector<std::string> value_names = {
    606             "Control", "CR", "Extend", "L", "LF", "LV", "LVT", "Prepend",
    607             "Regional_Indicator", "SpacingMark", "T", "V", "Other"};
     614            CN, CR, EB, EBG, EM, EX, GAZ, L, LF, LV, LVT, PP, RI, SM, T, V,
     615            XX, ZWJ};
     616        const static std::vector<std::string> enum_names = {
     617            "CN", "CR", "EB", "EBG", "EM", "EX", "GAZ", "L", "LF", "LV",
     618            "LVT", "PP", "RI", "SM", "T", "V", "XX", "ZWJ"};
     619        const static std::vector<std::string> value_names = {
     620            "Control", "CR", "E_Base", "E_Base_GAZ", "E_Modifier", "Extend",
     621            "Glue_After_Zwj", "L", "LF", "LV", "LVT", "Prepend",
     622            "Regional_Indicator", "SpacingMark", "T", "V", "Other", "ZWJ"};
    608623        static std::unordered_map<std::string, int> aliases_only_map {{
    609624            }};
     
    686701    namespace JG_ns {
    687702        enum value_t {
    688             Ain, Alaph, Alef, Beh, Beth, Burushaski_Yeh_Barree, Dal,
    689             Dalath_Rish, E, Farsi_Yeh, Fe, Feh, Final_Semkath, Gaf, Gamal,
    690             Hah, He, Heh, Heh_Goal, Heth, Kaf, Kaph, Khaph, Knotted_Heh,
    691             Lam, Lamadh, Manichaean_Aleph, Manichaean_Ayin, Manichaean_Beth,
    692             Manichaean_Daleth, Manichaean_Dhamedh, Manichaean_Five,
    693             Manichaean_Gimel, Manichaean_Heth, Manichaean_Hundred,
    694             Manichaean_Kaph, Manichaean_Lamedh, Manichaean_Mem,
    695             Manichaean_Nun, Manichaean_One, Manichaean_Pe, Manichaean_Qoph,
    696             Manichaean_Resh, Manichaean_Sadhe, Manichaean_Samekh,
    697             Manichaean_Taw, Manichaean_Ten, Manichaean_Teth,
    698             Manichaean_Thamedh, Manichaean_Twenty, Manichaean_Waw,
    699             Manichaean_Yodh, Manichaean_Zayin, Meem, Mim, No_Joining_Group,
    700             Noon, Nun, Nya, Pe, Qaf, Qaph, Reh, Reversed_Pe, Rohingya_Yeh,
    701             Sad, Sadhe, Seen, Semkath, Shin, Straight_Waw, Swash_Kaf,
    702             Syriac_Waw, Tah, Taw, Teh_Marbuta, Teh_Marbuta_Goal, Teth, Waw,
    703             Yeh, Yeh_Barree, Yeh_With_Tail, Yudh, Yudh_He, Zain, Zhain};
    704         const static std::vector<std::string> enum_names = {
    705             "Ain", "Alaph", "Alef", "Beh", "Beth", "Burushaski_Yeh_Barree",
    706             "Dal", "Dalath_Rish", "E", "Farsi_Yeh", "Fe", "Feh",
    707             "Final_Semkath", "Gaf", "Gamal", "Hah", "He", "Heh", "Heh_Goal",
    708             "Heth", "Kaf", "Kaph", "Khaph", "Knotted_Heh", "Lam", "Lamadh",
     703            African_Feh, African_Noon, African_Qaf, Ain, Alaph, Alef, Beh,
     704            Beth, Burushaski_Yeh_Barree, Dal, Dalath_Rish, E, Farsi_Yeh, Fe,
     705            Feh, Final_Semkath, Gaf, Gamal, Hah, He, Heh, Heh_Goal, Heth,
     706            Kaf, Kaph, Khaph, Knotted_Heh, Lam, Lamadh, Manichaean_Aleph,
     707            Manichaean_Ayin, Manichaean_Beth, Manichaean_Daleth,
     708            Manichaean_Dhamedh, Manichaean_Five, Manichaean_Gimel,
     709            Manichaean_Heth, Manichaean_Hundred, Manichaean_Kaph,
     710            Manichaean_Lamedh, Manichaean_Mem, Manichaean_Nun,
     711            Manichaean_One, Manichaean_Pe, Manichaean_Qoph, Manichaean_Resh,
     712            Manichaean_Sadhe, Manichaean_Samekh, Manichaean_Taw,
     713            Manichaean_Ten, Manichaean_Teth, Manichaean_Thamedh,
     714            Manichaean_Twenty, Manichaean_Waw, Manichaean_Yodh,
     715            Manichaean_Zayin, Meem, Mim, No_Joining_Group, Noon, Nun, Nya,
     716            Pe, Qaf, Qaph, Reh, Reversed_Pe, Rohingya_Yeh, Sad, Sadhe, Seen,
     717            Semkath, Shin, Straight_Waw, Swash_Kaf, Syriac_Waw, Tah, Taw,
     718            Teh_Marbuta, Teh_Marbuta_Goal, Teth, Waw, Yeh, Yeh_Barree,
     719            Yeh_With_Tail, Yudh, Yudh_He, Zain, Zhain};
     720        const static std::vector<std::string> enum_names = {
     721            "African_Feh", "African_Noon", "African_Qaf", "Ain", "Alaph",
     722            "Alef", "Beh", "Beth", "Burushaski_Yeh_Barree", "Dal",
     723            "Dalath_Rish", "E", "Farsi_Yeh", "Fe", "Feh", "Final_Semkath",
     724            "Gaf", "Gamal", "Hah", "He", "Heh", "Heh_Goal", "Heth", "Kaf",
     725            "Kaph", "Khaph", "Knotted_Heh", "Lam", "Lamadh",
    709726            "Manichaean_Aleph", "Manichaean_Ayin", "Manichaean_Beth",
    710727            "Manichaean_Daleth", "Manichaean_Dhamedh", "Manichaean_Five",
     
    723740            "Yudh_He", "Zain", "Zhain"};
    724741        const static std::vector<std::string> value_names = {
    725             "Ain", "Alaph", "Alef", "Beh", "Beth", "Burushaski_Yeh_Barree",
    726             "Dal", "Dalath_Rish", "E", "Farsi_Yeh", "Fe", "Feh",
    727             "Final_Semkath", "Gaf", "Gamal", "Hah", "He", "Heh", "Heh_Goal",
    728             "Heth", "Kaf", "Kaph", "Khaph", "Knotted_Heh", "Lam", "Lamadh",
     742            "African_Feh", "African_Noon", "African_Qaf", "Ain", "Alaph",
     743            "Alef", "Beh", "Beth", "Burushaski_Yeh_Barree", "Dal",
     744            "Dalath_Rish", "E", "Farsi_Yeh", "Fe", "Feh", "Final_Semkath",
     745            "Gaf", "Gamal", "Hah", "He", "Heh", "Heh_Goal", "Heth", "Kaf",
     746            "Kaph", "Khaph", "Knotted_Heh", "Lam", "Lamadh",
    729747            "Manichaean_Aleph", "Manichaean_Ayin", "Manichaean_Beth",
    730748            "Manichaean_Daleth", "Manichaean_Dhamedh", "Manichaean_Five",
     
    760778    namespace LB_ns {
    761779        enum value_t {
    762             AI, AL, B2, BA, BB, BK, CB, CJ, CL, CM, CP, CR, EX, GL, H2, H3,
    763             HL, HY, ID, IN, IS, JL, JT, JV, LF, NL, NS, NU, OP, PO, PR, QU,
    764             RI, SA, SG, SP, SY, WJ, XX, ZW};
     780            AI, AL, B2, BA, BB, BK, CB, CJ, CL, CM, CP, CR, EB, EM, EX, GL,
     781            H2, H3, HL, HY, ID, IN, IS, JL, JT, JV, LF, NL, NS, NU, OP, PO,
     782            PR, QU, RI, SA, SG, SP, SY, WJ, XX, ZW, ZWJ};
    765783        const static std::vector<std::string> enum_names = {
    766784            "AI", "AL", "B2", "BA", "BB", "BK", "CB", "CJ", "CL", "CM",
    767             "CP", "CR", "EX", "GL", "H2", "H3", "HL", "HY", "ID", "IN",
    768             "IS", "JL", "JT", "JV", "LF", "NL", "NS", "NU", "OP", "PO",
    769             "PR", "QU", "RI", "SA", "SG", "SP", "SY", "WJ", "XX", "ZW"};
     785            "CP", "CR", "EB", "EM", "EX", "GL", "H2", "H3", "HL", "HY",
     786            "ID", "IN", "IS", "JL", "JT", "JV", "LF", "NL", "NS", "NU",
     787            "OP", "PO", "PR", "QU", "RI", "SA", "SG", "SP", "SY", "WJ",
     788            "XX", "ZW", "ZWJ"};
    770789        const static std::vector<std::string> value_names = {
    771790            "Ambiguous", "Alphabetic", "Break_Both", "Break_After",
     
    773792            "Conditional_Japanese_Starter", "Close_Punctuation",
    774793            "Combining_Mark", "Close_Parenthesis", "Carriage_Return",
    775             "Exclamation", "Glue", "H2", "H3", "Hebrew_Letter", "Hyphen",
    776             "Ideographic", "Inseparable", "Infix_Numeric", "JL", "JT", "JV",
    777             "Line_Feed", "Next_Line", "Nonstarter", "Numeric",
    778             "Open_Punctuation", "Postfix_Numeric", "Prefix_Numeric",
    779             "Quotation", "Regional_Indicator", "Complex_Context",
    780             "Surrogate", "Space", "Break_Symbols", "Word_Joiner", "Unknown",
    781             "ZWSpace"};
     794            "E_Base", "E_Modifier", "Exclamation", "Glue", "H2", "H3",
     795            "Hebrew_Letter", "Hyphen", "Ideographic", "Inseparable",
     796            "Infix_Numeric", "JL", "JT", "JV", "Line_Feed", "Next_Line",
     797            "Nonstarter", "Numeric", "Open_Punctuation", "Postfix_Numeric",
     798            "Prefix_Numeric", "Quotation", "Regional_Indicator",
     799            "Complex_Context", "Surrogate", "Space", "Break_Symbols",
     800            "Word_Joiner", "Unknown", "ZWSpace", "ZWJ"};
    782801        static std::unordered_map<std::string, int> aliases_only_map {{
    783802            {"inseperable", LB_ns::IN}}};
     
    855874    namespace WB_ns {
    856875        enum value_t {
    857             CR, DQ, EX, Extend, FO, HL, KA, LE, LF, MB, ML, MN, NL, NU, RI,
    858             SQ, XX};
    859         const static std::vector<std::string> enum_names = {
    860             "CR", "DQ", "EX", "Extend", "FO", "HL", "KA", "LE", "LF", "MB",
    861             "ML", "MN", "NL", "NU", "RI", "SQ", "XX"};
    862         const static std::vector<std::string> value_names = {
    863             "CR", "Double_Quote", "ExtendNumLet", "Extend", "Format",
     876            CR, DQ, EB, EBG, EM, EX, Extend, FO, GAZ, HL, KA, LE, LF, MB,
     877            ML, MN, NL, NU, RI, SQ, XX, ZWJ};
     878        const static std::vector<std::string> enum_names = {
     879            "CR", "DQ", "EB", "EBG", "EM", "EX", "Extend", "FO", "GAZ",
     880            "HL", "KA", "LE", "LF", "MB", "ML", "MN", "NL", "NU", "RI",
     881            "SQ", "XX", "ZWJ"};
     882        const static std::vector<std::string> value_names = {
     883            "CR", "Double_Quote", "E_Base", "E_Base_GAZ", "E_Modifier",
     884            "ExtendNumLet", "Extend", "Format", "Glue_After_Zwj",
    864885            "Hebrew_Letter", "Katakana", "ALetter", "LF", "MidNumLet",
    865886            "MidLetter", "MidNum", "Newline", "Numeric",
    866             "Regional_Indicator", "Single_Quote", "Other"};
     887            "Regional_Indicator", "Single_Quote", "Other", "ZWJ"};
    867888        static std::unordered_map<std::string, int> aliases_only_map {{
    868889            }};
Note: See TracChangeset for help on using the changeset viewer.