Ignore:
Timestamp:
Oct 11, 2017, 6:48:36 PM (2 years ago)
Author:
cameron
Message:

Update to UCD 10.0.0

File:
1 edited

Legend:

Unmodified
Added
Removed
  • icGREP/icgrep-devel/icgrep/UCD/PropertyValueAliases.h

    r5661 r5686  
    30 30        enum value_t {
    31 31            Unassigned, V1_1, V2_0, V2_1, V3_0, V3_1, V3_2, V4_0, V4_1,
    32             V5_0, V5_1, V5_2, V6_0, V6_1, V6_2, V6_3, V7_0, V8_0, V9_0};
     32            V5_0, V5_1, V5_2, V6_0, V6_1, V6_2, V6_3, V7_0, V8_0, V9_0,
     33            V10_0};
    33 34        const static std::vector<std::string> enum_names = {
    34 35            "Unassigned", "V1_1", "V2_0", "V2_1", "V3_0", "V3_1", "V3_2",
    35 36            "V4_0", "V4_1", "V5_0", "V5_1", "V5_2", "V6_0", "V6_1", "V6_2",
    36             "V6_3", "V7_0", "V8_0", "V9_0"};
     37            "V6_3", "V7_0", "V8_0", "V9_0", "V10_0"};
    37 38        const static std::vector<std::string> value_names = {
    38 39            "Unassigned", "V1_1", "V2_0", "V2_1", "V3_0", "V3_1", "V3_2",
    39 40            "V4_0", "V4_1", "V5_0", "V5_1", "V5_2", "V6_0", "V6_1", "V6_2",
    40             "V6_3", "V7_0", "V8_0", "V9_0"};
    41         static std::unordered_map<std::string, int> aliases_only_map {{
    42             {"1.1", AGE_ns::V1_1}, {"2.0", AGE_ns::V2_0},
    43             {"2.1", AGE_ns::V2_1}, {"3.0", AGE_ns::V3_0},
    44             {"3.1", AGE_ns::V3_1}, {"3.2", AGE_ns::V3_2},
    45             {"4.0", AGE_ns::V4_0}, {"4.1", AGE_ns::V4_1},
    46             {"5.0", AGE_ns::V5_0}, {"5.1", AGE_ns::V5_1},
    47             {"5.2", AGE_ns::V5_2}, {"6.0", AGE_ns::V6_0},
    48             {"6.1", AGE_ns::V6_1}, {"6.2", AGE_ns::V6_2},
    49             {"6.3", AGE_ns::V6_3}, {"7.0", AGE_ns::V7_0},
    50             {"8.0", AGE_ns::V8_0}, {"9.0", AGE_ns::V9_0},
    51             {"na", AGE_ns::Unassigned}}};
     41            "V6_3", "V7_0", "V8_0", "V9_0", "V10_0"};
     42        static std::unordered_map<std::string, int> aliases_only_map {{
     43            {"1.1", AGE_ns::V1_1}, {"10.0", AGE_ns::V10_0},
     44            {"2.0", AGE_ns::V2_0}, {"2.1", AGE_ns::V2_1},
     45            {"3.0", AGE_ns::V3_0}, {"3.1", AGE_ns::V3_1},
     46            {"3.2", AGE_ns::V3_2}, {"4.0", AGE_ns::V4_0},
     47            {"4.1", AGE_ns::V4_1}, {"5.0", AGE_ns::V5_0},
     48            {"5.1", AGE_ns::V5_1}, {"5.2", AGE_ns::V5_2},
     49            {"6.0", AGE_ns::V6_0}, {"6.1", AGE_ns::V6_1},
     50            {"6.2", AGE_ns::V6_2}, {"6.3", AGE_ns::V6_3},
     51            {"7.0", AGE_ns::V7_0}, {"8.0", AGE_ns::V8_0},
     52            {"9.0", AGE_ns::V9_0}, {"na", AGE_ns::Unassigned}}};
    52 53    }
    53 54
     
    57 58            Modifier_Letters, Diacriticals, Greek, Cyrillic, Cyrillic_Sup,
    58 59            Armenian, Hebrew, Arabic, Syriac, Arabic_Sup, Thaana, NKo,
    59             Samaritan, Mandaic, Arabic_Ext_A, Devanagari, Bengali, Gurmukhi,
    60             Gujarati, Oriya, Tamil, Telugu, Kannada, Malayalam, Sinhala,
    61             Thai, Lao, Tibetan, Myanmar, Georgian, Jamo, Ethiopic,
    62             Ethiopic_Sup, Cherokee, UCAS, Ogham, Runic, Tagalog, Hanunoo,
    63             Buhid, Tagbanwa, Khmer, Mongolian, UCAS_Ext, Limbu, Tai_Le,
    64             New_Tai_Lue, Khmer_Symbols, Buginese, Tai_Tham,
     60            Samaritan, Mandaic, Syriac_Sup, Arabic_Ext_A, Devanagari,
     61            Bengali, Gurmukhi, Gujarati, Oriya, Tamil, Telugu, Kannada,
     62            Malayalam, Sinhala, Thai, Lao, Tibetan, Myanmar, Georgian, Jamo,
     63            Ethiopic, Ethiopic_Sup, Cherokee, UCAS, Ogham, Runic, Tagalog,
     64            Hanunoo, Buhid, Tagbanwa, Khmer, Mongolian, UCAS_Ext, Limbu,
     65            Tai_Le, New_Tai_Lue, Khmer_Symbols, Buginese, Tai_Tham,
    65 66            Diacriticals_Ext, Balinese, Sundanese, Batak, Lepcha, Ol_Chiki,
    66 67            Cyrillic_Ext_C, Sundanese_Sup, Vedic_Ext, Phonetic_Ext,
     
    99 100            Mahajani, Sharada, Sinhala_Archaic_Numbers, Khojki, Multani,
    100 101            Khudawadi, Grantha, Newa, Tirhuta, Siddham, Modi, Mongolian_Sup,
    101             Takri, Ahom, Warang_Citi, Pau_Cin_Hau, Bhaiksuki, Marchen,
    102             Cuneiform, Cuneiform_Numbers, Early_Dynastic_Cuneiform,
     102            Takri, Ahom, Warang_Citi, Zanabazar_Square, Soyombo,
     103            Pau_Cin_Hau, Bhaiksuki, Marchen, Masaram_Gondi, Cuneiform,
     104            Cuneiform_Numbers, Early_Dynastic_Cuneiform,
    103 105            Egyptian_Hieroglyphs, Anatolian_Hieroglyphs, Bamum_Sup, Mro,
    104 106            Bassa_Vah, Pahawh_Hmong, Miao, Ideographic_Symbols, Tangut,
    105             Tangut_Components, Kana_Sup, Duployan,
     107            Tangut_Components, Kana_Sup, Kana_Ext_A, Nushu, Duployan,
    106 108            Shorthand_Format_Controls, Byzantine_Music, Music,
    107 109            Ancient_Greek_Music, Tai_Xuan_Jing, Counting_Rod, Math_Alphanum,
     
    112 114            Transport_And_Map, Alchemical, Geometric_Shapes_Ext,
    113 115            Sup_Arrows_C, Sup_Symbols_And_Pictographs, CJK_Ext_B, CJK_Ext_C,
    114             CJK_Ext_D, CJK_Ext_E, CJK_Compat_Ideographs_Sup, Tags, VS_Sup,
    115             Sup_PUA_A, Sup_PUA_B};
     116            CJK_Ext_D, CJK_Ext_E, CJK_Ext_F, CJK_Compat_Ideographs_Sup,
     117            Tags, VS_Sup, Sup_PUA_A, Sup_PUA_B};
    116 118        const static std::vector<std::string> enum_names = {
    117 119            "NB", "ASCII", "Latin_1_Sup", "Latin_Ext_A", "Latin_Ext_B",
     
    119 121            "Cyrillic", "Cyrillic_Sup", "Armenian", "Hebrew", "Arabic",
    120 122            "Syriac", "Arabic_Sup", "Thaana", "NKo", "Samaritan", "Mandaic",
    121             "Arabic_Ext_A", "Devanagari", "Bengali", "Gurmukhi", "Gujarati",
    122             "Oriya", "Tamil", "Telugu", "Kannada", "Malayalam", "Sinhala",
    123             "Thai", "Lao", "Tibetan", "Myanmar", "Georgian", "Jamo",
    124             "Ethiopic", "Ethiopic_Sup", "Cherokee", "UCAS", "Ogham",
    125             "Runic", "Tagalog", "Hanunoo", "Buhid", "Tagbanwa", "Khmer",
    126             "Mongolian", "UCAS_Ext", "Limbu", "Tai_Le", "New_Tai_Lue",
    127             "Khmer_Symbols", "Buginese", "Tai_Tham", "Diacriticals_Ext",
    128             "Balinese", "Sundanese", "Batak", "Lepcha", "Ol_Chiki",
    129             "Cyrillic_Ext_C", "Sundanese_Sup", "Vedic_Ext", "Phonetic_Ext",
    130             "Phonetic_Ext_Sup", "Diacriticals_Sup", "Latin_Ext_Additional",
    131             "Greek_Ext", "Punctuation", "Super_And_Sub", "Currency_Symbols",
    132             "Diacriticals_For_Symbols", "Letterlike_Symbols",
    133             "Number_Forms", "Arrows", "Math_Operators", "Misc_Technical",
    134             "Control_Pictures", "OCR", "Enclosed_Alphanum", "Box_Drawing",
    135             "Block_Elements", "Geometric_Shapes", "Misc_Symbols",
    136             "Dingbats", "Misc_Math_Symbols_A", "Sup_Arrows_A", "Braille",
     123            "Syriac_Sup", "Arabic_Ext_A", "Devanagari", "Bengali",
     124            "Gurmukhi", "Gujarati", "Oriya", "Tamil", "Telugu", "Kannada",
     125            "Malayalam", "Sinhala", "Thai", "Lao", "Tibetan", "Myanmar",
     126            "Georgian", "Jamo", "Ethiopic", "Ethiopic_Sup", "Cherokee",
     127            "UCAS", "Ogham", "Runic", "Tagalog", "Hanunoo", "Buhid",
     128            "Tagbanwa", "Khmer", "Mongolian", "UCAS_Ext", "Limbu", "Tai_Le",
     129            "New_Tai_Lue", "Khmer_Symbols", "Buginese", "Tai_Tham",
     130            "Diacriticals_Ext", "Balinese", "Sundanese", "Batak", "Lepcha",
     131            "Ol_Chiki", "Cyrillic_Ext_C", "Sundanese_Sup", "Vedic_Ext",
     132            "Phonetic_Ext", "Phonetic_Ext_Sup", "Diacriticals_Sup",
     133            "Latin_Ext_Additional", "Greek_Ext", "Punctuation",
     134            "Super_And_Sub", "Currency_Symbols", "Diacriticals_For_Symbols",
     135            "Letterlike_Symbols", "Number_Forms", "Arrows",
     136            "Math_Operators", "Misc_Technical", "Control_Pictures", "OCR",
     137            "Enclosed_Alphanum", "Box_Drawing", "Block_Elements",
     138            "Geometric_Shapes", "Misc_Symbols", "Dingbats",
     139            "Misc_Math_Symbols_A", "Sup_Arrows_A", "Braille",
    137 140            "Sup_Arrows_B", "Misc_Math_Symbols_B", "Sup_Math_Operators",
    138 141            "Misc_Arrows", "Glagolitic", "Latin_Ext_C", "Coptic",
     
    168 171            "Sharada", "Sinhala_Archaic_Numbers", "Khojki", "Multani",
    169 172            "Khudawadi", "Grantha", "Newa", "Tirhuta", "Siddham", "Modi",
    170             "Mongolian_Sup", "Takri", "Ahom", "Warang_Citi", "Pau_Cin_Hau",
    171             "Bhaiksuki", "Marchen", "Cuneiform", "Cuneiform_Numbers",
     173            "Mongolian_Sup", "Takri", "Ahom", "Warang_Citi",
     174            "Zanabazar_Square", "Soyombo", "Pau_Cin_Hau", "Bhaiksuki",
     175            "Marchen", "Masaram_Gondi", "Cuneiform", "Cuneiform_Numbers",
    172 176            "Early_Dynastic_Cuneiform", "Egyptian_Hieroglyphs",
    173 177            "Anatolian_Hieroglyphs", "Bamum_Sup", "Mro", "Bassa_Vah",
    174 178            "Pahawh_Hmong", "Miao", "Ideographic_Symbols", "Tangut",
    175             "Tangut_Components", "Kana_Sup", "Duployan",
    176             "Shorthand_Format_Controls", "Byzantine_Music", "Music",
    177             "Ancient_Greek_Music", "Tai_Xuan_Jing", "Counting_Rod",
     179            "Tangut_Components", "Kana_Sup", "Kana_Ext_A", "Nushu",
     180            "Duployan", "Shorthand_Format_Controls", "Byzantine_Music",
     181            "Music", "Ancient_Greek_Music", "Tai_Xuan_Jing", "Counting_Rod",
    178 182            "Math_Alphanum", "Sutton_SignWriting", "Glagolitic_Sup",
    179 183            "Mende_Kikakui", "Adlam", "Arabic_Math", "Mahjong", "Domino",
     
    183 187            "Geometric_Shapes_Ext", "Sup_Arrows_C",
    184 188            "Sup_Symbols_And_Pictographs", "CJK_Ext_B", "CJK_Ext_C",
    185             "CJK_Ext_D", "CJK_Ext_E", "CJK_Compat_Ideographs_Sup", "Tags",
    186             "VS_Sup", "Sup_PUA_A", "Sup_PUA_B"};
     189            "CJK_Ext_D", "CJK_Ext_E", "CJK_Ext_F",
     190            "CJK_Compat_Ideographs_Sup", "Tags", "VS_Sup", "Sup_PUA_A",
     191            "Sup_PUA_B"};
    187 192        const static std::vector<std::string> value_names = {
    188 193            "No_Block", "Basic_Latin", "Latin_1_Supplement",
     
    191 196            "Greek_And_Coptic", "Cyrillic", "Cyrillic_Supplement",
    192 197            "Armenian", "Hebrew", "Arabic", "Syriac", "Arabic_Supplement",
    193             "Thaana", "NKo", "Samaritan", "Mandaic", "Arabic_Extended_A",
    194             "Devanagari", "Bengali", "Gurmukhi", "Gujarati", "Oriya",
    195             "Tamil", "Telugu", "Kannada", "Malayalam", "Sinhala", "Thai",
    196             "Lao", "Tibetan", "Myanmar", "Georgian", "Hangul_Jamo",
    197             "Ethiopic", "Ethiopic_Supplement", "Cherokee",
     198            "Thaana", "NKo", "Samaritan", "Mandaic", "Syriac_Supplement",
     199            "Arabic_Extended_A", "Devanagari", "Bengali", "Gurmukhi",
     200            "Gujarati", "Oriya", "Tamil", "Telugu", "Kannada", "Malayalam",
     201            "Sinhala", "Thai", "Lao", "Tibetan", "Myanmar", "Georgian",
     202            "Hangul_Jamo", "Ethiopic", "Ethiopic_Supplement", "Cherokee",
    198 203            "Unified_Canadian_Aboriginal_Syllabics", "Ogham", "Runic",
    199 204            "Tagalog", "Hanunoo", "Buhid", "Tagbanwa", "Khmer", "Mongolian",
     
    260 265            "Khojki", "Multani", "Khudawadi", "Grantha", "Newa", "Tirhuta",
    261 266            "Siddham", "Modi", "Mongolian_Supplement", "Takri", "Ahom",
    262             "Warang_Citi", "Pau_Cin_Hau", "Bhaiksuki", "Marchen",
    263             "Cuneiform", "Cuneiform_Numbers_And_Punctuation",
    264             "Early_Dynastic_Cuneiform", "Egyptian_Hieroglyphs",
    265             "Anatolian_Hieroglyphs", "Bamum_Supplement", "Mro", "Bassa_Vah",
    266             "Pahawh_Hmong", "Miao", "Ideographic_Symbols_And_Punctuation",
    267             "Tangut", "Tangut_Components", "Kana_Supplement", "Duployan",
    268             "Shorthand_Format_Controls", "Byzantine_Musical_Symbols",
    269             "Musical_Symbols", "Ancient_Greek_Musical_Notation",
    270             "Tai_Xuan_Jing_Symbols", "Counting_Rod_Numerals",
    271             "Mathematical_Alphanumeric_Symbols", "Sutton_SignWriting",
    272             "Glagolitic_Supplement", "Mende_Kikakui", "Adlam",
    273             "Arabic_Mathematical_Alphabetic_Symbols", "Mahjong_Tiles",
    274             "Domino_Tiles", "Playing_Cards",
     267            "Warang_Citi", "Zanabazar_Square", "Soyombo", "Pau_Cin_Hau",
     268            "Bhaiksuki", "Marchen", "Masaram_Gondi", "Cuneiform",
     269            "Cuneiform_Numbers_And_Punctuation", "Early_Dynastic_Cuneiform",
     270            "Egyptian_Hieroglyphs", "Anatolian_Hieroglyphs",
     271            "Bamum_Supplement", "Mro", "Bassa_Vah", "Pahawh_Hmong", "Miao",
     272            "Ideographic_Symbols_And_Punctuation", "Tangut",
     273            "Tangut_Components", "Kana_Supplement", "Kana_Extended_A",
     274            "Nushu", "Duployan", "Shorthand_Format_Controls",
     275            "Byzantine_Musical_Symbols", "Musical_Symbols",
     276            "Ancient_Greek_Musical_Notation", "Tai_Xuan_Jing_Symbols",
     277            "Counting_Rod_Numerals", "Mathematical_Alphanumeric_Symbols",
     278            "Sutton_SignWriting", "Glagolitic_Supplement", "Mende_Kikakui",
     279            "Adlam", "Arabic_Mathematical_Alphabetic_Symbols",
     280            "Mahjong_Tiles", "Domino_Tiles", "Playing_Cards",
    275 281            "Enclosed_Alphanumeric_Supplement",
    276 282            "Enclosed_Ideographic_Supplement",
     
    283 289            "CJK_Unified_Ideographs_Extension_D",
    284 290            "CJK_Unified_Ideographs_Extension_E",
     291            "CJK_Unified_Ideographs_Extension_F",
    285 292            "CJK_Compatibility_Ideographs_Supplement", "Tags",
    286 293            "Variation_Selectors_Supplement",
     
    309 316            Lina, Mahj, Mani, Mend, Modi, Mroo, Narb, Nbat, Palm, Pauc,
    310 317            Perm, Phlp, Sidd, Sind, Tirh, Wara, Ahom, Hluw, Hatr, Mult,
    311             Hung, Sgnw, Adlm, Bhks, Marc, Newa, Osge, Tang, Hrkt};
     318            Hung, Sgnw, Adlm, Bhks, Marc, Newa, Osge, Tang, Gonm, Nshu,
     319            Soyo, Zanb, Hrkt};
    312 320        const static std::vector<std::string> enum_names = {
    313 321            "Zzzz", "Zyyy", "Latn", "Grek", "Cyrl", "Armn", "Hebr", "Arab",
     
    328 336            "Perm", "Phlp", "Sidd", "Sind", "Tirh", "Wara", "Ahom", "Hluw",
    329 337            "Hatr", "Mult", "Hung", "Sgnw", "Adlm", "Bhks", "Marc", "Newa",
    330             "Osge", "Tang", "Hrkt"};
     338            "Osge", "Tang", "Gonm", "Nshu", "Soyo", "Zanb", "Hrkt"};
    331 339        const static std::vector<std::string> value_names = {
    332 340            "Unknown", "Common", "Latin", "Greek", "Cyrillic", "Armenian",
     
    359 367            "Hatran", "Multani", "Old_Hungarian", "SignWriting", "Adlam",
    360 368            "Bhaiksuki", "Marchen", "Newa", "Osage", "Tangut",
     369            "Masaram_Gondi", "Nushu", "Soyombo", "Zanabazar_Square",
    361 370            "Katakana_Or_Hiragana"};
    362 371        static std::unordered_map<std::string, int> aliases_only_map {{
     
    546 555            NA, Right, Left, Visual_Order_Left, Left_And_Right, Top, Bottom,
    547 556            Top_And_Bottom, Top_And_Right, Top_And_Left,
    548             Top_And_Left_And_Right, Bottom_And_Right,
     557            Top_And_Left_And_Right, Bottom_And_Right, Bottom_And_Left,
    549 558            Top_And_Bottom_And_Right, Overstruck};
    550 559        const static std::vector<std::string> enum_names = {
     
    552 561            "Top", "Bottom", "Top_And_Bottom", "Top_And_Right",
    553 562            "Top_And_Left", "Top_And_Left_And_Right", "Bottom_And_Right",
    554             "Top_And_Bottom_And_Right", "Overstruck"};
     563            "Bottom_And_Left", "Top_And_Bottom_And_Right", "Overstruck"};
    555 564        const static std::vector<std::string> value_names = {
    556 565            "NA", "Right", "Left", "Visual_Order_Left", "Left_And_Right",
    557 566            "Top", "Bottom", "Top_And_Bottom", "Top_And_Right",
    558 567            "Top_And_Left", "Top_And_Left_And_Right", "Bottom_And_Right",
    559             "Top_And_Bottom_And_Right", "Overstruck"};
     568            "Bottom_And_Left", "Top_And_Bottom_And_Right", "Overstruck"};
    560 569        static std::unordered_map<std::string, int> aliases_only_map {{
    561 570            }};
     
    620 629            Manichaean_Teth, Manichaean_Thamedh, Manichaean_Twenty,
    621 630            Manichaean_Waw, Manichaean_Yodh, Manichaean_Zayin, African_Feh,
    622             African_Qaf, African_Noon};
     631            African_Qaf, African_Noon, Malayalam_Nga, Malayalam_Ja,
     632            Malayalam_Nya, Malayalam_Tta, Malayalam_Nna, Malayalam_Nnna,
     633            Malayalam_Bha, Malayalam_Ra, Malayalam_Lla, Malayalam_Llla,
     634            Malayalam_Ssa};
    623 635        const static std::vector<std::string> enum_names = {
    624 636            "No_Joining_Group", "Ain", "Alaph", "Alef", "Beh", "Beth",
     
    641 653            "Manichaean_Thamedh", "Manichaean_Twenty", "Manichaean_Waw",
    642 654            "Manichaean_Yodh", "Manichaean_Zayin", "African_Feh",
    643             "African_Qaf", "African_Noon"};
     655            "African_Qaf", "African_Noon", "Malayalam_Nga", "Malayalam_Ja",
     656            "Malayalam_Nya", "Malayalam_Tta", "Malayalam_Nna",
     657            "Malayalam_Nnna", "Malayalam_Bha", "Malayalam_Ra",
     658            "Malayalam_Lla", "Malayalam_Llla", "Malayalam_Ssa"};
    644 659        const static std::vector<std::string> value_names = {
    645 660            "No_Joining_Group", "Ain", "Alaph", "Alef", "Beh", "Beth",
     
    662 677            "Manichaean_Thamedh", "Manichaean_Twenty", "Manichaean_Waw",
    663 678            "Manichaean_Yodh", "Manichaean_Zayin", "African_Feh",
    664             "African_Qaf", "African_Noon"};
     679            "African_Qaf", "African_Noon", "Malayalam_Nga", "Malayalam_Ja",
     680            "Malayalam_Nya", "Malayalam_Tta", "Malayalam_Nna",
     681            "Malayalam_Nnna", "Malayalam_Bha", "Malayalam_Ra",
     682            "Malayalam_Lla", "Malayalam_Llla", "Malayalam_Ssa"};
    665 683        static std::unordered_map<std::string, int> aliases_only_map {{
    666 684            }};
     
    775 793    }
    776 794
     795    namespace VO_ns {
     796        enum value_t {
     797            R, U, Tr, Tu};
     798        const static std::vector<std::string> enum_names = {
     799            "R", "U", "Tr", "Tu"};
     800        const static std::vector<std::string> value_names = {
     801            "Rotated", "Upright", "Transformed_Rotated",
     802            "Transformed_Upright"};
     803        static std::unordered_map<std::string, int> aliases_only_map {{
     804            }};
     805    }
     806
    777 807    namespace WB_ns {
    778 808        enum value_t {
Note: See TracChangeset for help on using the changeset viewer.