ICU 62.1
uchar.h
Go to the documentation of this file.
1 // © 2016 and later: Unicode, Inc. and others.
2 // License & terms of use: http://www.unicode.org/copyright.html
3 /*
4 **********************************************************************
5 * Copyright (C) 1997-2016, International Business Machines
6 * Corporation and others. All Rights Reserved.
7 **********************************************************************
8 *
9 * File UCHAR.H
10 *
11 * Modification History:
12 *
13 * Date Name Description
14 * 04/02/97 aliu Creation.
15 * 03/29/99 helena Updated for C APIs.
16 * 4/15/99 Madhu Updated for C Implementation and Javadoc
17 * 5/20/99 Madhu Added the function u_getVersion()
18 * 8/19/1999 srl Upgraded scripts to Unicode 3.0
19 * 8/27/1999 schererm UCharDirection constants: U_...
20 * 11/11/1999 weiv added u_isalnum(), cleaned comments
21 * 01/11/2000 helena Renamed u_getVersion to u_getUnicodeVersion().
22 ******************************************************************************
23 */
24 
25 #ifndef UCHAR_H
26 #define UCHAR_H
27 
28 #include "unicode/utypes.h"
29 #include "unicode/stringoptions.h"
30 
32 
33 /*==========================================================================*/
34 /* Unicode version number */
35 /*==========================================================================*/
/* Unicode version number, as a string literal ("11.0"). */
45 #define U_UNICODE_VERSION "11.0"
46 
/* Lower bound constant: 0. Presumably the smallest code point value -- confirm against the elided API comment. */
127 #define UCHAR_MIN_VALUE 0
128 
/* Upper bound constant: 0x10ffff, the last Unicode code point (U+10FFFF). */
137 #define UCHAR_MAX_VALUE 0x10ffff
138 
/*
 * Build a single-bit mask: expands to a uint32_t with only bit number x set.
 * x must be in 0..31; shifting a 32-bit value by a negative amount or by
 * 32 or more is undefined behavior in C. The argument is expanded once.
 */
143 #define U_MASK(x) ((uint32_t)1<<(x))
144 
/*
 * Selector constants for Unicode properties; this is the parameter type of
 * u_getPropertyName() and the return type of u_getPropertyEnum().
 * NOTE(review): most enumerators are missing from this listing. Only
 * UCHAR_BLOCK (0x1001), UCHAR_SCRIPT (0x100A), UCHAR_AGE (0x4000) and
 * UCHAR_NAME (0x4005) are visible, and every U_HIDE_DEPRECATED_API section
 * below is empty here. Consult the real header before relying on any
 * enumerator or value that is not shown.
 */
165 typedef enum UProperty {
166  /*
167  * Note: UProperty constants are parsed by preparseucd.py.
168  * It matches lines like
169  * UCHAR_<Unicode property name>=<integer>,
170  */
171 
172  /* Note: Place UCHAR_ALPHABETIC before UCHAR_BINARY_START so that
173  debuggers display UCHAR_ALPHABETIC as the symbolic name for 0,
174  rather than UCHAR_BINARY_START. Likewise for other *_START
175  identifiers. */
176 
456 #ifndef U_HIDE_DEPRECATED_API
457 
462 #endif // U_HIDE_DEPRECATED_API
463 
471  UCHAR_BLOCK=0x1001,
499  UCHAR_SCRIPT=0x100A,
549 #ifndef U_HIDE_DEPRECATED_API
550 
555 #endif // U_HIDE_DEPRECATED_API
556 
568 #ifndef U_HIDE_DEPRECATED_API
569 
574 #endif // U_HIDE_DEPRECATED_API
575 
581 #ifndef U_HIDE_DEPRECATED_API
582 
587 #endif // U_HIDE_DEPRECATED_API
588 
591  UCHAR_AGE=0x4000,
600 #ifndef U_HIDE_DEPRECATED_API
601 
604 #endif /* U_HIDE_DEPRECATED_API */
605 
610  UCHAR_NAME=0x4005,
626 #ifndef U_HIDE_DEPRECATED_API
627 
632 #endif /* U_HIDE_DEPRECATED_API */
633 
639 #ifndef U_HIDE_DEPRECATED_API
640 
645 #endif // U_HIDE_DEPRECATED_API
646 
655 #ifndef U_HIDE_DEPRECATED_API
656 
661 #endif // U_HIDE_DEPRECATED_API
662 
665 } UProperty;
666 
/*
 * Enumeration of Unicode General_Category values; it is the type of the
 * `type` argument passed to UCharEnumTypeRange callbacks.
 * NOTE(review): the enumerator lines (listing lines 681-750) are not shown
 * here, so names and integer values must be taken from the real header.
 */
672 typedef enum UCharCategory
673 {
674  /*
675  * Note: UCharCategory constants and their API comments are parsed by preparseucd.py.
676  * It matches pairs of lines like
677  * / ** <Unicode 2-letter General_Category value> comment... * /
678  * U_<[A-Z_]+> = <integer>,
679  */
680 
751 } UCharCategory;
752 
/*
 * Single-category masks. Each U_GC_XX_MASK is U_MASK() applied to one U_...
 * category constant, i.e. a uint32_t with exactly that constant's bit set.
 * The constants themselves are not defined in the lines shown here;
 * presumably they are UCharCategory enumerators and XX is the two-letter
 * General_Category short name (e.g. ME for U_ENCLOSING_MARK) -- confirm.
 * These masks are directly comparable with U_GET_GC_MASK(c), which is
 * defined as U_MASK(u_charType(c)).
 */
767 #define U_GC_CN_MASK U_MASK(U_GENERAL_OTHER_TYPES)
768 
770 #define U_GC_LU_MASK U_MASK(U_UPPERCASE_LETTER)
771 
772 #define U_GC_LL_MASK U_MASK(U_LOWERCASE_LETTER)
773 
774 #define U_GC_LT_MASK U_MASK(U_TITLECASE_LETTER)
775 
776 #define U_GC_LM_MASK U_MASK(U_MODIFIER_LETTER)
777 
778 #define U_GC_LO_MASK U_MASK(U_OTHER_LETTER)
779 
781 #define U_GC_MN_MASK U_MASK(U_NON_SPACING_MARK)
782 
783 #define U_GC_ME_MASK U_MASK(U_ENCLOSING_MARK)
784 
785 #define U_GC_MC_MASK U_MASK(U_COMBINING_SPACING_MARK)
786 
788 #define U_GC_ND_MASK U_MASK(U_DECIMAL_DIGIT_NUMBER)
789 
790 #define U_GC_NL_MASK U_MASK(U_LETTER_NUMBER)
791 
792 #define U_GC_NO_MASK U_MASK(U_OTHER_NUMBER)
793 
795 #define U_GC_ZS_MASK U_MASK(U_SPACE_SEPARATOR)
796 
797 #define U_GC_ZL_MASK U_MASK(U_LINE_SEPARATOR)
798 
799 #define U_GC_ZP_MASK U_MASK(U_PARAGRAPH_SEPARATOR)
800 
802 #define U_GC_CC_MASK U_MASK(U_CONTROL_CHAR)
803 
804 #define U_GC_CF_MASK U_MASK(U_FORMAT_CHAR)
805 
806 #define U_GC_CO_MASK U_MASK(U_PRIVATE_USE_CHAR)
807 
808 #define U_GC_CS_MASK U_MASK(U_SURROGATE)
809 
811 #define U_GC_PD_MASK U_MASK(U_DASH_PUNCTUATION)
812 
813 #define U_GC_PS_MASK U_MASK(U_START_PUNCTUATION)
814 
815 #define U_GC_PE_MASK U_MASK(U_END_PUNCTUATION)
816 
817 #define U_GC_PC_MASK U_MASK(U_CONNECTOR_PUNCTUATION)
818 
819 #define U_GC_PO_MASK U_MASK(U_OTHER_PUNCTUATION)
820 
822 #define U_GC_SM_MASK U_MASK(U_MATH_SYMBOL)
823 
824 #define U_GC_SC_MASK U_MASK(U_CURRENCY_SYMBOL)
825 
826 #define U_GC_SK_MASK U_MASK(U_MODIFIER_SYMBOL)
827 
828 #define U_GC_SO_MASK U_MASK(U_OTHER_SYMBOL)
829 
831 #define U_GC_PI_MASK U_MASK(U_INITIAL_PUNCTUATION)
832 
833 #define U_GC_PF_MASK U_MASK(U_FINAL_PUNCTUATION)
834 
835 
/*
 * Composite masks: each one is the bitwise OR of several single-category
 * U_GC_XX_MASK values, so `mask & U_GC_x_MASK` is non-zero when any of the
 * listed categories is present in `mask`.
 */
/* Letters: LU | LL | LT | LM | LO. */
837 #define U_GC_L_MASK \
838  (U_GC_LU_MASK|U_GC_LL_MASK|U_GC_LT_MASK|U_GC_LM_MASK|U_GC_LO_MASK)
839 
/* Cased letters only: LU | LL | LT (a subset of U_GC_L_MASK). */
841 #define U_GC_LC_MASK \
842  (U_GC_LU_MASK|U_GC_LL_MASK|U_GC_LT_MASK)
843 
/* Marks: MN | ME | MC. */
845 #define U_GC_M_MASK (U_GC_MN_MASK|U_GC_ME_MASK|U_GC_MC_MASK)
846 
/* Numbers: ND | NL | NO. */
848 #define U_GC_N_MASK (U_GC_ND_MASK|U_GC_NL_MASK|U_GC_NO_MASK)
849 
/* Separators: ZS | ZL | ZP. */
851 #define U_GC_Z_MASK (U_GC_ZS_MASK|U_GC_ZL_MASK|U_GC_ZP_MASK)
852 
/* "Other" group: CN | CC | CF | CO | CS. Note that CN is included. */
854 #define U_GC_C_MASK \
855  (U_GC_CN_MASK|U_GC_CC_MASK|U_GC_CF_MASK|U_GC_CO_MASK|U_GC_CS_MASK)
856 
/* Punctuation: PD | PS | PE | PC | PO | PI | PF. */
858 #define U_GC_P_MASK \
859  (U_GC_PD_MASK|U_GC_PS_MASK|U_GC_PE_MASK|U_GC_PC_MASK|U_GC_PO_MASK| \
860  U_GC_PI_MASK|U_GC_PF_MASK)
861 
/* Symbols: SM | SC | SK | SO. */
863 #define U_GC_S_MASK (U_GC_SM_MASK|U_GC_SC_MASK|U_GC_SK_MASK|U_GC_SO_MASK)
864 
869 typedef enum UCharDirection {
870  /*
871  * Note: UCharDirection constants and their API comments are parsed by preparseucd.py.
872  * It matches pairs of lines like
873  * / ** <Unicode 1..3-letter Bidi_Class value> comment... * /
874  * U_<[A-Z_]+> = <integer>,
875  */
876 
923 #ifndef U_HIDE_DEPRECATED_API
924 
931 #endif // U_HIDE_DEPRECATED_API
933 
941  /*
942  * Note: UBidiPairedBracketType constants are parsed by preparseucd.py.
943  * It matches lines like
944  * U_BPT_<Unicode Bidi_Paired_Bracket_Type value name>
945  */
946 
953 #ifndef U_HIDE_DEPRECATED_API
954 
960  U_BPT_COUNT /* 3 */
961 #endif // U_HIDE_DEPRECATED_API
963 
969  /*
970  * Note: UBlockCode constants are parsed by preparseucd.py.
971  * It matches lines like
972  * UBLOCK_<Unicode Block value name> = <integer>,
973  */
974 
976  UBLOCK_NO_BLOCK = 0, /*[none]*/ /* Special range indicating No_Block */
977 
979  UBLOCK_BASIC_LATIN = 1, /*[0000]*/
980 
983 
985  UBLOCK_LATIN_EXTENDED_A =3, /*[0100]*/
986 
988  UBLOCK_LATIN_EXTENDED_B =4, /*[0180]*/
989 
991  UBLOCK_IPA_EXTENSIONS =5, /*[0250]*/
992 
995 
998 
1003  UBLOCK_GREEK =8, /*[0370]*/
1004 
1006  UBLOCK_CYRILLIC =9, /*[0400]*/
1007 
1009  UBLOCK_ARMENIAN =10, /*[0530]*/
1010 
1012  UBLOCK_HEBREW =11, /*[0590]*/
1013 
1015  UBLOCK_ARABIC =12, /*[0600]*/
1016 
1018  UBLOCK_SYRIAC =13, /*[0700]*/
1019 
1021  UBLOCK_THAANA =14, /*[0780]*/
1022 
1024  UBLOCK_DEVANAGARI =15, /*[0900]*/
1025 
1027  UBLOCK_BENGALI =16, /*[0980]*/
1028 
1030  UBLOCK_GURMUKHI =17, /*[0A00]*/
1031 
1033  UBLOCK_GUJARATI =18, /*[0A80]*/
1034 
1036  UBLOCK_ORIYA =19, /*[0B00]*/
1037 
1039  UBLOCK_TAMIL =20, /*[0B80]*/
1040 
1042  UBLOCK_TELUGU =21, /*[0C00]*/
1043 
1045  UBLOCK_KANNADA =22, /*[0C80]*/
1046 
1048  UBLOCK_MALAYALAM =23, /*[0D00]*/
1049 
1051  UBLOCK_SINHALA =24, /*[0D80]*/
1052 
1054  UBLOCK_THAI =25, /*[0E00]*/
1055 
1057  UBLOCK_LAO =26, /*[0E80]*/
1058 
1060  UBLOCK_TIBETAN =27, /*[0F00]*/
1061 
1063  UBLOCK_MYANMAR =28, /*[1000]*/
1064 
1066  UBLOCK_GEORGIAN =29, /*[10A0]*/
1067 
1069  UBLOCK_HANGUL_JAMO =30, /*[1100]*/
1070 
1072  UBLOCK_ETHIOPIC =31, /*[1200]*/
1073 
1075  UBLOCK_CHEROKEE =32, /*[13A0]*/
1076 
1079 
1081  UBLOCK_OGHAM =34, /*[1680]*/
1082 
1084  UBLOCK_RUNIC =35, /*[16A0]*/
1085 
1087  UBLOCK_KHMER =36, /*[1780]*/
1088 
1090  UBLOCK_MONGOLIAN =37, /*[1800]*/
1091 
1094 
1096  UBLOCK_GREEK_EXTENDED =39, /*[1F00]*/
1097 
1100 
1103 
1105  UBLOCK_CURRENCY_SYMBOLS =42, /*[20A0]*/
1106 
1112 
1115 
1117  UBLOCK_NUMBER_FORMS =45, /*[2150]*/
1118 
1120  UBLOCK_ARROWS =46, /*[2190]*/
1121 
1124 
1127 
1129  UBLOCK_CONTROL_PICTURES =49, /*[2400]*/
1130 
1133 
1136 
1138  UBLOCK_BOX_DRAWING =52, /*[2500]*/
1139 
1141  UBLOCK_BLOCK_ELEMENTS =53, /*[2580]*/
1142 
1144  UBLOCK_GEOMETRIC_SHAPES =54, /*[25A0]*/
1145 
1148 
1150  UBLOCK_DINGBATS =56, /*[2700]*/
1151 
1153  UBLOCK_BRAILLE_PATTERNS =57, /*[2800]*/
1154 
1157 
1159  UBLOCK_KANGXI_RADICALS =59, /*[2F00]*/
1160 
1163 
1166 
1168  UBLOCK_HIRAGANA =62, /*[3040]*/
1169 
1171  UBLOCK_KATAKANA =63, /*[30A0]*/
1172 
1174  UBLOCK_BOPOMOFO =64, /*[3100]*/
1175 
1178 
1180  UBLOCK_KANBUN =66, /*[3190]*/
1181 
1184 
1187 
1190 
1193 
1196 
1198  UBLOCK_YI_SYLLABLES =72, /*[A000]*/
1199 
1201  UBLOCK_YI_RADICALS =73, /*[A490]*/
1202 
1204  UBLOCK_HANGUL_SYLLABLES =74, /*[AC00]*/
1205 
1207  UBLOCK_HIGH_SURROGATES =75, /*[D800]*/
1208 
1211 
1213  UBLOCK_LOW_SURROGATES =77, /*[DC00]*/
1214 
1224  UBLOCK_PRIVATE_USE_AREA =78, /*[E000]*/
1235 
1238 
1241 
1244 
1247 
1250 
1253 
1256 
1258  UBLOCK_SPECIALS =86, /*[FFF0]*/
1259 
1262 
1263  /* New blocks in Unicode 3.1 */
1264 
1266  UBLOCK_OLD_ITALIC = 88, /*[10300]*/
1268  UBLOCK_GOTHIC = 89, /*[10330]*/
1270  UBLOCK_DESERET = 90, /*[10400]*/
1274  UBLOCK_MUSICAL_SYMBOLS = 92, /*[1D100]*/
1282  UBLOCK_TAGS = 96, /*[E0000]*/
1283 
1284  /* New blocks in Unicode 3.2 */
1285 
1294  UBLOCK_TAGALOG = 98, /*[1700]*/
1296  UBLOCK_HANUNOO = 99, /*[1720]*/
1298  UBLOCK_BUHID = 100, /*[1740]*/
1300  UBLOCK_TAGBANWA = 101, /*[1760]*/
1314  UBLOCK_VARIATION_SELECTORS = 108, /*[FE00]*/
1319 
1320  /* New blocks in Unicode 4 */
1321 
1323  UBLOCK_LIMBU = 111, /*[1900]*/
1325  UBLOCK_TAI_LE = 112, /*[1950]*/
1327  UBLOCK_KHMER_SYMBOLS = 113, /*[19E0]*/
1329  UBLOCK_PHONETIC_EXTENSIONS = 114, /*[1D00]*/
1335  UBLOCK_LINEAR_B_SYLLABARY = 117, /*[10000]*/
1337  UBLOCK_LINEAR_B_IDEOGRAMS = 118, /*[10080]*/
1339  UBLOCK_AEGEAN_NUMBERS = 119, /*[10100]*/
1341  UBLOCK_UGARITIC = 120, /*[10380]*/
1343  UBLOCK_SHAVIAN = 121, /*[10450]*/
1345  UBLOCK_OSMANYA = 122, /*[10480]*/
1347  UBLOCK_CYPRIOT_SYLLABARY = 123, /*[10800]*/
1349  UBLOCK_TAI_XUAN_JING_SYMBOLS = 124, /*[1D300]*/
1352 
1353  /* New blocks in Unicode 4.1 */
1354 
1358  UBLOCK_ANCIENT_GREEK_NUMBERS = 127, /*[10140]*/
1360  UBLOCK_ARABIC_SUPPLEMENT = 128, /*[0750]*/
1362  UBLOCK_BUGINESE = 129, /*[1A00]*/
1364  UBLOCK_CJK_STROKES = 130, /*[31C0]*/
1368  UBLOCK_COPTIC = 132, /*[2C80]*/
1370  UBLOCK_ETHIOPIC_EXTENDED = 133, /*[2D80]*/
1372  UBLOCK_ETHIOPIC_SUPPLEMENT = 134, /*[1380]*/
1374  UBLOCK_GEORGIAN_SUPPLEMENT = 135, /*[2D00]*/
1376  UBLOCK_GLAGOLITIC = 136, /*[2C00]*/
1378  UBLOCK_KHAROSHTHI = 137, /*[10A00]*/
1382  UBLOCK_NEW_TAI_LUE = 139, /*[1980]*/
1384  UBLOCK_OLD_PERSIAN = 140, /*[103A0]*/
1390  UBLOCK_SYLOTI_NAGRI = 143, /*[A800]*/
1392  UBLOCK_TIFINAGH = 144, /*[2D30]*/
1394  UBLOCK_VERTICAL_FORMS = 145, /*[FE10]*/
1395 
1396  /* New blocks in Unicode 5.0 */
1397 
1399  UBLOCK_NKO = 146, /*[07C0]*/
1401  UBLOCK_BALINESE = 147, /*[1B00]*/
1403  UBLOCK_LATIN_EXTENDED_C = 148, /*[2C60]*/
1405  UBLOCK_LATIN_EXTENDED_D = 149, /*[A720]*/
1407  UBLOCK_PHAGS_PA = 150, /*[A840]*/
1409  UBLOCK_PHOENICIAN = 151, /*[10900]*/
1411  UBLOCK_CUNEIFORM = 152, /*[12000]*/
1415  UBLOCK_COUNTING_ROD_NUMERALS = 154, /*[1D360]*/
1416 
1417  /* New blocks in Unicode 5.1 */
1418 
1420  UBLOCK_SUNDANESE = 155, /*[1B80]*/
1422  UBLOCK_LEPCHA = 156, /*[1C00]*/
1424  UBLOCK_OL_CHIKI = 157, /*[1C50]*/
1426  UBLOCK_CYRILLIC_EXTENDED_A = 158, /*[2DE0]*/
1428  UBLOCK_VAI = 159, /*[A500]*/
1430  UBLOCK_CYRILLIC_EXTENDED_B = 160, /*[A640]*/
1432  UBLOCK_SAURASHTRA = 161, /*[A880]*/
1434  UBLOCK_KAYAH_LI = 162, /*[A900]*/
1436  UBLOCK_REJANG = 163, /*[A930]*/
1438  UBLOCK_CHAM = 164, /*[AA00]*/
1440  UBLOCK_ANCIENT_SYMBOLS = 165, /*[10190]*/
1442  UBLOCK_PHAISTOS_DISC = 166, /*[101D0]*/
1444  UBLOCK_LYCIAN = 167, /*[10280]*/
1446  UBLOCK_CARIAN = 168, /*[102A0]*/
1448  UBLOCK_LYDIAN = 169, /*[10920]*/
1450  UBLOCK_MAHJONG_TILES = 170, /*[1F000]*/
1452  UBLOCK_DOMINO_TILES = 171, /*[1F030]*/
1453 
1454  /* New blocks in Unicode 5.2 */
1455 
1457  UBLOCK_SAMARITAN = 172, /*[0800]*/
1461  UBLOCK_TAI_THAM = 174, /*[1A20]*/
1463  UBLOCK_VEDIC_EXTENSIONS = 175, /*[1CD0]*/
1465  UBLOCK_LISU = 176, /*[A4D0]*/
1467  UBLOCK_BAMUM = 177, /*[A6A0]*/
1471  UBLOCK_DEVANAGARI_EXTENDED = 179, /*[A8E0]*/
1475  UBLOCK_JAVANESE = 181, /*[A980]*/
1477  UBLOCK_MYANMAR_EXTENDED_A = 182, /*[AA60]*/
1479  UBLOCK_TAI_VIET = 183, /*[AA80]*/
1481  UBLOCK_MEETEI_MAYEK = 184, /*[ABC0]*/
1485  UBLOCK_IMPERIAL_ARAMAIC = 186, /*[10840]*/
1487  UBLOCK_OLD_SOUTH_ARABIAN = 187, /*[10A60]*/
1489  UBLOCK_AVESTAN = 188, /*[10B00]*/
1493  UBLOCK_INSCRIPTIONAL_PAHLAVI = 190, /*[10B60]*/
1495  UBLOCK_OLD_TURKIC = 191, /*[10C00]*/
1497  UBLOCK_RUMI_NUMERAL_SYMBOLS = 192, /*[10E60]*/
1499  UBLOCK_KAITHI = 193, /*[11080]*/
1501  UBLOCK_EGYPTIAN_HIEROGLYPHS = 194, /*[13000]*/
1508 
1509  /* New blocks in Unicode 6.0 */
1510 
1512  UBLOCK_MANDAIC = 198, /*[0840]*/
1514  UBLOCK_BATAK = 199, /*[1BC0]*/
1516  UBLOCK_ETHIOPIC_EXTENDED_A = 200, /*[AB00]*/
1518  UBLOCK_BRAHMI = 201, /*[11000]*/
1520  UBLOCK_BAMUM_SUPPLEMENT = 202, /*[16800]*/
1522  UBLOCK_KANA_SUPPLEMENT = 203, /*[1B000]*/
1524  UBLOCK_PLAYING_CARDS = 204, /*[1F0A0]*/
1528  UBLOCK_EMOTICONS = 206, /*[1F600]*/
1532  UBLOCK_ALCHEMICAL_SYMBOLS = 208, /*[1F700]*/
1535 
1536  /* New blocks in Unicode 6.1 */
1537 
1539  UBLOCK_ARABIC_EXTENDED_A = 210, /*[08A0]*/
1543  UBLOCK_CHAKMA = 212, /*[11100]*/
1547  UBLOCK_MEROITIC_CURSIVE = 214, /*[109A0]*/
1549  UBLOCK_MEROITIC_HIEROGLYPHS = 215, /*[10980]*/
1551  UBLOCK_MIAO = 216, /*[16F00]*/
1553  UBLOCK_SHARADA = 217, /*[11180]*/
1555  UBLOCK_SORA_SOMPENG = 218, /*[110D0]*/
1559  UBLOCK_TAKRI = 220, /*[11680]*/
1560 
1561  /* New blocks in Unicode 7.0 */
1562 
1564  UBLOCK_BASSA_VAH = 221, /*[16AD0]*/
1566  UBLOCK_CAUCASIAN_ALBANIAN = 222, /*[10530]*/
1568  UBLOCK_COPTIC_EPACT_NUMBERS = 223, /*[102E0]*/
1572  UBLOCK_DUPLOYAN = 225, /*[1BC00]*/
1574  UBLOCK_ELBASAN = 226, /*[10500]*/
1578  UBLOCK_GRANTHA = 228, /*[11300]*/
1580  UBLOCK_KHOJKI = 229, /*[11200]*/
1582  UBLOCK_KHUDAWADI = 230, /*[112B0]*/
1584  UBLOCK_LATIN_EXTENDED_E = 231, /*[AB30]*/
1586  UBLOCK_LINEAR_A = 232, /*[10600]*/
1588  UBLOCK_MAHAJANI = 233, /*[11150]*/
1590  UBLOCK_MANICHAEAN = 234, /*[10AC0]*/
1592  UBLOCK_MENDE_KIKAKUI = 235, /*[1E800]*/
1594  UBLOCK_MODI = 236, /*[11600]*/
1596  UBLOCK_MRO = 237, /*[16A40]*/
1598  UBLOCK_MYANMAR_EXTENDED_B = 238, /*[A9E0]*/
1600  UBLOCK_NABATAEAN = 239, /*[10880]*/
1602  UBLOCK_OLD_NORTH_ARABIAN = 240, /*[10A80]*/
1604  UBLOCK_OLD_PERMIC = 241, /*[10350]*/
1606  UBLOCK_ORNAMENTAL_DINGBATS = 242, /*[1F650]*/
1608  UBLOCK_PAHAWH_HMONG = 243, /*[16B00]*/
1610  UBLOCK_PALMYRENE = 244, /*[10860]*/
1612  UBLOCK_PAU_CIN_HAU = 245, /*[11AC0]*/
1614  UBLOCK_PSALTER_PAHLAVI = 246, /*[10B80]*/
1618  UBLOCK_SIDDHAM = 248, /*[11580]*/
1622  UBLOCK_SUPPLEMENTAL_ARROWS_C = 250, /*[1F800]*/
1624  UBLOCK_TIRHUTA = 251, /*[11480]*/
1626  UBLOCK_WARANG_CITI = 252, /*[118A0]*/
1627 
1628  /* New blocks in Unicode 8.0 */
1629 
1631  UBLOCK_AHOM = 253, /*[11700]*/
1633  UBLOCK_ANATOLIAN_HIEROGLYPHS = 254, /*[14400]*/
1635  UBLOCK_CHEROKEE_SUPPLEMENT = 255, /*[AB70]*/
1641  UBLOCK_HATRAN = 258, /*[108E0]*/
1643  UBLOCK_MULTANI = 259, /*[11280]*/
1645  UBLOCK_OLD_HUNGARIAN = 260, /*[10C80]*/
1649  UBLOCK_SUTTON_SIGNWRITING = 262, /*[1D800]*/
1650 
1651  /* New blocks in Unicode 9.0 */
1652 
1654  UBLOCK_ADLAM = 263, /*[1E900]*/
1656  UBLOCK_BHAIKSUKI = 264, /*[11C00]*/
1658  UBLOCK_CYRILLIC_EXTENDED_C = 265, /*[1C80]*/
1660  UBLOCK_GLAGOLITIC_SUPPLEMENT = 266, /*[1E000]*/
1664  UBLOCK_MARCHEN = 268, /*[11C70]*/
1666  UBLOCK_MONGOLIAN_SUPPLEMENT = 269, /*[11660]*/
1668  UBLOCK_NEWA = 270, /*[11400]*/
1670  UBLOCK_OSAGE = 271, /*[104B0]*/
1672  UBLOCK_TANGUT = 272, /*[17000]*/
1674  UBLOCK_TANGUT_COMPONENTS = 273, /*[18800]*/
1675 
1676  // New blocks in Unicode 10.0
1677 
1681  UBLOCK_KANA_EXTENDED_A = 275, /*[1B100]*/
1683  UBLOCK_MASARAM_GONDI = 276, /*[11D00]*/
1685  UBLOCK_NUSHU = 277, /*[1B170]*/
1687  UBLOCK_SOYOMBO = 278, /*[11A50]*/
1689  UBLOCK_SYRIAC_SUPPLEMENT = 279, /*[0860]*/
1691  UBLOCK_ZANABAZAR_SQUARE = 280, /*[11A00]*/
1692 
1693  // New blocks in Unicode 11.0
1694 
1696  UBLOCK_CHESS_SYMBOLS = 281, /*[1FA00]*/
1698  UBLOCK_DOGRA = 282, /*[11800]*/
1700  UBLOCK_GEORGIAN_EXTENDED = 283, /*[1C90]*/
1702  UBLOCK_GUNJALA_GONDI = 284, /*[11D60]*/
1704  UBLOCK_HANIFI_ROHINGYA = 285, /*[10D00]*/
1706  UBLOCK_INDIC_SIYAQ_NUMBERS = 286, /*[1EC70]*/
1708  UBLOCK_MAKASAR = 287, /*[11EE0]*/
1710  UBLOCK_MAYAN_NUMERALS = 288, /*[1D2E0]*/
1712  UBLOCK_MEDEFAIDRIN = 289, /*[16E40]*/
1714  UBLOCK_OLD_SOGDIAN = 290, /*[10F00]*/
1716  UBLOCK_SOGDIAN = 291, /*[10F30]*/
1717 
1718 #ifndef U_HIDE_DEPRECATED_API
1719 
1726 #endif // U_HIDE_DEPRECATED_API
1727 
1730 };
1731 
/* Makes `UBlockCode` usable as a type name without the `enum` keyword. */
1733 typedef enum UBlockCode UBlockCode;
1734 
/*
 * Values of the Unicode East_Asian_Width property.
 * No enumerator has an explicit initializer, so they are numbered in
 * declaration order from 0 (U_EA_NEUTRAL) to 5 (U_EA_WIDE).
 * The bracketed trailing comments presumably give each value's short
 * alias -- confirm.
 * NOTE(review): the U_HIDE_DEPRECATED_API section is empty in this listing
 * (listing lines 1757-1762 are not shown).
 */
1742 typedef enum UEastAsianWidth {
1743  /*
1744  * Note: UEastAsianWidth constants are parsed by preparseucd.py.
1745  * It matches lines like
1746  * U_EA_<Unicode East_Asian_Width value name>
1747  */
1748 
1749  U_EA_NEUTRAL, /*[N]*/
1750  U_EA_AMBIGUOUS, /*[A]*/
1751  U_EA_HALFWIDTH, /*[H]*/
1752  U_EA_FULLWIDTH, /*[F]*/
1753  U_EA_NARROW, /*[Na]*/
1754  U_EA_WIDE, /*[W]*/
1755 #ifndef U_HIDE_DEPRECATED_API
1756 
1763 #endif // U_HIDE_DEPRECATED_API
1764 } UEastAsianWidth;
1765 
/*
 * Selector type used for the `nameChoice` parameter of u_charName(),
 * u_charFromName(), u_enumCharNames() and UEnumCharNamesFn callbacks.
 * NOTE(review): no enumerators are visible in this listing (lines
 * 1778-1779, 1789-1791 and the contents of both deprecated sections are
 * not shown); take the names and values from the real header.
 */
1777 typedef enum UCharNameChoice {
1780 #ifndef U_HIDE_DEPRECATED_API
1781 
1787 #endif /* U_HIDE_DEPRECATED_API */
1788 
1792 #ifndef U_HIDE_DEPRECATED_API
1793 
1798 #endif // U_HIDE_DEPRECATED_API
1799 } UCharNameChoice;
1800 
1814 typedef enum UPropertyNameChoice {
1815  U_SHORT_PROPERTY_NAME,
1816  U_LONG_PROPERTY_NAME,
1817 #ifndef U_HIDE_DEPRECATED_API
1818 
1823 #endif // U_HIDE_DEPRECATED_API
1825 
1832 typedef enum UDecompositionType {
1833  /*
1834  * Note: UDecompositionType constants are parsed by preparseucd.py.
1835  * It matches lines like
1836  * U_DT_<Unicode Decomposition_Type value name>
1837  */
1838 
1839  U_DT_NONE, /*[none]*/
1840  U_DT_CANONICAL, /*[can]*/
1841  U_DT_COMPAT, /*[com]*/
1842  U_DT_CIRCLE, /*[enc]*/
1843  U_DT_FINAL, /*[fin]*/
1844  U_DT_FONT, /*[font]*/
1845  U_DT_FRACTION, /*[fra]*/
1846  U_DT_INITIAL, /*[init]*/
1847  U_DT_ISOLATED, /*[iso]*/
1848  U_DT_MEDIAL, /*[med]*/
1849  U_DT_NARROW, /*[nar]*/
1850  U_DT_NOBREAK, /*[nb]*/
1851  U_DT_SMALL, /*[sml]*/
1852  U_DT_SQUARE, /*[sqr]*/
1853  U_DT_SUB, /*[sub]*/
1854  U_DT_SUPER, /*[sup]*/
1855  U_DT_VERTICAL, /*[vert]*/
1856  U_DT_WIDE, /*[wide]*/
1857 #ifndef U_HIDE_DEPRECATED_API
1858 
1864  U_DT_COUNT /* 18 */
1865 #endif // U_HIDE_DEPRECATED_API
1867 
/*
 * Values of the Unicode Joining_Type property.
 * Enumerators have no explicit initializers and are numbered in declaration
 * order from 0 (U_JT_NON_JOINING) to 5 (U_JT_TRANSPARENT).
 * U_JT_COUNT follows them (value 6, as its trailing comment says) but is
 * only declared when U_HIDE_DEPRECATED_API is not defined, so code built
 * with that macro cannot use it.
 */
1874 typedef enum UJoiningType {
1875  /*
1876  * Note: UJoiningType constants are parsed by preparseucd.py.
1877  * It matches lines like
1878  * U_JT_<Unicode Joining_Type value name>
1879  */
1880 
1881  U_JT_NON_JOINING, /*[U]*/
1882  U_JT_JOIN_CAUSING, /*[C]*/
1883  U_JT_DUAL_JOINING, /*[D]*/
1884  U_JT_LEFT_JOINING, /*[L]*/
1885  U_JT_RIGHT_JOINING, /*[R]*/
1886  U_JT_TRANSPARENT, /*[T]*/
1887 #ifndef U_HIDE_DEPRECATED_API
1888 
1894  U_JT_COUNT /* 6 */
1895 #endif // U_HIDE_DEPRECATED_API
1896 } UJoiningType;
1897 
/*
 * Values of the Unicode Joining_Group property, numbered implicitly in
 * declaration order starting at 0 (U_JG_NO_JOINING_GROUP).
 * U_JG_HAMZA_ON_HEH_GOAL is declared as an alias with the same value as
 * U_JG_TEH_MARBUTA_GOAL; numbering continues from that value with U_JG_HE.
 * NOTE(review): this listing is incomplete.
 *  - U_JG_TEH_MARBUTA_GOAL is used below but its own declaration (listing
 *    line 1925, between U_JG_HAH and the alias) is not shown.
 *  - Enumerators on listing lines 1963-2016 (after U_JG_ZAIN) and the
 *    contents of the deprecated section are not shown either.
 * Do not derive integer values from the visible lines alone.
 */
1904 typedef enum UJoiningGroup {
1905  /*
1906  * Note: UJoiningGroup constants are parsed by preparseucd.py.
1907  * It matches lines like
1908  * U_JG_<Unicode Joining_Group value name>
1909  */
1910 
1911  U_JG_NO_JOINING_GROUP,
1912  U_JG_AIN,
1913  U_JG_ALAPH,
1914  U_JG_ALEF,
1915  U_JG_BEH,
1916  U_JG_BETH,
1917  U_JG_DAL,
1918  U_JG_DALATH_RISH,
1919  U_JG_E,
1920  U_JG_FEH,
1921  U_JG_FINAL_SEMKATH,
1922  U_JG_GAF,
1923  U_JG_GAMAL,
1924  U_JG_HAH,
1926  U_JG_HAMZA_ON_HEH_GOAL=U_JG_TEH_MARBUTA_GOAL,
1927  U_JG_HE,
1928  U_JG_HEH,
1929  U_JG_HEH_GOAL,
1930  U_JG_HETH,
1931  U_JG_KAF,
1932  U_JG_KAPH,
1933  U_JG_KNOTTED_HEH,
1934  U_JG_LAM,
1935  U_JG_LAMADH,
1936  U_JG_MEEM,
1937  U_JG_MIM,
1938  U_JG_NOON,
1939  U_JG_NUN,
1940  U_JG_PE,
1941  U_JG_QAF,
1942  U_JG_QAPH,
1943  U_JG_REH,
1944  U_JG_REVERSED_PE,
1945  U_JG_SAD,
1946  U_JG_SADHE,
1947  U_JG_SEEN,
1948  U_JG_SEMKATH,
1949  U_JG_SHIN,
1950  U_JG_SWASH_KAF,
1951  U_JG_SYRIAC_WAW,
1952  U_JG_TAH,
1953  U_JG_TAW,
1954  U_JG_TEH_MARBUTA,
1955  U_JG_TETH,
1956  U_JG_WAW,
1957  U_JG_YEH,
1958  U_JG_YEH_BARREE,
1959  U_JG_YEH_WITH_TAIL,
1960  U_JG_YUDH,
1961  U_JG_YUDH_HE,
1962  U_JG_ZAIN,
2017 #ifndef U_HIDE_DEPRECATED_API
2018 
2025 #endif // U_HIDE_DEPRECATED_API
2026 } UJoiningGroup;
2027 
2035  /*
2036  * Note: UGraphemeClusterBreak constants are parsed by preparseucd.py.
2037  * It matches lines like
2038  * U_GCB_<Unicode Grapheme_Cluster_Break value name>
2039  */
2040 
2041  U_GCB_OTHER = 0, /*[XX]*/
2042  U_GCB_CONTROL = 1, /*[CN]*/
2043  U_GCB_CR = 2, /*[CR]*/
2044  U_GCB_EXTEND = 3, /*[EX]*/
2045  U_GCB_L = 4, /*[L]*/
2046  U_GCB_LF = 5, /*[LF]*/
2047  U_GCB_LV = 6, /*[LV]*/
2048  U_GCB_LVT = 7, /*[LVT]*/
2049  U_GCB_T = 8, /*[T]*/
2050  U_GCB_V = 9, /*[V]*/
2052  U_GCB_SPACING_MARK = 10, /*[SM]*/ /* from here on: new in Unicode 5.1/ICU 4.0 */
2054  U_GCB_PREPEND = 11, /*[PP]*/
2056  U_GCB_REGIONAL_INDICATOR = 12, /*[RI]*/ /* new in Unicode 6.2/ICU 50 */
2058  U_GCB_E_BASE = 13, /*[EB]*/ /* from here on: new in Unicode 9.0/ICU 58 */
2060  U_GCB_E_BASE_GAZ = 14, /*[EBG]*/
2062  U_GCB_E_MODIFIER = 15, /*[EM]*/
2064  U_GCB_GLUE_AFTER_ZWJ = 16, /*[GAZ]*/
2066  U_GCB_ZWJ = 17, /*[ZWJ]*/
2067 
2068 #ifndef U_HIDE_DEPRECATED_API
2069 
2076 #endif // U_HIDE_DEPRECATED_API
2078 
2086 typedef enum UWordBreakValues {
2087  /*
2088  * Note: UWordBreakValues constants are parsed by preparseucd.py.
2089  * It matches lines like
2090  * U_WB_<Unicode Word_Break value name>
2091  */
2092 
2093  U_WB_OTHER = 0, /*[XX]*/
2094  U_WB_ALETTER = 1, /*[LE]*/
2095  U_WB_FORMAT = 2, /*[FO]*/
2096  U_WB_KATAKANA = 3, /*[KA]*/
2097  U_WB_MIDLETTER = 4, /*[ML]*/
2098  U_WB_MIDNUM = 5, /*[MN]*/
2099  U_WB_NUMERIC = 6, /*[NU]*/
2100  U_WB_EXTENDNUMLET = 7, /*[EX]*/
2102  U_WB_CR = 8, /*[CR]*/ /* from here on: new in Unicode 5.1/ICU 4.0 */
2104  U_WB_EXTEND = 9, /*[Extend]*/
2106  U_WB_LF = 10, /*[LF]*/
2108  U_WB_MIDNUMLET =11, /*[MB]*/
2110  U_WB_NEWLINE =12, /*[NL]*/
2112  U_WB_REGIONAL_INDICATOR = 13, /*[RI]*/ /* new in Unicode 6.2/ICU 50 */
2114  U_WB_HEBREW_LETTER = 14, /*[HL]*/ /* from here on: new in Unicode 6.3/ICU 52 */
2116  U_WB_SINGLE_QUOTE = 15, /*[SQ]*/
2118  U_WB_DOUBLE_QUOTE = 16, /*[DQ]*/
2120  U_WB_E_BASE = 17, /*[EB]*/ /* from here on: new in Unicode 9.0/ICU 58 */
2122  U_WB_E_BASE_GAZ = 18, /*[EBG]*/
2124  U_WB_E_MODIFIER = 19, /*[EM]*/
2126  U_WB_GLUE_AFTER_ZWJ = 20, /*[GAZ]*/
2128  U_WB_ZWJ = 21, /*[ZWJ]*/
2130  U_WB_WSEGSPACE = 22, /*[WSEGSPACE]*/
2131 
2132 #ifndef U_HIDE_DEPRECATED_API
2133 
2140 #endif // U_HIDE_DEPRECATED_API
2142 
/*
 * Values of the Unicode Sentence_Break property, with explicit integer
 * values 0 (U_SB_OTHER) through 14 (U_SB_SCONTINUE).
 * Values 11..14 were added later (see the inline note on U_SB_CR).
 * The bracketed trailing comments presumably give each value's short
 * alias -- confirm.
 * NOTE(review): the U_HIDE_DEPRECATED_API section is empty in this listing
 * (listing lines 2173-2178 are not shown).
 */
2149 typedef enum USentenceBreak {
2150  /*
2151  * Note: USentenceBreak constants are parsed by preparseucd.py.
2152  * It matches lines like
2153  * U_SB_<Unicode Sentence_Break value name>
2154  */
2155 
2156  U_SB_OTHER = 0, /*[XX]*/
2157  U_SB_ATERM = 1, /*[AT]*/
2158  U_SB_CLOSE = 2, /*[CL]*/
2159  U_SB_FORMAT = 3, /*[FO]*/
2160  U_SB_LOWER = 4, /*[LO]*/
2161  U_SB_NUMERIC = 5, /*[NU]*/
2162  U_SB_OLETTER = 6, /*[LE]*/
2163  U_SB_SEP = 7, /*[SE]*/
2164  U_SB_SP = 8, /*[SP]*/
2165  U_SB_STERM = 9, /*[ST]*/
2166  U_SB_UPPER = 10, /*[UP]*/
2167  U_SB_CR = 11, /*[CR]*/ /* from here on: new in Unicode 5.1/ICU 4.0 */
2168  U_SB_EXTEND = 12, /*[EX]*/
2169  U_SB_LF = 13, /*[LF]*/
2170  U_SB_SCONTINUE = 14, /*[SC]*/
2171 #ifndef U_HIDE_DEPRECATED_API
2172 
2179 #endif // U_HIDE_DEPRECATED_API
2180 } USentenceBreak;
2181 
/*
 * Values of the Unicode Line_Break property, with explicit integer values
 * 0 (U_LB_UNKNOWN) through 42 (U_LB_ZWJ).
 * U_LB_INSEPERABLE is a second, misspelled name for U_LB_INSEPARABLE and
 * has the same value (15); presumably it is kept so older callers still
 * compile -- confirm.
 * The bracketed trailing comments presumably give each value's short
 * alias -- confirm.
 * NOTE(review): the U_HIDE_DEPRECATED_API section is empty in this listing
 * (listing lines 2256-2261 are not shown).
 */
2188 typedef enum ULineBreak {
2189  /*
2190  * Note: ULineBreak constants are parsed by preparseucd.py.
2191  * It matches lines like
2192  * U_LB_<Unicode Line_Break value name>
2193  */
2194 
2195  U_LB_UNKNOWN = 0, /*[XX]*/
2196  U_LB_AMBIGUOUS = 1, /*[AI]*/
2197  U_LB_ALPHABETIC = 2, /*[AL]*/
2198  U_LB_BREAK_BOTH = 3, /*[B2]*/
2199  U_LB_BREAK_AFTER = 4, /*[BA]*/
2200  U_LB_BREAK_BEFORE = 5, /*[BB]*/
2201  U_LB_MANDATORY_BREAK = 6, /*[BK]*/
2202  U_LB_CONTINGENT_BREAK = 7, /*[CB]*/
2203  U_LB_CLOSE_PUNCTUATION = 8, /*[CL]*/
2204  U_LB_COMBINING_MARK = 9, /*[CM]*/
2205  U_LB_CARRIAGE_RETURN = 10, /*[CR]*/
2206  U_LB_EXCLAMATION = 11, /*[EX]*/
2207  U_LB_GLUE = 12, /*[GL]*/
2208  U_LB_HYPHEN = 13, /*[HY]*/
2209  U_LB_IDEOGRAPHIC = 14, /*[ID]*/
2211  U_LB_INSEPARABLE = 15, /*[IN]*/
2212  U_LB_INSEPERABLE = U_LB_INSEPARABLE,
2213  U_LB_INFIX_NUMERIC = 16, /*[IS]*/
2214  U_LB_LINE_FEED = 17, /*[LF]*/
2215  U_LB_NONSTARTER = 18, /*[NS]*/
2216  U_LB_NUMERIC = 19, /*[NU]*/
2217  U_LB_OPEN_PUNCTUATION = 20, /*[OP]*/
2218  U_LB_POSTFIX_NUMERIC = 21, /*[PO]*/
2219  U_LB_PREFIX_NUMERIC = 22, /*[PR]*/
2220  U_LB_QUOTATION = 23, /*[QU]*/
2221  U_LB_COMPLEX_CONTEXT = 24, /*[SA]*/
2222  U_LB_SURROGATE = 25, /*[SG]*/
2223  U_LB_SPACE = 26, /*[SP]*/
2224  U_LB_BREAK_SYMBOLS = 27, /*[SY]*/
2225  U_LB_ZWSPACE = 28, /*[ZW]*/
2227  U_LB_NEXT_LINE = 29, /*[NL]*/ /* from here on: new in Unicode 4/ICU 2.6 */
2229  U_LB_WORD_JOINER = 30, /*[WJ]*/
2231  U_LB_H2 = 31, /*[H2]*/ /* from here on: new in Unicode 4.1/ICU 3.4 */
2233  U_LB_H3 = 32, /*[H3]*/
2235  U_LB_JL = 33, /*[JL]*/
2237  U_LB_JT = 34, /*[JT]*/
2239  U_LB_JV = 35, /*[JV]*/
2241  U_LB_CLOSE_PARENTHESIS = 36, /*[CP]*/ /* new in Unicode 5.2/ICU 4.4 */
2243  U_LB_CONDITIONAL_JAPANESE_STARTER = 37,/*[CJ]*/ /* new in Unicode 6.1/ICU 49 */
2245  U_LB_HEBREW_LETTER = 38, /*[HL]*/ /* new in Unicode 6.1/ICU 49 */
2247  U_LB_REGIONAL_INDICATOR = 39,/*[RI]*/ /* new in Unicode 6.2/ICU 50 */
2249  U_LB_E_BASE = 40, /*[EB]*/ /* from here on: new in Unicode 9.0/ICU 58 */
2251  U_LB_E_MODIFIER = 41, /*[EM]*/
2253  U_LB_ZWJ = 42, /*[ZWJ]*/
2254 #ifndef U_HIDE_DEPRECATED_API
2255 
2262 #endif // U_HIDE_DEPRECATED_API
2263 } ULineBreak;
2264 
/*
 * Values of the Unicode Numeric_Type property.
 * Enumerators have no explicit initializers and are numbered in declaration
 * order from 0 (U_NT_NONE) to 3 (U_NT_NUMERIC).
 * NOTE(review): the U_HIDE_DEPRECATED_API section is empty in this listing.
 * The page's tooltip index places U_NT_COUNT ("One more than the highest
 * normal UNumericType value") at listing line 2289, i.e. inside that
 * section -- presumably value 4; confirm against the real header.
 */
2271 typedef enum UNumericType {
2272  /*
2273  * Note: UNumericType constants are parsed by preparseucd.py.
2274  * It matches lines like
2275  * U_NT_<Unicode Numeric_Type value name>
2276  */
2277 
2278  U_NT_NONE, /*[None]*/
2279  U_NT_DECIMAL, /*[de]*/
2280  U_NT_DIGIT, /*[di]*/
2281  U_NT_NUMERIC, /*[nu]*/
2282 #ifndef U_HIDE_DEPRECATED_API
2283 
2290 #endif // U_HIDE_DEPRECATED_API
2291 } UNumericType;
2292 
2299 typedef enum UHangulSyllableType {
2300  /*
2301  * Note: UHangulSyllableType constants are parsed by preparseucd.py.
2302  * It matches lines like
2303  * U_HST_<Unicode Hangul_Syllable_Type value name>
2304  */
2305 
2306  U_HST_NOT_APPLICABLE, /*[NA]*/
2307  U_HST_LEADING_JAMO, /*[L]*/
2308  U_HST_VOWEL_JAMO, /*[V]*/
2309  U_HST_TRAILING_JAMO, /*[T]*/
2310  U_HST_LV_SYLLABLE, /*[LV]*/
2311  U_HST_LVT_SYLLABLE, /*[LVT]*/
2312 #ifndef U_HIDE_DEPRECATED_API
2313 
2320 #endif // U_HIDE_DEPRECATED_API
2322 
2349 U_STABLE UBool U_EXPORT2
2351 
2364 U_STABLE UBool U_EXPORT2
2366 
2379 U_STABLE UBool U_EXPORT2
2381 
2394 U_STABLE UBool U_EXPORT2
2396 
2415 U_STABLE UBool U_EXPORT2
2417 
2455 U_STABLE int32_t U_EXPORT2
2457 
2476 U_STABLE int32_t U_EXPORT2
2478 
2505 U_STABLE int32_t U_EXPORT2
2507 
2530 U_STABLE double U_EXPORT2
2532 
/*
 * Sentinel constant of type double with value -123456789.0.
 * Presumably returned by the double-valued numeric-value function declared
 * just above (its name line is missing from this listing) when a code point
 * has no numeric value -- confirm before comparing against it.
 */
2540 #define U_NO_NUMERIC_VALUE ((double)-123456789.)
2541 
/*
 * Character-class predicates. Each takes a single code point (UChar32) and
 * returns a UBool.
 * NOTE(review): the API comments are not part of this listing. Most names
 * mirror the C <ctype.h> functions, so each presumably tests the analogous
 * Unicode character class; the exact definitions (which categories count)
 * must be confirmed against the ICU documentation before relying on them.
 */
2565 U_STABLE UBool U_EXPORT2
2566 u_islower(UChar32 c);
2567 
2592 U_STABLE UBool U_EXPORT2
2593 u_isupper(UChar32 c);
2594 
2609 U_STABLE UBool U_EXPORT2
2610 u_istitle(UChar32 c);
2611 
2630 U_STABLE UBool U_EXPORT2
2631 u_isdigit(UChar32 c);
2632 
2651 U_STABLE UBool U_EXPORT2
2652 u_isalpha(UChar32 c);
2653 
/* Per the page's tooltip: tests whether c is an alphanumeric character (letter or digit). */
2672 U_STABLE UBool U_EXPORT2
2673 u_isalnum(UChar32 c);
2674 
2695 U_STABLE UBool U_EXPORT2
2696 u_isxdigit(UChar32 c);
2697 
2711 U_STABLE UBool U_EXPORT2
2712 u_ispunct(UChar32 c);
2713 
2730 U_STABLE UBool U_EXPORT2
2731 u_isgraph(UChar32 c);
2732 
2758 U_STABLE UBool U_EXPORT2
2759 u_isblank(UChar32 c);
2760 
2783 U_STABLE UBool U_EXPORT2
2784 u_isdefined(UChar32 c);
2785 
2804 U_STABLE UBool U_EXPORT2
2805 u_isspace(UChar32 c);
2806 
2825 U_STABLE UBool U_EXPORT2
2827 
2865 U_STABLE UBool U_EXPORT2
2867 
/* Predicate on one code point, returning UBool. Presumably the control-character test (cf. C iscntrl) -- confirm. */
2889 U_STABLE UBool U_EXPORT2
2890 u_iscntrl(UChar32 c);
2891 
2904 U_STABLE UBool U_EXPORT2
2906 
/* Predicate on one code point, returning UBool. Presumably the printable-character test (cf. C isprint) -- confirm. */
2922 U_STABLE UBool U_EXPORT2
2923 u_isprint(UChar32 c);
2924 
/* Predicate on one code point, returning UBool. Presumably tests for a base (non-combining) character -- confirm. */
2943 U_STABLE UBool U_EXPORT2
2944 u_isbase(UChar32 c);
2945 
2962 U_STABLE UCharDirection U_EXPORT2
2964 
2980 U_STABLE UBool U_EXPORT2
2982 
3002 U_STABLE UChar32 U_EXPORT2
3004 
3021 U_STABLE UChar32 U_EXPORT2
3023 
/*
 * Returns an int8_t classification for code point c. U_GET_GC_MASK() feeds
 * the result to U_MASK() as a bit number, so it is presumably a
 * UCharCategory value in the range 0..31 -- confirm.
 */
3035 U_STABLE int8_t U_EXPORT2
3036 u_charType(UChar32 c);
3037 
/*
 * Single-bit mask for the category of c: U_MASK(u_charType(c)).
 * The result can be tested against the U_GC_*_MASK constants with `&`.
 * c is expanded exactly once.
 */
3051 #define U_GET_GC_MASK(c) U_MASK(u_charType(c))
3052 
/*
 * Callback function type for u_enumCharTypes(). Receives the caller's
 * context pointer, a code point range (start, limit) and a UCharCategory,
 * and returns a UBool.
 * NOTE(review): whether `limit` is exclusive and what the return value
 * signals (continue vs. stop) is not visible here -- confirm.
 */
3070 typedef UBool U_CALLCONV
3071 UCharEnumTypeRange(const void *context, UChar32 start, UChar32 limit, UCharCategory type);
3072 
/*
 * Takes a pointer to a UCharEnumTypeRange callback plus an opaque context
 * pointer; presumably invokes the callback for each range of code points
 * sharing a category and hands `context` through unchanged -- confirm.
 */
3092 U_STABLE void U_EXPORT2
3093 u_enumCharTypes(UCharEnumTypeRange *enumRange, const void *context);
3094 
3095 #if !UCONFIG_NO_NORMALIZATION
3096 
3104 U_STABLE uint8_t U_EXPORT2
3106 
3107 #endif
3108 
3132 U_STABLE int32_t U_EXPORT2
3134 
3144 U_STABLE UBlockCode U_EXPORT2
3146 
/*
 * Looks up a name for a code point.
 *   code         - the code point
 *   nameChoice   - which kind of name to use (UCharNameChoice)
 *   buffer       - caller-provided char buffer for the result
 *   bufferLength - capacity of buffer
 *   pErrorCode   - in/out ICU error code
 * Returns an int32_t, presumably the length of the name -- confirm,
 * including the behavior when the buffer is too small.
 */
3179 U_STABLE int32_t U_EXPORT2
3180 u_charName(UChar32 code, UCharNameChoice nameChoice,
3181  char *buffer, int32_t bufferLength,
3182  UErrorCode *pErrorCode);
3183 
3184 #ifndef U_HIDE_DEPRECATED_API
3185 
3203 U_DEPRECATED int32_t U_EXPORT2
3205  char *dest, int32_t destCapacity,
3206  UErrorCode *pErrorCode);
3207 #endif /* U_HIDE_DEPRECATED_API */
3208 
/*
 * Inverse direction of u_charName(): takes a name string and a
 * UCharNameChoice and returns a code point (UChar32).
 * NOTE(review): the value returned for an unknown name, and the error
 * code set in *pErrorCode in that case, are not visible here -- confirm.
 */
3229 U_STABLE UChar32 U_EXPORT2
3230 u_charFromName(UCharNameChoice nameChoice,
3231  const char *name,
3232  UErrorCode *pErrorCode);
3233 
/*
 * Callback function type for u_enumCharNames(). Receives the caller's
 * context pointer, a code point, the name choice in effect, the name as a
 * char string and its length; returns a UBool.
 * NOTE(review): what the return value signals (continue vs. stop) is not
 * visible here -- confirm.
 */
3251 typedef UBool U_CALLCONV UEnumCharNamesFn(void *context,
3252  UChar32 code,
3253  UCharNameChoice nameChoice,
3254  const char *name,
3255  int32_t length);
3256 
/*
 * Enumerates character names over a code point range, calling `fn` with
 * `context` for the names found.
 * NOTE(review): `limit` is presumably exclusive (start <= code < limit),
 * matching the start/limit naming used elsewhere -- confirm.
 */
3278 U_STABLE void U_EXPORT2
3279 u_enumCharNames(UChar32 start, UChar32 limit,
3280  UEnumCharNamesFn *fn,
3281  void *context,
3282  UCharNameChoice nameChoice,
3283  UErrorCode *pErrorCode);
3284 
/*
 * Maps a UProperty selector to a name string; nameChoice picks the form
 * (UPropertyNameChoice declares U_SHORT_PROPERTY_NAME and
 * U_LONG_PROPERTY_NAME). The result is a const char pointer.
 * NOTE(review): ownership/lifetime of the returned string and the result
 * for an invalid selector are not visible here -- confirm.
 */
3316 U_STABLE const char* U_EXPORT2
3317 u_getPropertyName(UProperty property,
3318  UPropertyNameChoice nameChoice);
3319 
/*
 * Maps a property name/alias string to its UProperty selector.
 * NOTE(review): the value returned for an unrecognized alias is not
 * visible here -- confirm.
 */
3339 U_STABLE UProperty U_EXPORT2
3340 u_getPropertyEnum(const char* alias);
3341 
3389 U_STABLE const char* U_EXPORT2
3391  int32_t value,
3392  UPropertyNameChoice nameChoice);
3393 
3425 U_STABLE int32_t U_EXPORT2
3427  const char* alias);
3428 
/* Predicate on one code point, returning UBool. Presumably: may c start an identifier -- confirm which definition applies. */
3446 U_STABLE UBool U_EXPORT2
3447 u_isIDStart(UChar32 c);
3448 
/* Predicate on one code point, returning UBool. Presumably: may c appear inside an identifier -- confirm which definition applies. */
3470 U_STABLE UBool U_EXPORT2
3471 u_isIDPart(UChar32 c);
3472 
3493 U_STABLE UBool U_EXPORT2
3495 
3512 U_STABLE UBool U_EXPORT2
3514 
3533 U_STABLE UBool U_EXPORT2
3535 
/*
 * Single-code-point case mappings: each takes one UChar32 and returns one
 * UChar32, so a mapping that would need more than one output code point
 * cannot be expressed through these functions.
 * NOTE(review): presumably the input is returned unchanged when it has no
 * mapping -- confirm.
 */
3558 U_STABLE UChar32 U_EXPORT2
3559 u_tolower(UChar32 c);
3560 
3583 U_STABLE UChar32 U_EXPORT2
3584 u_toupper(UChar32 c);
3585 
3608 U_STABLE UChar32 U_EXPORT2
3609 u_totitle(UChar32 c);
3610 
/* Like the mappings above, with an extra `options` bit set; the option constants are presumably those from unicode/stringoptions.h, included at the top of this header -- confirm. */
3633 U_STABLE UChar32 U_EXPORT2
3634 u_foldCase(UChar32 c, uint32_t options);
3635 
/*
 * Converts code point ch to an int32_t digit value in the given radix.
 * NOTE(review): the accepted radix range and the value returned for a
 * non-digit are not visible here -- confirm.
 */
3674 U_STABLE int32_t U_EXPORT2
3675 u_digit(UChar32 ch, int8_t radix);
3676 
/*
 * Reverse of u_digit(): converts a digit value in the given radix to a
 * code point.
 * NOTE(review): the result for an out-of-range digit or radix is not
 * visible here -- confirm.
 */
3705 U_STABLE UChar32 U_EXPORT2
3706 u_forDigit(int32_t digit, int8_t radix);
3707 
/*
 * Version information for code point c. Returns void; the result is
 * presumably written into the caller-supplied versionArray -- confirm.
 */
3722 U_STABLE void U_EXPORT2
3723 u_charAge(UChar32 c, UVersionInfo versionArray);
3724 
/*
 * Unicode version of the character data (the function the file history
 * records as renamed from u_getVersion). Returns void; the result is
 * presumably written into the caller-supplied versionArray -- confirm.
 */
3736 U_STABLE void U_EXPORT2
3737 u_getUnicodeVersion(UVersionInfo versionArray);
3738 
3739 #if !UCONFIG_NO_NORMALIZATION
3740 
/*
 * Only declared when UCONFIG_NO_NORMALIZATION is 0.
 * Writes a UChar string for code point c into dest (capacity destCapacity)
 * and reports errors through *pErrorCode.
 * NOTE(review): presumably returns the length of the result string;
 * confirm, including the behavior when dest is too small.
 */
3761 U_STABLE int32_t U_EXPORT2
3762 u_getFC_NFKC_Closure(UChar32 c, UChar *dest, int32_t destCapacity, UErrorCode *pErrorCode);
3763 
3764 #endif
3765 
3766 
3768 
3769 #endif /* UCHAR_H */
3770 /*eof*/
UBLOCK_CJK_COMPATIBILITY_IDEOGRAPHS
@ UBLOCK_CJK_COMPATIBILITY_IDEOGRAPHS
Definition: uchar.h:1237
U_POP_DIRECTIONAL_ISOLATE
@ U_POP_DIRECTIONAL_ISOLATE
PDI.
Definition: uchar.h:922
U_JG_TEH_MARBUTA_GOAL
@ U_JG_TEH_MARBUTA_GOAL
Definition: uchar.h:1925
U_GCB_GLUE_AFTER_ZWJ
@ U_GCB_GLUE_AFTER_ZWJ
Definition: uchar.h:2064
u_getPropertyValueEnum
int32_t u_getPropertyValueEnum(UProperty property, const char *alias)
Return the property value integer for a given value name, as specified in the Unicode database file PropertyValueAliases.txt.
UBLOCK_HANIFI_ROHINGYA
@ UBLOCK_HANIFI_ROHINGYA
Definition: uchar.h:1704
U_JG_NYA
@ U_JG_NYA
Definition: uchar.h:1968
UBLOCK_MEDEFAIDRIN
@ UBLOCK_MEDEFAIDRIN
Definition: uchar.h:1712
UCHAR_JOINING_TYPE
@ UCHAR_JOINING_TYPE
Enumerated property Joining_Type.
Definition: uchar.h:490
UCHAR_POSIX_XDIGIT
@ UCHAR_POSIX_XDIGIT
Binary property xdigit (a C/POSIX character class).
Definition: uchar.h:387
UCHAR_ALPHABETIC
@ UCHAR_ALPHABETIC
Binary property Alphabetic.
Definition: uchar.h:179
u_isalnum
UBool u_isalnum(UChar32 c)
Determines whether the specified code point is an alphanumeric character (letter or digit) according to Java.
U_ENCLOSING_MARK
@ U_ENCLOSING_MARK
Me.
Definition: uchar.h:698
UBLOCK_EARLY_DYNASTIC_CUNEIFORM
@ UBLOCK_EARLY_DYNASTIC_CUNEIFORM
Definition: uchar.h:1639
UCHAR_ASCII_HEX_DIGIT
@ UCHAR_ASCII_HEX_DIGIT
Binary property ASCII_Hex_Digit.
Definition: uchar.h:183
UBLOCK_SUPPLEMENTAL_SYMBOLS_AND_PICTOGRAPHS
@ UBLOCK_SUPPLEMENTAL_SYMBOLS_AND_PICTOGRAPHS
Definition: uchar.h:1647
UCHAR_RADICAL
@ UCHAR_RADICAL
Binary property Radical (new in Unicode 3.2).
Definition: uchar.h:271
U_NT_COUNT
@ U_NT_COUNT
One more than the highest normal UNumericType value.
Definition: uchar.h:2289
UBLOCK_DINGBATS
@ UBLOCK_DINGBATS
Definition: uchar.h:1150
UBLOCK_GREEK
@ UBLOCK_GREEK
Unicode 3.2 renames this block to "Greek and Coptic".
Definition: uchar.h:1003
U_LB_ZWJ
@ U_LB_ZWJ
Definition: uchar.h:2253
UBLOCK_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_F
@ UBLOCK_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_F
Definition: uchar.h:1679
UCHAR_BIDI_PAIRED_BRACKET
@ UCHAR_BIDI_PAIRED_BRACKET
String property Bidi_Paired_Bracket (new in Unicode 6.3).
Definition: uchar.h:638
UCHAR_NFD_QUICK_CHECK
@ UCHAR_NFD_QUICK_CHECK
Enumerated property NFD_Quick_Check.
Definition: uchar.h:505
UCHAR_SIMPLE_UPPERCASE_MAPPING
@ UCHAR_SIMPLE_UPPERCASE_MAPPING
String property Simple_Uppercase_Mapping.
Definition: uchar.h:622
UBLOCK_UGARITIC
@ UBLOCK_UGARITIC
Definition: uchar.h:1341
U_JG_MANICHAEAN_QOPH
@ U_JG_MANICHAEAN_QOPH
Definition: uchar.h:1985
U_JG_AFRICAN_QAF
@ U_JG_AFRICAN_QAF
Definition: uchar.h:2000
U_ARABIC_NUMBER
@ U_ARABIC_NUMBER
AN.
Definition: uchar.h:888
UBLOCK_LIMBU
@ UBLOCK_LIMBU
Definition: uchar.h:1323
UBLOCK_SORA_SOMPENG
@ UBLOCK_SORA_SOMPENG
Definition: uchar.h:1555
u_charAge
void u_charAge(UChar32 c, UVersionInfo versionArray)
Get the "age" of the code point.
UBLOCK_CJK_STROKES
@ UBLOCK_CJK_STROKES
Definition: uchar.h:1364
UBLOCK_MISCELLANEOUS_TECHNICAL
@ UBLOCK_MISCELLANEOUS_TECHNICAL
Definition: uchar.h:1126
U_LB_WORD_JOINER
@ U_LB_WORD_JOINER
Definition: uchar.h:2229
UBLOCK_PHAGS_PA
@ UBLOCK_PHAGS_PA
Definition: uchar.h:1407
UCHAR_CASE_FOLDING
@ UCHAR_CASE_FOLDING
String property Case_Folding.
Definition: uchar.h:599
UBLOCK_CUNEIFORM_NUMBERS_AND_PUNCTUATION
@ UBLOCK_CUNEIFORM_NUMBERS_AND_PUNCTUATION
Definition: uchar.h:1413
UBLOCK_MEETEI_MAYEK_EXTENSIONS
@ UBLOCK_MEETEI_MAYEK_EXTENSIONS
Definition: uchar.h:1545
UBLOCK_ADLAM
@ UBLOCK_ADLAM
Definition: uchar.h:1654
UBLOCK_SUTTON_SIGNWRITING
@ UBLOCK_SUTTON_SIGNWRITING
Definition: uchar.h:1649
UBLOCK_MISCELLANEOUS_SYMBOLS
@ UBLOCK_MISCELLANEOUS_SYMBOLS
Definition: uchar.h:1147
u_charDirection
UCharDirection u_charDirection(UChar32 c)
Returns the bidirectional category value for the code point, which is used in the Unicode bidirectional algorithm (UAX #9).
UBLOCK_DESERET
@ UBLOCK_DESERET
Definition: uchar.h:1270
U_TITLECASE_LETTER
@ U_TITLECASE_LETTER
Lt.
Definition: uchar.h:690
UCHAR_MASK_LIMIT
@ UCHAR_MASK_LIMIT
One more than the last constant for bit-mask Unicode properties.
Definition: uchar.h:573
UCHAR_SIMPLE_TITLECASE_MAPPING
@ UCHAR_SIMPLE_TITLECASE_MAPPING
String property Simple_Titlecase_Mapping.
Definition: uchar.h:619
UBLOCK_OLD_SOUTH_ARABIAN
@ UBLOCK_OLD_SOUTH_ARABIAN
Definition: uchar.h:1487
UCHAR_DOUBLE_LIMIT
@ UCHAR_DOUBLE_LIMIT
One more than the last constant for double Unicode properties.
Definition: uchar.h:586
UBLOCK_MODIFIER_TONE_LETTERS
@ UBLOCK_MODIFIER_TONE_LETTERS
Definition: uchar.h:1380
UCHAR_EMOJI_MODIFIER
@ UCHAR_EMOJI_MODIFIER
Binary property Emoji_Modifier.
Definition: uchar.h:424
u_getIntPropertyValue
int32_t u_getIntPropertyValue(UChar32 c, UProperty which)
Get the property value for an enumerated or integer Unicode property for a code point.
UBLOCK_MANDAIC
@ UBLOCK_MANDAIC
Definition: uchar.h:1512
UBLOCK_GREEK_EXTENDED
@ UBLOCK_GREEK_EXTENDED
Definition: uchar.h:1096
UBLOCK_MARCHEN
@ UBLOCK_MARCHEN
Definition: uchar.h:1664
U_LOWERCASE_LETTER
@ U_LOWERCASE_LETTER
Ll.
Definition: uchar.h:688
UCHAR_HYPHEN
@ UCHAR_HYPHEN
Binary property Hyphen.
Definition: uchar.h:229
UCHAR_NUMERIC_VALUE
@ UCHAR_NUMERIC_VALUE
Double property Numeric_Value.
Definition: uchar.h:578
UBLOCK_NUMBER_FORMS
@ UBLOCK_NUMBER_FORMS
Definition: uchar.h:1117
UBLOCK_SHORTHAND_FORMAT_CONTROLS
@ UBLOCK_SHORTHAND_FORMAT_CONTROLS
Definition: uchar.h:1616
UBLOCK_MEROITIC_CURSIVE
@ UBLOCK_MEROITIC_CURSIVE
Definition: uchar.h:1547
utypes.h
Basic definitions for ICU, for both C and C++ APIs.
UBLOCK_ENCLOSED_IDEOGRAPHIC_SUPPLEMENT
@ UBLOCK_ENCLOSED_IDEOGRAPHIC_SUPPLEMENT
Definition: uchar.h:1505
u_charName
int32_t u_charName(UChar32 code, UCharNameChoice nameChoice, char *buffer, int32_t bufferLength, UErrorCode *pErrorCode)
Retrieve the name of a Unicode character.
UCHAR_NFKD_INERT
@ UCHAR_NFKD_INERT
Binary property NFKD_Inert.
Definition: uchar.h:327
UBLOCK_OSAGE
@ UBLOCK_OSAGE
Definition: uchar.h:1670
UBLOCK_LETTERLIKE_SYMBOLS
@ UBLOCK_LETTERLIKE_SYMBOLS
Definition: uchar.h:1114
UCHAR_LOGICAL_ORDER_EXCEPTION
@ UCHAR_LOGICAL_ORDER_EXCEPTION
Binary property Logical_Order_Exception (new in Unicode 3.2).
Definition: uchar.h:256
U_LINE_SEPARATOR
@ U_LINE_SEPARATOR
Zl.
Definition: uchar.h:710
UCHAR_TITLECASE_MAPPING
@ UCHAR_TITLECASE_MAPPING
String property Titlecase_Mapping.
Definition: uchar.h:625
u_isspace
UBool u_isspace(UChar32 c)
Determines if the specified character is a space character or not.
UBLOCK_COUNT
@ UBLOCK_COUNT
One more than the highest normal UBlockCode value.
Definition: uchar.h:1725
U_JG_STRAIGHT_WAW
@ U_JG_STRAIGHT_WAW
Definition: uchar.h:1997
UCHAR_SENTENCE_BREAK
@ UCHAR_SENTENCE_BREAK
Enumerated property Sentence_Break (new in Unicode 4.1).
Definition: uchar.h:538
U_COMBINING_SPACING_MARK
@ U_COMBINING_SPACING_MARK
Mc.
Definition: uchar.h:700
U_EUROPEAN_NUMBER_TERMINATOR
@ U_EUROPEAN_NUMBER_TERMINATOR
ET.
Definition: uchar.h:886
UBLOCK_VARIATION_SELECTORS
@ UBLOCK_VARIATION_SELECTORS
Definition: uchar.h:1314
U_WB_COUNT
@ U_WB_COUNT
One more than the highest normal UWordBreakValues value.
Definition: uchar.h:2139
U_LB_REGIONAL_INDICATOR
@ U_LB_REGIONAL_INDICATOR
Definition: uchar.h:2247
U_CHAR_CATEGORY_COUNT
@ U_CHAR_CATEGORY_COUNT
One higher than the last enum UCharCategory constant.
Definition: uchar.h:750
U_PROPERTY_NAME_CHOICE_COUNT
@ U_PROPERTY_NAME_CHOICE_COUNT
One more than the highest normal UPropertyNameChoice value.
Definition: uchar.h:1822
UBool
int8_t UBool
The ICU boolean type.
Definition: umachine.h:236
UBLOCK_UNIFIED_CANADIAN_ABORIGINAL_SYLLABICS_EXTENDED
@ UBLOCK_UNIFIED_CANADIAN_ABORIGINAL_SYLLABICS_EXTENDED
Definition: uchar.h:1459
UCHAR_NFKC_INERT
@ UCHAR_NFKC_INERT
Binary property NFKC_Inert.
Definition: uchar.h:341
UBLOCK_TANGUT
@ UBLOCK_TANGUT
Definition: uchar.h:1672
UBLOCK_CJK_COMPATIBILITY_IDEOGRAPHS_SUPPLEMENT
@ UBLOCK_CJK_COMPATIBILITY_IDEOGRAPHS_SUPPLEMENT
Definition: uchar.h:1280
UBLOCK_CYRILLIC_EXTENDED_B
@ UBLOCK_CYRILLIC_EXTENDED_B
Definition: uchar.h:1430
UBLOCK_MAHAJANI
@ UBLOCK_MAHAJANI
Definition: uchar.h:1588
U_FINAL_PUNCTUATION
@ U_FINAL_PUNCTUATION
Pf.
Definition: uchar.h:742
u_getISOComment
int32_t u_getISOComment(UChar32 c, char *dest, int32_t destCapacity, UErrorCode *pErrorCode)
Returns an empty string.
U_JG_MALAYALAM_NNNA
@ U_JG_MALAYALAM_NNNA
Definition: uchar.h:2008
UBLOCK_LAO
@ UBLOCK_LAO
Definition: uchar.h:1057
UBLOCK_ARABIC_MATHEMATICAL_ALPHABETIC_SYMBOLS
@ UBLOCK_ARABIC_MATHEMATICAL_ALPHABETIC_SYMBOLS
Definition: uchar.h:1541
u_enumCharTypes
void u_enumCharTypes(UCharEnumTypeRange *enumRange, const void *context)
Enumerate efficiently all code points with their Unicode general categories.
u_getIntPropertyMaxValue
int32_t u_getIntPropertyMaxValue(UProperty which)
Get the maximum value for an enumerated/integer/binary Unicode property.
U_WB_LF
@ U_WB_LF
Definition: uchar.h:2106
UCHAR_ISO_COMMENT
@ UCHAR_ISO_COMMENT
Deprecated string property ISO_Comment.
Definition: uchar.h:603
UCHAR_CHANGES_WHEN_CASEMAPPED
@ UCHAR_CHANGES_WHEN_CASEMAPPED
Binary property Changes_When_Casemapped.
Definition: uchar.h:401
UBLOCK_CARIAN
@ UBLOCK_CARIAN
Definition: uchar.h:1446
UBLOCK_HIGH_SURROGATES
@ UBLOCK_HIGH_SURROGATES
Definition: uchar.h:1207
U_RIGHT_TO_LEFT_ARABIC
@ U_RIGHT_TO_LEFT_ARABIC
AL.
Definition: uchar.h:904
UBLOCK_UNIFIED_CANADIAN_ABORIGINAL_SYLLABICS
@ UBLOCK_UNIFIED_CANADIAN_ABORIGINAL_SYLLABICS
Definition: uchar.h:1078
U_LB_H2
@ U_LB_H2
Definition: uchar.h:2231
UBLOCK_RUNIC
@ UBLOCK_RUNIC
Definition: uchar.h:1084
UCHAR_POSIX_BLANK
@ UCHAR_POSIX_BLANK
Binary property blank (a C/POSIX character class).
Definition: uchar.h:372
U_LB_NEXT_LINE
@ U_LB_NEXT_LINE
Definition: uchar.h:2227
u_iscntrl
UBool u_iscntrl(UChar32 c)
Determines whether the specified code point is a control character (as defined by this function).
UBLOCK_MALAYALAM
@ UBLOCK_MALAYALAM
Definition: uchar.h:1048
UCHAR_POSIX_GRAPH
@ UCHAR_POSIX_GRAPH
Binary property graph (a C/POSIX character class).
Definition: uchar.h:377
UCHAR_NONCHARACTER_CODE_POINT
@ UCHAR_NONCHARACTER_CODE_POINT
Binary property Noncharacter_Code_Point.
Definition: uchar.h:265
UBLOCK_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_A
@ UBLOCK_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_A
Definition: uchar.h:1192
u_isUUppercase
UBool u_isUUppercase(UChar32 c)
Check if a code point has the Uppercase Unicode property.
UBLOCK_OLD_PERMIC
@ UBLOCK_OLD_PERMIC
Definition: uchar.h:1604
U_JG_MANICHAEAN_WAW
@ U_JG_MANICHAEAN_WAW
Definition: uchar.h:1994
UBLOCK_SUPPLEMENTAL_ARROWS_A
@ UBLOCK_SUPPLEMENTAL_ARROWS_A
Definition: uchar.h:1304
u_getBidiPairedBracket
UChar32 u_getBidiPairedBracket(UChar32 c)
Maps the specified character to its paired bracket character.
UBLOCK_CJK_COMPATIBILITY
@ UBLOCK_CJK_COMPATIBILITY
Definition: uchar.h:1189
U_CALLCONV
#define U_CALLCONV
Definition: platform.h:836
UBLOCK_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_D
@ UBLOCK_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_D
Definition: uchar.h:1534
UBLOCK_PLAYING_CARDS
@ UBLOCK_PLAYING_CARDS
Definition: uchar.h:1524
U_LB_CLOSE_PARENTHESIS
@ U_LB_CLOSE_PARENTHESIS
Definition: uchar.h:2241
U_JG_MANICHAEAN_ZAYIN
@ U_JG_MANICHAEAN_ZAYIN
Definition: uchar.h:1996
U_OTHER_PUNCTUATION
@ U_OTHER_PUNCTUATION
Po.
Definition: uchar.h:730
UBLOCK_HANGUL_SYLLABLES
@ UBLOCK_HANGUL_SYLLABLES
Definition: uchar.h:1204
UBLOCK_NEW_TAI_LUE
@ UBLOCK_NEW_TAI_LUE
Definition: uchar.h:1382
UBLOCK_BOPOMOFO_EXTENDED
@ UBLOCK_BOPOMOFO_EXTENDED
Definition: uchar.h:1183
UCHAR_AGE
@ UCHAR_AGE
String property Age.
Definition: uchar.h:591
UBLOCK_ETHIOPIC_SUPPLEMENT
@ UBLOCK_ETHIOPIC_SUPPLEMENT
Definition: uchar.h:1372
UBLOCK_MANICHAEAN
@ UBLOCK_MANICHAEAN
Definition: uchar.h:1590
UBLOCK_GURMUKHI
@ UBLOCK_GURMUKHI
Definition: uchar.h:1030
UCHAR_BIDI_PAIRED_BRACKET_TYPE
@ UCHAR_BIDI_PAIRED_BRACKET_TYPE
Enumerated property Bidi_Paired_Bracket_Type (new in Unicode 6.3).
Definition: uchar.h:548
UBLOCK_REJANG
@ UBLOCK_REJANG
Definition: uchar.h:1436
UCHAR_INVALID_CODE
@ UCHAR_INVALID_CODE
Represents a nonexistent or invalid property or property value.
Definition: uchar.h:664
U_JG_MANICHAEAN_RESH
@ U_JG_MANICHAEAN_RESH
Definition: uchar.h:1986
UBLOCK_BUHID
@ UBLOCK_BUHID
Definition: uchar.h:1298
U_LB_JL
@ U_LB_JL
Definition: uchar.h:2235
U_CHAR_DIRECTION_COUNT
@ U_CHAR_DIRECTION_COUNT
One more than the highest UCharDirection value.
Definition: uchar.h:930
UBLOCK_COMBINING_MARKS_FOR_SYMBOLS
@ UBLOCK_COMBINING_MARKS_FOR_SYMBOLS
Unicode 3.2 renames this block to "Combining Diacritical Marks for Symbols".
Definition: uchar.h:1111
U_UNICODE_10_CHAR_NAME
@ U_UNICODE_10_CHAR_NAME
The Unicode_1_Name property value which is of little practical value.
Definition: uchar.h:1786
UBLOCK_LATIN_EXTENDED_E
@ UBLOCK_LATIN_EXTENDED_E
Definition: uchar.h:1584
UBLOCK_DOGRA
@ UBLOCK_DOGRA
Definition: uchar.h:1698
u_isUAlphabetic
UBool u_isUAlphabetic(UChar32 c)
Check if a code point has the Alphabetic Unicode property.
U_OTHER_NUMBER
@ U_OTHER_NUMBER
No.
Definition: uchar.h:706
UBLOCK_CYPRIOT_SYLLABARY
@ UBLOCK_CYPRIOT_SYLLABARY
Definition: uchar.h:1347
UBLOCK_CHEROKEE_SUPPLEMENT
@ UBLOCK_CHEROKEE_SUPPLEMENT
Definition: uchar.h:1635
UBlockCode
UBlockCode
Constants for Unicode blocks, see the Unicode Data file Blocks.txt.
Definition: uchar.h:968
UCHAR_WHITE_SPACE
@ UCHAR_WHITE_SPACE
Binary property White_Space.
Definition: uchar.h:291
UBLOCK_EMOTICONS
@ UBLOCK_EMOTICONS
Definition: uchar.h:1528
UBLOCK_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_C
@ UBLOCK_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_C
Definition: uchar.h:1507
U_CURRENCY_SYMBOL
@ U_CURRENCY_SYMBOL
Sc.
Definition: uchar.h:734
U_LETTER_NUMBER
@ U_LETTER_NUMBER
Nl.
Definition: uchar.h:704
UProperty
UProperty
Selection constants for Unicode properties.
Definition: uchar.h:165
UBLOCK_MATHEMATICAL_ALPHANUMERIC_SYMBOLS
@ UBLOCK_MATHEMATICAL_ALPHANUMERIC_SYMBOLS
Definition: uchar.h:1276
UBLOCK_KHUDAWADI
@ UBLOCK_KHUDAWADI
Definition: uchar.h:1582
u_enumCharNames
void u_enumCharNames(UChar32 start, UChar32 limit, UEnumCharNamesFn *fn, void *context, UCharNameChoice nameChoice, UErrorCode *pErrorCode)
Enumerate all assigned Unicode characters between the start and limit code points (start inclusive, limit exclusive) and call a function for each, passing the code point value and the character name.
UBLOCK_KANA_EXTENDED_A
@ UBLOCK_KANA_EXTENDED_A
Definition: uchar.h:1681
U_WB_REGIONAL_INDICATOR
@ U_WB_REGIONAL_INDICATOR
Definition: uchar.h:2112
U_EUROPEAN_NUMBER
@ U_EUROPEAN_NUMBER
EN.
Definition: uchar.h:882
U_DEPRECATED
#define U_DEPRECATED
This is used to declare a function as a deprecated public ICU C API.
Definition: umachine.h:115
UBLOCK_LYCIAN
@ UBLOCK_LYCIAN
Definition: uchar.h:1444
UBLOCK_SOGDIAN
@ UBLOCK_SOGDIAN
Definition: uchar.h:1716
UBLOCK_INSCRIPTIONAL_PARTHIAN
@ UBLOCK_INSCRIPTIONAL_PARTHIAN
Definition: uchar.h:1491
U_COMMON_NUMBER_SEPARATOR
@ U_COMMON_NUMBER_SEPARATOR
CS.
Definition: uchar.h:890
UBLOCK_IDEOGRAPHIC_DESCRIPTION_CHARACTERS
@ UBLOCK_IDEOGRAPHIC_DESCRIPTION_CHARACTERS
Definition: uchar.h:1162
u_isJavaIDStart
UBool u_isJavaIDStart(UChar32 c)
Determines if the specified character is permissible as the first character in a Java identifier.
u_isMirrored
UBool u_isMirrored(UChar32 c)
Determines whether the code point has the Bidi_Mirrored property.
U_WB_GLUE_AFTER_ZWJ
@ U_WB_GLUE_AFTER_ZWJ
Definition: uchar.h:2126
UBLOCK_VEDIC_EXTENSIONS
@ UBLOCK_VEDIC_EXTENSIONS
Definition: uchar.h:1463
UBLOCK_VAI
@ UBLOCK_VAI
Definition: uchar.h:1428
UBLOCK_SUPPLEMENTARY_PRIVATE_USE_AREA_B
@ UBLOCK_SUPPLEMENTARY_PRIVATE_USE_AREA_B
Definition: uchar.h:1318
UBLOCK_EGYPTIAN_HIEROGLYPHS
@ UBLOCK_EGYPTIAN_HIEROGLYPHS
Definition: uchar.h:1501
UBLOCK_PRIVATE_USE
@ UBLOCK_PRIVATE_USE
Same as UBLOCK_PRIVATE_USE_AREA.
Definition: uchar.h:1234
UBLOCK_ANCIENT_GREEK_NUMBERS
@ UBLOCK_ANCIENT_GREEK_NUMBERS
Definition: uchar.h:1358
U_CHAR_NAME_ALIAS
@ U_CHAR_NAME_ALIAS
Corrected name from NameAliases.txt.
Definition: uchar.h:1791
U_DT_COUNT
@ U_DT_COUNT
One more than the highest normal UDecompositionType value.
Definition: uchar.h:1864
UBLOCK_SOYOMBO
@ UBLOCK_SOYOMBO
Definition: uchar.h:1687
UBLOCK_YIJING_HEXAGRAM_SYMBOLS
@ UBLOCK_YIJING_HEXAGRAM_SYMBOLS
Definition: uchar.h:1333
UBLOCK_ZANABAZAR_SQUARE
@ UBLOCK_ZANABAZAR_SQUARE
Definition: uchar.h:1691
U_SURROGATE
@ U_SURROGATE
Cs.
Definition: uchar.h:720
UCHAR_CASE_IGNORABLE
@ UCHAR_CASE_IGNORABLE
Binary property Case_Ignorable.
Definition: uchar.h:391
UBLOCK_ARABIC_PRESENTATION_FORMS_B
@ UBLOCK_ARABIC_PRESENTATION_FORMS_B
Definition: uchar.h:1255
UCHAR_CANONICAL_COMBINING_CLASS
@ UCHAR_CANONICAL_COMBINING_CLASS
Enumerated property Canonical_Combining_Class.
Definition: uchar.h:474
UCHAR_REGIONAL_INDICATOR
@ UCHAR_REGIONAL_INDICATOR
Binary property Regional_Indicator.
Definition: uchar.h:443
UCHAR_LINE_BREAK
@ UCHAR_LINE_BREAK
Enumerated property Line_Break.
Definition: uchar.h:493
UBLOCK_BALINESE
@ UBLOCK_BALINESE
Definition: uchar.h:1401
UBLOCK_AEGEAN_NUMBERS
@ UBLOCK_AEGEAN_NUMBERS
Definition: uchar.h:1339
u_digit
int32_t u_digit(UChar32 ch, int8_t radix)
Returns the decimal digit value of the code point in the specified radix.
UBLOCK_ANCIENT_SYMBOLS
@ UBLOCK_ANCIENT_SYMBOLS
Definition: uchar.h:1440
U_PARAGRAPH_SEPARATOR
@ U_PARAGRAPH_SEPARATOR
Zp.
Definition: uchar.h:712
UBLOCK_COMBINING_DIACRITICAL_MARKS_EXTENDED
@ UBLOCK_COMBINING_DIACRITICAL_MARKS_EXTENDED
Definition: uchar.h:1570
UBLOCK_BOPOMOFO
@ UBLOCK_BOPOMOFO
Definition: uchar.h:1174
U_WB_ZWJ
@ U_WB_ZWJ
Definition: uchar.h:2128
UBLOCK_NEWA
@ UBLOCK_NEWA
Definition: uchar.h:1668
UBLOCK_GEOMETRIC_SHAPES_EXTENDED
@ UBLOCK_GEOMETRIC_SHAPES_EXTENDED
Definition: uchar.h:1576
UEnumCharNamesFn
UBool UEnumCharNamesFn(void *context, UChar32 code, UCharNameChoice nameChoice, const char *name, int32_t length)
Type of a callback function for u_enumCharNames() that gets called for each Unicode character with the code point value and the character name.
Definition: uchar.h:3251
UBLOCK_DEVANAGARI
@ UBLOCK_DEVANAGARI
Definition: uchar.h:1024
UCHAR_GENERAL_CATEGORY_MASK
@ UCHAR_GENERAL_CATEGORY_MASK
Bitmask property General_Category_Mask.
Definition: uchar.h:565
U_JG_AFRICAN_NOON
@ U_JG_AFRICAN_NOON
Definition: uchar.h:1999
UCHAR_UPPERCASE_MAPPING
@ UCHAR_UPPERCASE_MAPPING
String property Uppercase_Mapping.
Definition: uchar.h:635
UBLOCK_TIBETAN
@ UBLOCK_TIBETAN
Definition: uchar.h:1060
UHangulSyllableType
UHangulSyllableType
Hangul Syllable Type constants.
Definition: uchar.h:2299
u_tolower
UChar32 u_tolower(UChar32 c)
The given character is mapped to its lowercase equivalent according to UnicodeData.txt; if the character has no lowercase equivalent, the character itself is returned.
U_WB_E_BASE
@ U_WB_E_BASE
Definition: uchar.h:2120
UBLOCK_GEORGIAN_EXTENDED
@ UBLOCK_GEORGIAN_EXTENDED
Definition: uchar.h:1700
UBLOCK_COMBINING_DIACRITICAL_MARKS_SUPPLEMENT
@ UBLOCK_COMBINING_DIACRITICAL_MARKS_SUPPLEMENT
Definition: uchar.h:1366
u_isbase
UBool u_isbase(UChar32 c)
Determines whether the specified code point is a base character.
UBLOCK_MAHJONG_TILES
@ UBLOCK_MAHJONG_TILES
Definition: uchar.h:1450
UBLOCK_OGHAM
@ UBLOCK_OGHAM
Definition: uchar.h:1081
U_JG_MANICHAEAN_TAW
@ U_JG_MANICHAEAN_TAW
Definition: uchar.h:1989
UBLOCK_ARABIC_SUPPLEMENT
@ UBLOCK_ARABIC_SUPPLEMENT
Definition: uchar.h:1360
UCHAR_DASH
@ UCHAR_DASH
Binary property Dash.
Definition: uchar.h:194
UBLOCK_SPECIALS
@ UBLOCK_SPECIALS
Definition: uchar.h:1258
U_NON_SPACING_MARK
@ U_NON_SPACING_MARK
Mn.
Definition: uchar.h:696
UBLOCK_TAI_LE
@ UBLOCK_TAI_LE
Definition: uchar.h:1325
u_isdefined
UBool u_isdefined(UChar32 c)
Determines whether the specified code point is "defined", which usually means that it is assigned a character.
U_WHITE_SPACE_NEUTRAL
@ U_WHITE_SPACE_NEUTRAL
WS.
Definition: uchar.h:896
u_charType
int8_t u_charType(UChar32 c)
Returns the general category value for the code point.
U_FIRST_STRONG_ISOLATE
@ U_FIRST_STRONG_ISOLATE
FSI.
Definition: uchar.h:916
U_WB_NEWLINE
@ U_WB_NEWLINE
Definition: uchar.h:2110
U_MODIFIER_LETTER
@ U_MODIFIER_LETTER
Lm.
Definition: uchar.h:692
UCHAR_BIDI_MIRRORED
@ UCHAR_BIDI_MIRRORED
Binary property Bidi_Mirrored.
Definition: uchar.h:192
UCHAR_BIDI_MIRRORING_GLYPH
@ UCHAR_BIDI_MIRRORING_GLYPH
String property Bidi_Mirroring_Glyph.
Definition: uchar.h:596
U_JG_MANICHAEAN_DHAMEDH
@ U_JG_MANICHAEAN_DHAMEDH
Definition: uchar.h:1974
UBLOCK_MONGOLIAN_SUPPLEMENT
@ UBLOCK_MONGOLIAN_SUPPLEMENT
Definition: uchar.h:1666
UBLOCK_OLD_TURKIC
@ UBLOCK_OLD_TURKIC
Definition: uchar.h:1495
U_JG_COUNT
@ U_JG_COUNT
One more than the highest normal UJoiningGroup value.
Definition: uchar.h:2024
UBLOCK_TAKRI
@ UBLOCK_TAKRI
Definition: uchar.h:1559
UBLOCK_DUPLOYAN
@ UBLOCK_DUPLOYAN
Definition: uchar.h:1572
UCHAR_INT_START
@ UCHAR_INT_START
First constant for enumerated/integer Unicode properties.
Definition: uchar.h:468
UBLOCK_NKO
@ UBLOCK_NKO
Definition: uchar.h:1399
UBLOCK_BHAIKSUKI
@ UBLOCK_BHAIKSUKI
Definition: uchar.h:1656
UBLOCK_IPA_EXTENSIONS
@ UBLOCK_IPA_EXTENSIONS
Definition: uchar.h:991
U_LEFT_TO_RIGHT_ISOLATE
@ U_LEFT_TO_RIGHT_ISOLATE
LRI.
Definition: uchar.h:918
UBLOCK_TRANSPORT_AND_MAP_SYMBOLS
@ UBLOCK_TRANSPORT_AND_MAP_SYMBOLS
Definition: uchar.h:1530
UCHAR_EXTENDER
@ UCHAR_EXTENDER
Binary property Extender.
Definition: uchar.h:208
UCHAR_IDS_TRINARY_OPERATOR
@ UCHAR_IDS_TRINARY_OPERATOR
Binary property IDS_Trinary_Operator (new in Unicode 3.2).
Definition: uchar.h:249
u_isalpha
UBool u_isalpha(UChar32 c)
Determines whether the specified code point is a letter character.
UCHAR_CHANGES_WHEN_UPPERCASED
@ UCHAR_CHANGES_WHEN_UPPERCASED
Binary property Changes_When_Uppercased.
Definition: uchar.h:395
U_LB_E_MODIFIER
@ U_LB_E_MODIFIER
Definition: uchar.h:2251
UBLOCK_KANGXI_RADICALS
@ UBLOCK_KANGXI_RADICALS
Definition: uchar.h:1159
UBLOCK_ARABIC
@ UBLOCK_ARABIC
Definition: uchar.h:1015
U_JG_MALAYALAM_NGA
@ U_JG_MALAYALAM_NGA
Definition: uchar.h:2006
UBLOCK_SAURASHTRA
@ UBLOCK_SAURASHTRA
Definition: uchar.h:1432
UBLOCK_NUSHU
@ UBLOCK_NUSHU
Definition: uchar.h:1685
UCHAR_DECOMPOSITION_TYPE
@ UCHAR_DECOMPOSITION_TYPE
Enumerated property Decomposition_Type.
Definition: uchar.h:477
UCHAR_IDS_BINARY_OPERATOR
@ UCHAR_IDS_BINARY_OPERATOR
Binary property IDS_Binary_Operator (new in Unicode 3.2).
Definition: uchar.h:245
U_RIGHT_TO_LEFT_ISOLATE
@ U_RIGHT_TO_LEFT_ISOLATE
RLI.
Definition: uchar.h:920
UBLOCK_BENGALI
@ UBLOCK_BENGALI
Definition: uchar.h:1027
UBLOCK_PHAISTOS_DISC
@ UBLOCK_PHAISTOS_DISC
Definition: uchar.h:1442
U_PRIVATE_USE_CHAR
@ U_PRIVATE_USE_CHAR
Co.
Definition: uchar.h:718
UBLOCK_NO_BLOCK
@ UBLOCK_NO_BLOCK
New No_Block value in Unicode 4.
Definition: uchar.h:976
UBLOCK_HIRAGANA
@ UBLOCK_HIRAGANA
Definition: uchar.h:1168
UBLOCK_IDEOGRAPHIC_SYMBOLS_AND_PUNCTUATION
@ UBLOCK_IDEOGRAPHIC_SYMBOLS_AND_PUNCTUATION
Definition: uchar.h:1662
UJoiningType
UJoiningType
Joining Type constants.
Definition: uchar.h:1874
UCHAR_EXTENDED_PICTOGRAPHIC
@ UCHAR_EXTENDED_PICTOGRAPHIC
Binary property Extended_Pictographic.
Definition: uchar.h:455
UBLOCK_CYRILLIC_EXTENDED_A
@ UBLOCK_CYRILLIC_EXTENDED_A
Definition: uchar.h:1426
U_JG_MANICHAEAN_PE
@ U_JG_MANICHAEAN_PE
Definition: uchar.h:1984
u_getCombiningClass
uint8_t u_getCombiningClass(UChar32 c)
Returns the combining class of the code point as specified in UnicodeData.txt.
UCHAR_MATH
@ UCHAR_MATH
Binary property Math.
Definition: uchar.h:261
UCHAR_MASK_START
@ UCHAR_MASK_START
First constant for bit-mask Unicode properties.
Definition: uchar.h:567
U_JG_MANICHAEAN_LAMEDH
@ U_JG_MANICHAEAN_LAMEDH
Definition: uchar.h:1980
UCHAR_DIACRITIC
@ UCHAR_DIACRITIC
Binary property Diacritic.
Definition: uchar.h:204
u_isblank
UBool u_isblank(UChar32 c)
Determines whether the specified code point is a "blank" or "horizontal space", a character that visibly separates words on a line.
UBLOCK_ARABIC_EXTENDED_A
@ UBLOCK_ARABIC_EXTENDED_A
Definition: uchar.h:1539
UBLOCK_ORIYA
@ UBLOCK_ORIYA
Definition: uchar.h:1036
UBLOCK_BUGINESE
@ UBLOCK_BUGINESE
Definition: uchar.h:1362
UCHAR_IDEOGRAPHIC
@ UCHAR_IDEOGRAPHIC
Binary property Ideographic.
Definition: uchar.h:241
UPropertyNameChoice
UPropertyNameChoice
Selector constants for u_getPropertyName() and u_getPropertyValueName().
Definition: uchar.h:1814
UChar32
int32_t UChar32
Define UChar32 as a type for single Unicode code points.
Definition: umachine.h:400
UBLOCK_COMMON_INDIC_NUMBER_FORMS
@ UBLOCK_COMMON_INDIC_NUMBER_FORMS
Definition: uchar.h:1469
U_OTHER_NEUTRAL
@ U_OTHER_NEUTRAL
ON.
Definition: uchar.h:898
UBLOCK_GENERAL_PUNCTUATION
@ UBLOCK_GENERAL_PUNCTUATION
Definition: uchar.h:1099
UBLOCK_ENCLOSED_ALPHANUMERIC_SUPPLEMENT
@ UBLOCK_ENCLOSED_ALPHANUMERIC_SUPPLEMENT
Definition: uchar.h:1503
UCHAR_GRAPHEME_BASE
@ UCHAR_GRAPHEME_BASE
Binary property Grapheme_Base (new in Unicode 3.2).
Definition: uchar.h:216
U_JG_MANICHAEAN_GIMEL
@ U_JG_MANICHAEAN_GIMEL
Definition: uchar.h:1976
UBLOCK_MATHEMATICAL_OPERATORS
@ UBLOCK_MATHEMATICAL_OPERATORS
Definition: uchar.h:1123
UCHAR_ID_START
@ UCHAR_ID_START
Binary property ID_Start.
Definition: uchar.h:238
U_OTHER_LETTER
@ U_OTHER_LETTER
Lo.
Definition: uchar.h:694
UCHAR_QUOTATION_MARK
@ UCHAR_QUOTATION_MARK
Binary property Quotation_Mark.
Definition: uchar.h:267
UBLOCK_ALPHABETIC_PRESENTATION_FORMS
@ UBLOCK_ALPHABETIC_PRESENTATION_FORMS
Definition: uchar.h:1240
UCHAR_DEFAULT_IGNORABLE_CODE_POINT
@ UCHAR_DEFAULT_IGNORABLE_CODE_POINT
Binary property Default_Ignorable_Code_Point (new in Unicode 3.2).
Definition: uchar.h:198
U_DECIMAL_DIGIT_NUMBER
@ U_DECIMAL_DIGIT_NUMBER
Nd.
Definition: uchar.h:702
u_isdigit
UBool u_isdigit(UChar32 c)
Determines whether the specified code point is a digit character according to Java.
UErrorCode
UErrorCode
Error code to replace exception handling, so that the code is compatible with all C++ compilers, and to use the same mechanism for C and C++.
Definition: utypes.h:396
UBLOCK_SUPPLEMENTARY_PRIVATE_USE_AREA_A
@ UBLOCK_SUPPLEMENTARY_PRIVATE_USE_AREA_A
Definition: uchar.h:1316
UBLOCK_PALMYRENE
@ UBLOCK_PALMYRENE
Definition: uchar.h:1610
UBLOCK_TANGUT_COMPONENTS
@ UBLOCK_TANGUT_COMPONENTS
Definition: uchar.h:1674
U_SPACE_SEPARATOR
@ U_SPACE_SEPARATOR
Zs.
Definition: uchar.h:708
UBLOCK_LYDIAN
@ UBLOCK_LYDIAN
Definition: uchar.h:1448
UBLOCK_CJK_COMPATIBILITY_FORMS
@ UBLOCK_CJK_COMPATIBILITY_FORMS
Definition: uchar.h:1249
UCharDirection
UCharDirection
This specifies the language directional property of a character set.
Definition: uchar.h:869
UBLOCK_TIFINAGH
@ UBLOCK_TIFINAGH
Definition: uchar.h:1392
U_SB_COUNT
@ U_SB_COUNT
One more than the highest normal USentenceBreak value.
Definition: uchar.h:2178
U_GCB_ZWJ
@ U_GCB_ZWJ
Definition: uchar.h:2066
UCHAR_BINARY_START
@ UCHAR_BINARY_START
First constant for binary Unicode properties.
Definition: uchar.h:181
UCHAR_CHANGES_WHEN_LOWERCASED
@ UCHAR_CHANGES_WHEN_LOWERCASED
Binary property Changes_When_Lowercased.
Definition: uchar.h:393
UBLOCK_MASARAM_GONDI
@ UBLOCK_MASARAM_GONDI
Definition: uchar.h:1683
UCHAR_EMOJI_MODIFIER_BASE
@ UCHAR_EMOJI_MODIFIER_BASE
Binary property Emoji_Modifier_Base.
Definition: uchar.h:431
U_JG_MANICHAEAN_SAMEKH
@ U_JG_MANICHAEAN_SAMEKH
Definition: uchar.h:1988
UBLOCK_GEORGIAN
@ UBLOCK_GEORGIAN
Definition: uchar.h:1066
UBLOCK_KATAKANA_PHONETIC_EXTENSIONS
@ UBLOCK_KATAKANA_PHONETIC_EXTENSIONS
Definition: uchar.h:1312
u_isIDIgnorable
UBool u_isIDIgnorable(UChar32 c)
Determines if the specified character should be regarded as an ignorable character in an identifier, according to Java.
UBLOCK_KANNADA
@ UBLOCK_KANNADA
Definition: uchar.h:1045
u_charMirror
UChar32 u_charMirror(UChar32 c)
Maps the specified character to a "mirror-image" character.
UBLOCK_SUNDANESE
@ UBLOCK_SUNDANESE
Definition: uchar.h:1420
UBLOCK_HANGUL_JAMO_EXTENDED_A
@ UBLOCK_HANGUL_JAMO_EXTENDED_A
Definition: uchar.h:1473
UBLOCK_COMBINING_DIACRITICAL_MARKS
@ UBLOCK_COMBINING_DIACRITICAL_MARKS
Definition: uchar.h:997
U_EUROPEAN_NUMBER_SEPARATOR
@ U_EUROPEAN_NUMBER_SEPARATOR
ES.
Definition: uchar.h:884
UCHAR_HANGUL_SYLLABLE_TYPE
@ UCHAR_HANGUL_SYLLABLE_TYPE
Enumerated property Hangul_Syllable_Type, new in Unicode 4.
Definition: uchar.h:502
U_GCB_PREPEND
@ U_GCB_PREPEND
Definition: uchar.h:2054
UBLOCK_SMALL_FORM_VARIANTS
@ UBLOCK_SMALL_FORM_VARIANTS
Definition: uchar.h:1252
UCHAR_NFD_INERT
@ UCHAR_NFD_INERT
Binary property NFD_Inert.
Definition: uchar.h:320
UBLOCK_RUMI_NUMERAL_SYMBOLS
@ UBLOCK_RUMI_NUMERAL_SYMBOLS
Definition: uchar.h:1497
UBLOCK_BRAHMI
@ UBLOCK_BRAHMI
Definition: uchar.h:1518
ublock_getCode
UBlockCode ublock_getCode(UChar32 c)
Returns the Unicode allocation block that contains the character.
UCHAR_NUMERIC_TYPE
@ UCHAR_NUMERIC_TYPE
Enumerated property Numeric_Type.
Definition: uchar.h:496
U_JG_MANICHAEAN_TEN
@ U_JG_MANICHAEAN_TEN
Definition: uchar.h:1990
UBLOCK_OL_CHIKI
@ UBLOCK_OL_CHIKI
Definition: uchar.h:1424
UBLOCK_MEROITIC_HIEROGLYPHS
@ UBLOCK_MEROITIC_HIEROGLYPHS
Definition: uchar.h:1549
UBLOCK_THAANA
@ UBLOCK_THAANA
Definition: uchar.h:1021
UBLOCK_KAYAH_LI
@ UBLOCK_KAYAH_LI
Definition: uchar.h:1434
UBLOCK_ETHIOPIC_EXTENDED_A
@ UBLOCK_ETHIOPIC_EXTENDED_A
Definition: uchar.h:1516
U_JG_MALAYALAM_LLA
@ U_JG_MALAYALAM_LLA
Definition: uchar.h:2004
U_LB_INSEPARABLE
@ U_LB_INSEPARABLE
Renamed from the misspelled "inseperable" in Unicode 4.0.1/ICU 3.0.
Definition: uchar.h:2211
U_DIR_NON_SPACING_MARK
@ U_DIR_NON_SPACING_MARK
NSM.
Definition: uchar.h:912
U_LB_H3
@ U_LB_H3
Definition: uchar.h:2233
UBLOCK_ORNAMENTAL_DINGBATS
@ UBLOCK_ORNAMENTAL_DINGBATS
Definition: uchar.h:1606
UCHAR_GRAPHEME_CLUSTER_BREAK
@ UCHAR_GRAPHEME_CLUSTER_BREAK
Enumerated property Grapheme_Cluster_Break (new in Unicode 4.1).
Definition: uchar.h:533
U_JG_MANICHAEAN_MEM
@ U_JG_MANICHAEAN_MEM
Definition: uchar.h:1981
UGraphemeClusterBreak
UGraphemeClusterBreak
Grapheme Cluster Break constants.
Definition: uchar.h:2034
u_charFromName
UChar32 u_charFromName(UCharNameChoice nameChoice, const char *name, UErrorCode *pErrorCode)
Find a Unicode character by its name and return its code point value.
UCHAR_LOWERCASE_MAPPING
@ UCHAR_LOWERCASE_MAPPING
String property Lowercase_Mapping.
Definition: uchar.h:607
U_LEFT_TO_RIGHT_OVERRIDE
@ U_LEFT_TO_RIGHT_OVERRIDE
LRO.
Definition: uchar.h:902
U_MODIFIER_SYMBOL
@ U_MODIFIER_SYMBOL
Sk.
Definition: uchar.h:736
UBLOCK_NABATAEAN
@ UBLOCK_NABATAEAN
Definition: uchar.h:1600
U_BPT_CLOSE
@ U_BPT_CLOSE
Close paired bracket.
Definition: uchar.h:952
UCHAR_POSIX_PRINT
@ UCHAR_POSIX_PRINT
Binary property print (a C/POSIX character class).
Definition: uchar.h:382
UBLOCK_LATIN_EXTENDED_C
@ UBLOCK_LATIN_EXTENDED_C
Definition: uchar.h:1403
UBLOCK_ETHIOPIC_EXTENDED
@ UBLOCK_ETHIOPIC_EXTENDED
Definition: uchar.h:1370
U_WB_WSEGSPACE
@ U_WB_WSEGSPACE
Definition: uchar.h:2130
U_JG_MANICHAEAN_YODH
@ U_JG_MANICHAEAN_YODH
Definition: uchar.h:1995
UBLOCK_INDIC_SIYAQ_NUMBERS
@ UBLOCK_INDIC_SIYAQ_NUMBERS
Definition: uchar.h:1706
UBLOCK_SYRIAC
@ UBLOCK_SYRIAC
Definition: uchar.h:1018
U_WB_EXTEND
@ U_WB_EXTEND
Definition: uchar.h:2104
UBLOCK_SUPPLEMENTAL_ARROWS_C
@ UBLOCK_SUPPLEMENTAL_ARROWS_C
Definition: uchar.h:1622
U_RIGHT_TO_LEFT
@ U_RIGHT_TO_LEFT
R.
Definition: uchar.h:880
USentenceBreak
USentenceBreak
Sentence Break constants.
Definition: uchar.h:2149
u_getPropertyValueName
const char * u_getPropertyValueName(UProperty property, int32_t value, UPropertyNameChoice nameChoice)
Return the Unicode name for a given property value, as given in the Unicode database file PropertyValueAliases.txt.
UCHAR_JOINING_GROUP
@ UCHAR_JOINING_GROUP
Enumerated property Joining_Group.
Definition: uchar.h:487
UBLOCK_KANA_SUPPLEMENT
@ UBLOCK_KANA_SUPPLEMENT
Definition: uchar.h:1522
UBLOCK_BASIC_LATIN
@ UBLOCK_BASIC_LATIN
Definition: uchar.h:979
U_CONNECTOR_PUNCTUATION
@ U_CONNECTOR_PUNCTUATION
Pc.
Definition: uchar.h:728
UCharCategory
UCharCategory
Data for enumerated Unicode general category types.
Definition: uchar.h:672
UCHAR_NFKC_QUICK_CHECK
@ UCHAR_NFKC_QUICK_CHECK
Enumerated property NFKC_Quick_Check.
Definition: uchar.h:514
u_isJavaSpaceChar
UBool u_isJavaSpaceChar(UChar32 c)
Determine if the specified code point is a space character according to Java.
U_LEFT_TO_RIGHT_EMBEDDING
@ U_LEFT_TO_RIGHT_EMBEDDING
LRE.
Definition: uchar.h:900
UCHAR_WORD_BREAK
@ UCHAR_WORD_BREAK
Enumerated property Word_Break (new in Unicode 4.1).
Definition: uchar.h:543
UCHAR_DOUBLE_START
@ UCHAR_DOUBLE_START
First constant for double Unicode properties.
Definition: uchar.h:580
UCHAR_CHANGES_WHEN_NFKC_CASEFOLDED
@ UCHAR_CHANGES_WHEN_NFKC_CASEFOLDED
Binary property Changes_When_NFKC_Casefolded.
Definition: uchar.h:403
U_JG_MANICHAEAN_FIVE
@ U_JG_MANICHAEAN_FIVE
Definition: uchar.h:1975
UBLOCK_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_E
@ UBLOCK_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_E
Definition: uchar.h:1637
u_foldCase
UChar32 u_foldCase(UChar32 c, uint32_t options)
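The given character is mapped to its case folding equivalent according to UnicodeData.txt and CaseFolding.txt; if the character has no case folding equivalent, the character itself is returned.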
UBLOCK_CAUCASIAN_ALBANIAN
@ UBLOCK_CAUCASIAN_ALBANIAN
Definition: uchar.h:1566
U_POP_DIRECTIONAL_FORMAT
@ U_POP_DIRECTIONAL_FORMAT
PDF.
Definition: uchar.h:910
U_CDECL_END
#define U_CDECL_END
Definition: umachine.h:85
UCHAR_CASED
@ UCHAR_CASED
Binary property Cased.
Definition: uchar.h:389
UBLOCK_MRO
@ UBLOCK_MRO
Definition: uchar.h:1596
U_JG_HANIFI_ROHINGYA_KINNA_YA
@ U_JG_HANIFI_ROHINGYA_KINNA_YA
Definition: uchar.h:2014
U_CDECL_BEGIN
#define U_CDECL_BEGIN
Definition: umachine.h:84
UBLOCK_ANATOLIAN_HIEROGLYPHS
@ UBLOCK_ANATOLIAN_HIEROGLYPHS
Definition: uchar.h:1633
UBLOCK_HANUNOO
@ UBLOCK_HANUNOO
Definition: uchar.h:1296
UBLOCK_BYZANTINE_MUSICAL_SYMBOLS
@ UBLOCK_BYZANTINE_MUSICAL_SYMBOLS
Definition: uchar.h:1272
UBLOCK_COMBINING_HALF_MARKS
@ UBLOCK_COMBINING_HALF_MARKS
Definition: uchar.h:1246
UCHAR_CHANGES_WHEN_CASEFOLDED
@ UCHAR_CHANGES_WHEN_CASEFOLDED
Binary property Changes_When_Casefolded.
Definition: uchar.h:399
UBLOCK_THAI
@ UBLOCK_THAI
Definition: uchar.h:1054
U_JG_MALAYALAM_TTA
@ U_JG_MALAYALAM_TTA
Definition: uchar.h:2012
UBLOCK_KATAKANA
@ UBLOCK_KATAKANA
Definition: uchar.h:1171
UBLOCK_ANCIENT_GREEK_MUSICAL_NOTATION
@ UBLOCK_ANCIENT_GREEK_MUSICAL_NOTATION
Definition: uchar.h:1356
U_CHAR_NAME_CHOICE_COUNT
@ U_CHAR_NAME_CHOICE_COUNT
One more than the highest normal UCharNameChoice value.
Definition: uchar.h:1797
UBLOCK_BOX_DRAWING
@ UBLOCK_BOX_DRAWING
Definition: uchar.h:1138
UCHAR_POSIX_ALNUM
@ UCHAR_POSIX_ALNUM
Binary property alnum (a C/POSIX character class).
Definition: uchar.h:367
u_isUWhiteSpace
UBool u_isUWhiteSpace(UChar32 c)
Check if a code point has the White_Space Unicode property.
UBLOCK_CHESS_SYMBOLS
@ UBLOCK_CHESS_SYMBOLS
Definition: uchar.h:1696
u_isJavaIDPart
UBool u_isJavaIDPart(UChar32 c)
Determines if the specified character is permissible in a Java identifier.
UBLOCK_VERTICAL_FORMS
@ UBLOCK_VERTICAL_FORMS
Definition: uchar.h:1394
U_GCB_E_BASE
@ U_GCB_E_BASE
Definition: uchar.h:2058
UBLOCK_AVESTAN
@ UBLOCK_AVESTAN
Definition: uchar.h:1489
UBLOCK_TAI_XUAN_JING_SYMBOLS
@ UBLOCK_TAI_XUAN_JING_SYMBOLS
Definition: uchar.h:1349
UCHAR_TRAIL_CANONICAL_COMBINING_CLASS
@ UCHAR_TRAIL_CANONICAL_COMBINING_CLASS
Enumerated property Trail_Canonical_Combining_Class.
Definition: uchar.h:528
UBLOCK_BATAK
@ UBLOCK_BATAK
Definition: uchar.h:1514
U_RIGHT_TO_LEFT_OVERRIDE
@ U_RIGHT_TO_LEFT_OVERRIDE
RLO.
Definition: uchar.h:908
UCHAR_DEPRECATED
@ UCHAR_DEPRECATED
Binary property Deprecated (new in Unicode 3.2).
Definition: uchar.h:201
U_BPT_NONE
@ U_BPT_NONE
Not a paired bracket.
Definition: uchar.h:948
UCHAR_UPPERCASE
@ UCHAR_UPPERCASE
Binary property Uppercase.
Definition: uchar.h:287
U_LB_JT
@ U_LB_JT
Definition: uchar.h:2237
UBLOCK_SYRIAC_SUPPLEMENT
@ UBLOCK_SYRIAC_SUPPLEMENT
Definition: uchar.h:1689
UBLOCK_LATIN_EXTENDED_A
@ UBLOCK_LATIN_EXTENDED_A
Definition: uchar.h:985
UDecompositionType
UDecompositionType
Decomposition Type constants.
Definition: uchar.h:1832
U_UPPERCASE_LETTER
@ U_UPPERCASE_LETTER
Lu.
Definition: uchar.h:686
UBLOCK_IMPERIAL_ARAMAIC
@ UBLOCK_IMPERIAL_ARAMAIC
Definition: uchar.h:1485
UBLOCK_GUJARATI
@ UBLOCK_GUJARATI
Definition: uchar.h:1033
u_toupper
UChar32 u_toupper(UChar32 c)
The given character is mapped to its uppercase equivalent according to UnicodeData.txt; if the character has no uppercase equivalent, the character itself is returned.
UBLOCK_TAI_THAM
@ UBLOCK_TAI_THAM
Definition: uchar.h:1461
U_LEFT_TO_RIGHT
@ U_LEFT_TO_RIGHT
L.
Definition: uchar.h:878
UBLOCK_PRIVATE_USE_AREA
@ UBLOCK_PRIVATE_USE_AREA
Same as UBLOCK_PRIVATE_USE.
Definition: uchar.h:1224
U_WB_E_BASE_GAZ
@ U_WB_E_BASE_GAZ
Definition: uchar.h:2122
U_START_PUNCTUATION
@ U_START_PUNCTUATION
Ps.
Definition: uchar.h:724
UBLOCK_GRANTHA
@ UBLOCK_GRANTHA
Definition: uchar.h:1578
U_LB_HEBREW_LETTER
@ U_LB_HEBREW_LETTER
Definition: uchar.h:2245
U_GENERAL_OTHER_TYPES
@ U_GENERAL_OTHER_TYPES
Cn "Other, Not Assigned (no characters in [UnicodeData.txt] have this property)" (same as U_UNASSIGNED!)
Definition: uchar.h:684
UBLOCK_HIGH_PRIVATE_USE_SURROGATES
@ UBLOCK_HIGH_PRIVATE_USE_SURROGATES
Definition: uchar.h:1210
U_JG_FE
@ U_JG_FE
Definition: uchar.h:1963
UBLOCK_INVALID_CODE
@ UBLOCK_INVALID_CODE
Definition: uchar.h:1729
UCHAR_S_TERM
@ UCHAR_S_TERM
Binary property STerm (new in Unicode 4.0.1).
Definition: uchar.h:307
UBLOCK_CHEROKEE
@ UBLOCK_CHEROKEE
Definition: uchar.h:1075
u_getPropertyEnum
UProperty u_getPropertyEnum(const char *alias)
Return the UProperty enum for a given property name, as specified in the Unicode database file PropertyAliases.txt.
U_UNASSIGNED
@ U_UNASSIGNED
Non-category for unassigned and non-character code points.
Definition: uchar.h:682
UCHAR_BIDI_CLASS
@ UCHAR_BIDI_CLASS
Enumerated property Bidi_Class.
Definition: uchar.h:466
U_JG_HANIFI_ROHINGYA_PA
@ U_JG_HANIFI_ROHINGYA_PA
Definition: uchar.h:2015
UCHAR_EMOJI
@ UCHAR_EMOJI
Binary property Emoji.
Definition: uchar.h:410
UBLOCK_SINHALA
@ UBLOCK_SINHALA
Definition: uchar.h:1051
U_JG_MALAYALAM_NNA
@ U_JG_MALAYALAM_NNA
Definition: uchar.h:2007
UBLOCK_SYLOTI_NAGRI
@ UBLOCK_SYLOTI_NAGRI
Definition: uchar.h:1390
u_istitle
UBool u_istitle(UChar32 c)
Determines whether the specified code point is a titlecase letter.
UBLOCK_MAYAN_NUMERALS
@ UBLOCK_MAYAN_NUMERALS
Definition: uchar.h:1710
UBLOCK_MEETEI_MAYEK
@ UBLOCK_MEETEI_MAYEK
Definition: uchar.h:1481
UCHAR_TERMINAL_PUNCTUATION
@ UCHAR_TERMINAL_PUNCTUATION
Binary property Terminal_Punctuation.
Definition: uchar.h:280
UBLOCK_MULTANI
@ UBLOCK_MULTANI
Definition: uchar.h:1643
UBLOCK_PSALTER_PAHLAVI
@ UBLOCK_PSALTER_PAHLAVI
Definition: uchar.h:1614
UBLOCK_OLD_ITALIC
@ UBLOCK_OLD_ITALIC
Definition: uchar.h:1266
UBLOCK_BAMUM_SUPPLEMENT
@ UBLOCK_BAMUM_SUPPLEMENT
Definition: uchar.h:1520
UCHAR_NFC_QUICK_CHECK
@ UCHAR_NFC_QUICK_CHECK
Enumerated property NFC_Quick_Check.
Definition: uchar.h:511
UBLOCK_CYRILLIC
@ UBLOCK_CYRILLIC
Definition: uchar.h:1006
UCHAR_JOIN_CONTROL
@ UCHAR_JOIN_CONTROL
Binary property Join_Control.
Definition: uchar.h:252
UBLOCK_ALCHEMICAL_SYMBOLS
@ UBLOCK_ALCHEMICAL_SYMBOLS
Definition: uchar.h:1532
UBLOCK_MUSICAL_SYMBOLS
@ UBLOCK_MUSICAL_SYMBOLS
Definition: uchar.h:1274
UBLOCK_BRAILLE_PATTERNS
@ UBLOCK_BRAILLE_PATTERNS
Definition: uchar.h:1153
U_JG_MALAYALAM_BHA
@ U_JG_MALAYALAM_BHA
Definition: uchar.h:2002
U_JG_MANICHAEAN_TETH
@ U_JG_MANICHAEAN_TETH
Definition: uchar.h:1991
u_isprint
UBool u_isprint(UChar32 c)
Determines whether the specified code point is a printable character.
UCHAR_SCRIPT
@ UCHAR_SCRIPT
Enumerated property Script.
Definition: uchar.h:499
UBLOCK_CUNEIFORM
@ UBLOCK_CUNEIFORM
Definition: uchar.h:1411
UBLOCK_CURRENCY_SYMBOLS
@ UBLOCK_CURRENCY_SYMBOLS
Definition: uchar.h:1105
U_GCB_E_BASE_GAZ
@ U_GCB_E_BASE_GAZ
Definition: uchar.h:2060
UCHAR_SOFT_DOTTED
@ UCHAR_SOFT_DOTTED
Binary property Soft_Dotted (new in Unicode 3.2).
Definition: uchar.h:276
UBLOCK_BLOCK_ELEMENTS
@ UBLOCK_BLOCK_ELEMENTS
Definition: uchar.h:1141
UBLOCK_VARIATION_SELECTORS_SUPPLEMENT
@ UBLOCK_VARIATION_SELECTORS_SUPPLEMENT
Definition: uchar.h:1351
UCharEnumTypeRange
UBool UCharEnumTypeRange(const void *context, UChar32 start, UChar32 limit, UCharCategory type)
Callback from u_enumCharTypes(), is called for each contiguous range of code points c (where start<=c<limit) with the same Unicode general category ("character type").
Definition: uchar.h:3071
UBLOCK_ENCLOSED_CJK_LETTERS_AND_MONTHS
@ UBLOCK_ENCLOSED_CJK_LETTERS_AND_MONTHS
Definition: uchar.h:1186
UCHAR_GENERAL_CATEGORY
@ UCHAR_GENERAL_CATEGORY
Enumerated property General_Category.
Definition: uchar.h:484
UCHAR_PREPENDED_CONCATENATION_MARK
@ UCHAR_PREPENDED_CONCATENATION_MARK
Binary property Prepended_Concatenation_Mark.
Definition: uchar.h:448
U_BPT_OPEN
@ U_BPT_OPEN
Open paired bracket.
Definition: uchar.h:950
UBLOCK_MISCELLANEOUS_SYMBOLS_AND_ARROWS
@ UBLOCK_MISCELLANEOUS_SYMBOLS_AND_ARROWS
Definition: uchar.h:1331
U_WB_HEBREW_LETTER
@ U_WB_HEBREW_LETTER
Definition: uchar.h:2114
u_isxdigit
UBool u_isxdigit(UChar32 c)
Determines whether the specified code point is a hexadecimal digit.
UCHAR_EAST_ASIAN_WIDTH
@ UCHAR_EAST_ASIAN_WIDTH
Enumerated property East_Asian_Width.
Definition: uchar.h:481
U_JG_AFRICAN_FEH
@ U_JG_AFRICAN_FEH
Definition: uchar.h:1998
U_LB_CONDITIONAL_JAPANESE_STARTER
@ U_LB_CONDITIONAL_JAPANESE_STARTER
Definition: uchar.h:2243
UWordBreakValues
UWordBreakValues
Word Break constants.
Definition: uchar.h:2086
U_JG_MANICHAEAN_SADHE
@ U_JG_MANICHAEAN_SADHE
Definition: uchar.h:1987
U_END_PUNCTUATION
@ U_END_PUNCTUATION
Pe.
Definition: uchar.h:726
UBLOCK_PAU_CIN_HAU
@ UBLOCK_PAU_CIN_HAU
Definition: uchar.h:1612
UBLOCK_SINHALA_ARCHAIC_NUMBERS
@ UBLOCK_SINHALA_ARCHAIC_NUMBERS
Definition: uchar.h:1620
UBLOCK_ETHIOPIC
@ UBLOCK_ETHIOPIC
Definition: uchar.h:1072
U_MATH_SYMBOL
@ U_MATH_SYMBOL
Sm.
Definition: uchar.h:732
UBLOCK_HALFWIDTH_AND_FULLWIDTH_FORMS
@ UBLOCK_HALFWIDTH_AND_FULLWIDTH_FORMS
Definition: uchar.h:1261
UCHAR_SIMPLE_LOWERCASE_MAPPING
@ UCHAR_SIMPLE_LOWERCASE_MAPPING
String property Simple_Lowercase_Mapping.
Definition: uchar.h:616
UBLOCK_CHAKMA
@ UBLOCK_CHAKMA
Definition: uchar.h:1543
UCHAR_CHANGES_WHEN_TITLECASED
@ UCHAR_CHANGES_WHEN_TITLECASED
Binary property Changes_When_Titlecased.
Definition: uchar.h:397
UEastAsianWidth
UEastAsianWidth
East Asian Width constants.
Definition: uchar.h:1742
u_isIDPart
UBool u_isIDPart(UChar32 c)
Determines if the specified character is permissible in an identifier according to Java.
U_GCB_E_MODIFIER
@ U_GCB_E_MODIFIER
Definition: uchar.h:2062
UBLOCK_SHAVIAN
@ UBLOCK_SHAVIAN
Definition: uchar.h:1343
u_isgraph
UBool u_isgraph(UChar32 c)
Determines whether the specified code point is a "graphic" character (printable, excluding spaces).
UBLOCK_DEVANAGARI_EXTENDED
@ UBLOCK_DEVANAGARI_EXTENDED
Definition: uchar.h:1471
U_INITIAL_PUNCTUATION
@ U_INITIAL_PUNCTUATION
Pi.
Definition: uchar.h:740
U_GCB_SPACING_MARK
@ U_GCB_SPACING_MARK
Definition: uchar.h:2052
UBLOCK_MISCELLANEOUS_MATHEMATICAL_SYMBOLS_B
@ UBLOCK_MISCELLANEOUS_MATHEMATICAL_SYMBOLS_B
Definition: uchar.h:1308
UBLOCK_LATIN_EXTENDED_ADDITIONAL
@ UBLOCK_LATIN_EXTENDED_ADDITIONAL
Definition: uchar.h:1093
u_ispunct
UBool u_ispunct(UChar32 c)
Determines whether the specified code point is a punctuation character.
UBLOCK_PHONETIC_EXTENSIONS_SUPPLEMENT
@ UBLOCK_PHONETIC_EXTENSIONS_SUPPLEMENT
Definition: uchar.h:1386
UBLOCK_KHAROSHTHI
@ UBLOCK_KHAROSHTHI
Definition: uchar.h:1378
U_JG_MANICHAEAN_TWENTY
@ U_JG_MANICHAEAN_TWENTY
Definition: uchar.h:1993
UBLOCK_ELBASAN
@ UBLOCK_ELBASAN
Definition: uchar.h:1574
UBLOCK_BASSA_VAH
@ UBLOCK_BASSA_VAH
Definition: uchar.h:1564
UBLOCK_TAMIL
@ UBLOCK_TAMIL
Definition: uchar.h:1039
U_JG_MANICHAEAN_HUNDRED
@ U_JG_MANICHAEAN_HUNDRED
Definition: uchar.h:1978
UBLOCK_TAGS
@ UBLOCK_TAGS
Definition: uchar.h:1282
UBLOCK_MYANMAR
@ UBLOCK_MYANMAR
Definition: uchar.h:1063
UBLOCK_LATIN_1_SUPPLEMENT
@ UBLOCK_LATIN_1_SUPPLEMENT
Definition: uchar.h:982
UBLOCK_LATIN_EXTENDED_B
@ UBLOCK_LATIN_EXTENDED_B
Definition: uchar.h:988
UBLOCK_ENCLOSED_ALPHANUMERICS
@ UBLOCK_ENCLOSED_ALPHANUMERICS
Definition: uchar.h:1135
UCHAR_INT_LIMIT
@ UCHAR_INT_LIMIT
One more than the last constant for enumerated/integer Unicode properties.
Definition: uchar.h:554
UBLOCK_LINEAR_B_SYLLABARY
@ UBLOCK_LINEAR_B_SYLLABARY
Definition: uchar.h:1335
UCHAR_EMOJI_PRESENTATION
@ UCHAR_EMOJI_PRESENTATION
Binary property Emoji_Presentation.
Definition: uchar.h:417
UBLOCK_GLAGOLITIC_SUPPLEMENT
@ UBLOCK_GLAGOLITIC_SUPPLEMENT
Definition: uchar.h:1660
U_JG_MALAYALAM_RA
@ U_JG_MALAYALAM_RA
Definition: uchar.h:2010
UCHAR_STRING_START
@ UCHAR_STRING_START
First constant for string Unicode properties.
Definition: uchar.h:593
U_CONTROL_CHAR
@ U_CONTROL_CHAR
Cc.
Definition: uchar.h:714
UBLOCK_LINEAR_B_IDEOGRAMS
@ UBLOCK_LINEAR_B_IDEOGRAMS
Definition: uchar.h:1337
U_JG_MANICHAEAN_DALETH
@ U_JG_MANICHAEAN_DALETH
Definition: uchar.h:1973
UBLOCK_GEORGIAN_SUPPLEMENT
@ UBLOCK_GEORGIAN_SUPPLEMENT
Definition: uchar.h:1374
UBLOCK_OLD_SOGDIAN
@ UBLOCK_OLD_SOGDIAN
Definition: uchar.h:1714
UBLOCK_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_B
@ UBLOCK_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_B
Definition: uchar.h:1278
UBLOCK_COPTIC
@ UBLOCK_COPTIC
Definition: uchar.h:1368
U_UNICODE_CHAR_NAME
@ U_UNICODE_CHAR_NAME
Unicode character name (Name property).
Definition: uchar.h:1779
u_getPropertyName
const char * u_getPropertyName(UProperty property, UPropertyNameChoice nameChoice)
Return the Unicode name for a given property, as given in the Unicode database file PropertyAliases.txt.
UBLOCK_HANGUL_JAMO_EXTENDED_B
@ UBLOCK_HANGUL_JAMO_EXTENDED_B
Definition: uchar.h:1483
UBLOCK_INSCRIPTIONAL_PAHLAVI
@ UBLOCK_INSCRIPTIONAL_PAHLAVI
Definition: uchar.h:1493
UBLOCK_SUPPLEMENTAL_PUNCTUATION
@ UBLOCK_SUPPLEMENTAL_PUNCTUATION
Definition: uchar.h:1388
U_JG_BURUSHASKI_YEH_BARREE
@ U_JG_BURUSHASKI_YEH_BARREE
Definition: uchar.h:1966
UCHAR_SEGMENT_STARTER
@ UCHAR_SEGMENT_STARTER
Binary property Segment_Starter.
Definition: uchar.h:352
UBLOCK_SHARADA
@ UBLOCK_SHARADA
Definition: uchar.h:1553
UBLOCK_OLD_PERSIAN
@ UBLOCK_OLD_PERSIAN
Definition: uchar.h:1384
UBLOCK_KHOJKI
@ UBLOCK_KHOJKI
Definition: uchar.h:1580
UBLOCK_YI_RADICALS
@ UBLOCK_YI_RADICALS
Definition: uchar.h:1201
UBLOCK_DOMINO_TILES
@ UBLOCK_DOMINO_TILES
Definition: uchar.h:1452
U_LB_E_BASE
@ U_LB_E_BASE
Definition: uchar.h:2249
U_JG_KHAPH
@ U_JG_KHAPH
Definition: uchar.h:1964
UCHAR_NFKD_QUICK_CHECK
@ UCHAR_NFKD_QUICK_CHECK
Enumerated property NFKD_Quick_Check.
Definition: uchar.h:508
U_LB_COUNT
@ U_LB_COUNT
One more than the highest normal ULineBreak value.
Definition: uchar.h:2261
U_EA_COUNT
@ U_EA_COUNT
One more than the highest normal UEastAsianWidth value.
Definition: uchar.h:1762
u_isISOControl
UBool u_isISOControl(UChar32 c)
Determines whether the specified code point is an ISO control code.
UCHAR_VARIATION_SELECTOR
@ UCHAR_VARIATION_SELECTOR
Binary property Variation_Selector (new in Unicode 4.0.1).
Definition: uchar.h:313
UCHAR_ID_CONTINUE
@ UCHAR_ID_CONTINUE
Binary property ID_Continue.
Definition: uchar.h:234
UBLOCK_ARABIC_PRESENTATION_FORMS_A
@ UBLOCK_ARABIC_PRESENTATION_FORMS_A
Definition: uchar.h:1243
UBLOCK_TAI_VIET
@ UBLOCK_TAI_VIET
Definition: uchar.h:1479
U_HST_COUNT
@ U_HST_COUNT
One more than the highest normal UHangulSyllableType value.
Definition: uchar.h:2319
UBLOCK_SUPPLEMENTAL_MATHEMATICAL_OPERATORS
@ UBLOCK_SUPPLEMENTAL_MATHEMATICAL_OPERATORS
Definition: uchar.h:1310
U_DASH_PUNCTUATION
@ U_DASH_PUNCTUATION
Pd.
Definition: uchar.h:722
U_EXTENDED_CHAR_NAME
@ U_EXTENDED_CHAR_NAME
Standard or synthetic character name.
Definition: uchar.h:1789
UBLOCK_SIDDHAM
@ UBLOCK_SIDDHAM
Definition: uchar.h:1618
UCHAR_BIDI_CONTROL
@ UCHAR_BIDI_CONTROL
Binary property Bidi_Control.
Definition: uchar.h:187
U_STABLE
#define U_STABLE
This is used to declare a function as a stable public ICU C API.
Definition: umachine.h:111
UCHAR_PATTERN_SYNTAX
@ UCHAR_PATTERN_SYNTAX
Binary property Pattern_Syntax (new in Unicode 4.1).
Definition: uchar.h:357
U_JG_MANICHAEAN_ONE
@ U_JG_MANICHAEAN_ONE
Definition: uchar.h:1983
UCHAR_LOWERCASE
@ UCHAR_LOWERCASE
Binary property Lowercase.
Definition: uchar.h:259
u_isWhitespace
UBool u_isWhitespace(UChar32 c)
Determines if the specified code point is a whitespace character according to Java/ICU.
U_JG_MALAYALAM_JA
@ U_JG_MALAYALAM_JA
Definition: uchar.h:2003
UBLOCK_PAHAWH_HMONG
@ UBLOCK_PAHAWH_HMONG
Definition: uchar.h:1608
UBLOCK_MONGOLIAN
@ UBLOCK_MONGOLIAN
Definition: uchar.h:1090
UBLOCK_COUNTING_ROD_NUMERALS
@ UBLOCK_COUNTING_ROD_NUMERALS
Definition: uchar.h:1415
UBLOCK_OLD_NORTH_ARABIAN
@ UBLOCK_OLD_NORTH_ARABIAN
Definition: uchar.h:1602
UBLOCK_HANGUL_COMPATIBILITY_JAMO
@ UBLOCK_HANGUL_COMPATIBILITY_JAMO
Definition: uchar.h:1177
u_islower
UBool u_islower(UChar32 c)
Determines whether the specified code point has the general category "Ll" (lowercase letter).
UBLOCK_PHOENICIAN
@ UBLOCK_PHOENICIAN
Definition: uchar.h:1409
u_getIntPropertyMinValue
int32_t u_getIntPropertyMinValue(UProperty which)
Get the minimum value for an enumerated/integer/binary Unicode property.
UBLOCK_KANBUN
@ UBLOCK_KANBUN
Definition: uchar.h:1180
UBLOCK_MISCELLANEOUS_SYMBOLS_AND_PICTOGRAPHS
@ UBLOCK_MISCELLANEOUS_SYMBOLS_AND_PICTOGRAPHS
Definition: uchar.h:1526
U_WB_DOUBLE_QUOTE
@ U_WB_DOUBLE_QUOTE
Definition: uchar.h:2118
UBLOCK_BAMUM
@ UBLOCK_BAMUM
Definition: uchar.h:1467
UBLOCK_ARROWS
@ UBLOCK_ARROWS
Definition: uchar.h:1120
U_JG_MALAYALAM_LLLA
@ U_JG_MALAYALAM_LLLA
Definition: uchar.h:2005
UBLOCK_LATIN_EXTENDED_D
@ UBLOCK_LATIN_EXTENDED_D
Definition: uchar.h:1405
UBidiPairedBracketType
UBidiPairedBracketType
Bidi Paired Bracket Type constants.
Definition: uchar.h:940
UCHAR_BLOCK
@ UCHAR_BLOCK
Enumerated property Block.
Definition: uchar.h:471
U_JG_MANICHAEAN_HETH
@ U_JG_MANICHAEAN_HETH
Definition: uchar.h:1977
UBLOCK_GEOMETRIC_SHAPES
@ UBLOCK_GEOMETRIC_SHAPES
Definition: uchar.h:1144
UBLOCK_LEPCHA
@ UBLOCK_LEPCHA
Definition: uchar.h:1422
UCHAR_FULL_COMPOSITION_EXCLUSION
@ UCHAR_FULL_COMPOSITION_EXCLUSION
Binary property Full_Composition_Exclusion.
Definition: uchar.h:212
UCHAR_STRING_LIMIT
@ UCHAR_STRING_LIMIT
One more than the last constant for string Unicode properties.
Definition: uchar.h:644
u_charDigitValue
int32_t u_charDigitValue(UChar32 c)
Returns the decimal digit value of a decimal digit character.
UBLOCK_KHMER
@ UBLOCK_KHMER
Definition: uchar.h:1087
U_JG_MANICHAEAN_AYIN
@ U_JG_MANICHAEAN_AYIN
Definition: uchar.h:1971
UBLOCK_CYRILLIC_SUPPLEMENTARY
@ UBLOCK_CYRILLIC_SUPPLEMENTARY
Unicode 4.0.1 renames the "Cyrillic Supplementary" block to "Cyrillic Supplement".
Definition: uchar.h:1292
UChar
uint16_t UChar
Definition: umachine.h:353
U_JG_MALAYALAM_SSA
@ U_JG_MALAYALAM_SSA
Definition: uchar.h:2011
u_totitle
UChar32 u_totitle(UChar32 c)
The given character is mapped to its titlecase equivalent according to UnicodeData.txt; if none is defined, the character itself is returned.
UCHAR_OTHER_PROPERTY_START
@ UCHAR_OTHER_PROPERTY_START
First constant for Unicode properties with unusual value types.
Definition: uchar.h:654
UCHAR_OTHER_PROPERTY_LIMIT
@ UCHAR_OTHER_PROPERTY_LIMIT
One more than the last constant for Unicode properties with unusual value types.
Definition: uchar.h:660
U_BPT_COUNT
@ U_BPT_COUNT
One more than the highest normal UBidiPairedBracketType value.
Definition: uchar.h:960
U_JG_MANICHAEAN_THAMEDH
@ U_JG_MANICHAEAN_THAMEDH
Definition: uchar.h:1992
UVersionInfo
uint8_t UVersionInfo[U_MAX_VERSION_LENGTH]
The binary form of a version on ICU APIs is an array of 4 uint8_t.
Definition: uversion.h:59
U_JG_MANICHAEAN_BETH
@ U_JG_MANICHAEAN_BETH
Definition: uchar.h:1972
UBLOCK_LINEAR_A
@ UBLOCK_LINEAR_A
Definition: uchar.h:1586
UCHAR_UNIFIED_IDEOGRAPH
@ UCHAR_UNIFIED_IDEOGRAPH
Binary property Unified_Ideograph (new in Unicode 3.2).
Definition: uchar.h:284
UCHAR_SIMPLE_CASE_FOLDING
@ UCHAR_SIMPLE_CASE_FOLDING
String property Simple_Case_Folding.
Definition: uchar.h:613
UBLOCK_SUNDANESE_SUPPLEMENT
@ UBLOCK_SUNDANESE_SUPPLEMENT
Definition: uchar.h:1557
UCHAR_GRAPHEME_LINK
@ UCHAR_GRAPHEME_LINK
Binary property Grapheme_Link (new in Unicode 3.2).
Definition: uchar.h:223
u_forDigit
UChar32 u_forDigit(int32_t digit, int8_t radix)
Determines the character representation for a specific digit in the specified radix.
UCHAR_SCRIPT_EXTENSIONS
@ UCHAR_SCRIPT_EXTENSIONS
Miscellaneous property Script_Extensions (new in Unicode 6.0).
Definition: uchar.h:652
u_hasBinaryProperty
UBool u_hasBinaryProperty(UChar32 c, UProperty which)
Check a binary Unicode property for a code point.
UBLOCK_ARMENIAN
@ UBLOCK_ARMENIAN
Definition: uchar.h:1009
U_JG_MALAYALAM_NYA
@ U_JG_MALAYALAM_NYA
Definition: uchar.h:2009
UCHAR_LEAD_CANONICAL_COMBINING_CLASS
@ UCHAR_LEAD_CANONICAL_COMBINING_CLASS
Enumerated property Lead_Canonical_Combining_Class.
Definition: uchar.h:521
UBLOCK_GOTHIC
@ UBLOCK_GOTHIC
Definition: uchar.h:1268
u_getUnicodeVersion
void u_getUnicodeVersion(UVersionInfo versionArray)
Gets the Unicode version information.
u_isupper
UBool u_isupper(UChar32 c)
Determines whether the specified code point has the general category "Lu" (uppercase letter).
U_JG_MANICHAEAN_NUN
@ U_JG_MANICHAEAN_NUN
Definition: uchar.h:1982
UCHAR_HEX_DIGIT
@ UCHAR_HEX_DIGIT
Binary property Hex_Digit.
Definition: uchar.h:226
U_WB_CR
@ U_WB_CR
Definition: uchar.h:2102
ULineBreak
ULineBreak
Line Break constants.
Definition: uchar.h:2188
UCHAR_XID_START
@ UCHAR_XID_START
Binary property XID_Start.
Definition: uchar.h:298
UBLOCK_SPACING_MODIFIER_LETTERS
@ UBLOCK_SPACING_MODIFIER_LETTERS
Definition: uchar.h:994
UBLOCK_HEBREW
@ UBLOCK_HEBREW
Definition: uchar.h:1012
UCHAR_UNICODE_1_NAME
@ UCHAR_UNICODE_1_NAME
String property Unicode_1_Name.
Definition: uchar.h:631
U_JG_ZHAIN
@ U_JG_ZHAIN
Definition: uchar.h:1965
UBLOCK_CHAM
@ UBLOCK_CHAM
Definition: uchar.h:1438
UBLOCK_GLAGOLITIC
@ UBLOCK_GLAGOLITIC
Definition: uchar.h:1376
UBLOCK_MIAO
@ UBLOCK_MIAO
Definition: uchar.h:1551
UCHAR_BINARY_LIMIT
@ UCHAR_BINARY_LIMIT
One more than the last constant for binary Unicode properties.
Definition: uchar.h:461
UCHAR_PATTERN_WHITE_SPACE
@ UCHAR_PATTERN_WHITE_SPACE
Binary property Pattern_White_Space (new in Unicode 4.1).
Definition: uchar.h:362
UBLOCK_LISU
@ UBLOCK_LISU
Definition: uchar.h:1465
U_WB_SINGLE_QUOTE
@ U_WB_SINGLE_QUOTE
Definition: uchar.h:2116
UBLOCK_OLD_HUNGARIAN
@ UBLOCK_OLD_HUNGARIAN
Definition: uchar.h:1645
UBLOCK_CYRILLIC_SUPPLEMENT
@ UBLOCK_CYRILLIC_SUPPLEMENT
Definition: uchar.h:1287
U_JG_MANICHAEAN_ALEPH
@ U_JG_MANICHAEAN_ALEPH
Definition: uchar.h:1970
UBLOCK_MYANMAR_EXTENDED_B
@ UBLOCK_MYANMAR_EXTENDED_B
Definition: uchar.h:1598
UBLOCK_MAKASAR
@ UBLOCK_MAKASAR
Definition: uchar.h:1708
U_JG_FARSI_YEH
@ U_JG_FARSI_YEH
Definition: uchar.h:1967
U_FORMAT_CHAR
@ U_FORMAT_CHAR
Cf.
Definition: uchar.h:716
UBLOCK_CONTROL_PICTURES
@ UBLOCK_CONTROL_PICTURES
Definition: uchar.h:1129
UBLOCK_OPTICAL_CHARACTER_RECOGNITION
@ UBLOCK_OPTICAL_CHARACTER_RECOGNITION
Definition: uchar.h:1132
UBLOCK_GUNJALA_GONDI
@ UBLOCK_GUNJALA_GONDI
Definition: uchar.h:1702
UBLOCK_CJK_UNIFIED_IDEOGRAPHS
@ UBLOCK_CJK_UNIFIED_IDEOGRAPHS
Definition: uchar.h:1195
UCHAR_NAME
@ UCHAR_NAME
String property Name.
Definition: uchar.h:610
UBLOCK_CJK_RADICALS_SUPPLEMENT
@ UBLOCK_CJK_RADICALS_SUPPLEMENT
Definition: uchar.h:1156
UBLOCK_COPTIC_EPACT_NUMBERS
@ UBLOCK_COPTIC_EPACT_NUMBERS
Definition: uchar.h:1568
UJoiningGroup
UJoiningGroup
Joining Group constants.
Definition: uchar.h:1904
UBLOCK_CYRILLIC_EXTENDED_C
@ UBLOCK_CYRILLIC_EXTENDED_C
Definition: uchar.h:1658
UBLOCK_SAMARITAN
@ UBLOCK_SAMARITAN
Definition: uchar.h:1457
U_GCB_REGIONAL_INDICATOR
@ U_GCB_REGIONAL_INDICATOR
Definition: uchar.h:2056
UBLOCK_SUPERSCRIPTS_AND_SUBSCRIPTS
@ UBLOCK_SUPERSCRIPTS_AND_SUBSCRIPTS
Definition: uchar.h:1102
UCHAR_GRAPHEME_EXTEND
@ UCHAR_GRAPHEME_EXTEND
Binary property Grapheme_Extend (new in Unicode 3.2).
Definition: uchar.h:220
U_JT_COUNT
@ U_JT_COUNT
One more than the highest normal UJoiningType value.
Definition: uchar.h:1894
UBLOCK_KHMER_SYMBOLS
@ UBLOCK_KHMER_SYMBOLS
Definition: uchar.h:1327
UCharNameChoice
UCharNameChoice
Selector constants for u_charName().
Definition: uchar.h:1777
U_GCB_COUNT
@ U_GCB_COUNT
One more than the highest normal UGraphemeClusterBreak value.
Definition: uchar.h:2075
UBLOCK_TAGALOG
@ UBLOCK_TAGALOG
Definition: uchar.h:1294
UBLOCK_CJK_SYMBOLS_AND_PUNCTUATION
@ UBLOCK_CJK_SYMBOLS_AND_PUNCTUATION
Definition: uchar.h:1165
u_getNumericValue
double u_getNumericValue(UChar32 c)
Get the numeric value for a Unicode code point as defined in the Unicode Character Database.
U_JG_ROHINGYA_YEH
@ U_JG_ROHINGYA_YEH
Definition: uchar.h:1969
stringoptions.h
C API: Bit set option bit constants for various string and character processing functions.
U_BLOCK_SEPARATOR
@ U_BLOCK_SEPARATOR
B.
Definition: uchar.h:892
UNumericType
UNumericType
Numeric Type constants.
Definition: uchar.h:2271
UBLOCK_TAGBANWA
@ UBLOCK_TAGBANWA
Definition: uchar.h:1300
u_isIDStart
UBool u_isIDStart(UChar32 c)
Determines if the specified character is permissible as the first character in an identifier according to Unicode.
U_LB_JV
@ U_LB_JV
Definition: uchar.h:2239
U_JG_MANICHAEAN_KAPH
@ U_JG_MANICHAEAN_KAPH
Definition: uchar.h:1979
UBLOCK_YI_SYLLABLES
@ UBLOCK_YI_SYLLABLES
Definition: uchar.h:1198
UBLOCK_AHOM
@ UBLOCK_AHOM
Definition: uchar.h:1631
UBLOCK_PHONETIC_EXTENSIONS
@ UBLOCK_PHONETIC_EXTENSIONS
Definition: uchar.h:1329
UBLOCK_MODI
@ UBLOCK_MODI
Definition: uchar.h:1594
UBLOCK_HANGUL_JAMO
@ UBLOCK_HANGUL_JAMO
Definition: uchar.h:1069
U_SEGMENT_SEPARATOR
@ U_SEGMENT_SEPARATOR
S.
Definition: uchar.h:894
UBLOCK_LOW_SURROGATES
@ UBLOCK_LOW_SURROGATES
Definition: uchar.h:1213
U_WB_MIDNUMLET
@ U_WB_MIDNUMLET
Definition: uchar.h:2108
UBLOCK_MISCELLANEOUS_MATHEMATICAL_SYMBOLS_A
@ UBLOCK_MISCELLANEOUS_MATHEMATICAL_SYMBOLS_A
Definition: uchar.h:1302
U_BOUNDARY_NEUTRAL
@ U_BOUNDARY_NEUTRAL
BN.
Definition: uchar.h:914
UBLOCK_SUPPLEMENTAL_ARROWS_B
@ UBLOCK_SUPPLEMENTAL_ARROWS_B
Definition: uchar.h:1306
UCHAR_CASE_SENSITIVE
@ UCHAR_CASE_SENSITIVE
Binary property Case_Sensitive.
Definition: uchar.h:302
U_RIGHT_TO_LEFT_EMBEDDING
@ U_RIGHT_TO_LEFT_EMBEDDING
RLE.
Definition: uchar.h:906
u_getFC_NFKC_Closure
int32_t u_getFC_NFKC_Closure(UChar32 c, UChar *dest, int32_t destCapacity, UErrorCode *pErrorCode)
Get the FC_NFKC_Closure property string for a character.
UBLOCK_WARANG_CITI
@ UBLOCK_WARANG_CITI
Definition: uchar.h:1626
UBLOCK_TIRHUTA
@ UBLOCK_TIRHUTA
Definition: uchar.h:1624
UBLOCK_KAITHI
@ UBLOCK_KAITHI
Definition: uchar.h:1499
u_isULowercase
UBool u_isULowercase(UChar32 c)
Check if a code point has the Lowercase Unicode property.
UBLOCK_MENDE_KIKAKUI
@ UBLOCK_MENDE_KIKAKUI
Definition: uchar.h:1592
UCHAR_EMOJI_COMPONENT
@ UCHAR_EMOJI_COMPONENT
Binary property Emoji_Component.
Definition: uchar.h:438
UBLOCK_MYANMAR_EXTENDED_A
@ UBLOCK_MYANMAR_EXTENDED_A
Definition: uchar.h:1477
UBLOCK_JAVANESE
@ UBLOCK_JAVANESE
Definition: uchar.h:1475
UBLOCK_TELUGU
@ UBLOCK_TELUGU
Definition: uchar.h:1042
U_OTHER_SYMBOL
@ U_OTHER_SYMBOL
So.
Definition: uchar.h:738
UCHAR_XID_CONTINUE
@ UCHAR_XID_CONTINUE
Binary property XID_Continue.
Definition: uchar.h:295
U_WB_E_MODIFIER
@ U_WB_E_MODIFIER
Definition: uchar.h:2124
UBLOCK_OSMANYA
@ UBLOCK_OSMANYA
Definition: uchar.h:1345
UBLOCK_HATRAN
@ UBLOCK_HATRAN
Definition: uchar.h:1641
UCHAR_NFC_INERT
@ UCHAR_NFC_INERT
Binary property NFC_Inert.
Definition: uchar.h:334