32 #if !defined(USET_DEFINED) && !defined(U_IN_DOXYGEN)
63 #define U_UNICODE_VERSION "14.0"
157 #define UCHAR_MIN_VALUE 0
167 #define UCHAR_MAX_VALUE 0x10ffff
173 #define U_MASK(x) ((uint32_t)1<<(x))
486 #ifndef U_HIDE_DRAFT_API
536 #endif // U_HIDE_DRAFT_API
537 #ifndef U_HIDE_DEPRECATED_API
543 #endif // U_HIDE_DEPRECATED_API
652 #ifndef U_HIDE_DEPRECATED_API
658 #endif // U_HIDE_DEPRECATED_API
671 #ifndef U_HIDE_DEPRECATED_API
677 #endif // U_HIDE_DEPRECATED_API
684 #ifndef U_HIDE_DEPRECATED_API
690 #endif // U_HIDE_DEPRECATED_API
703 #ifndef U_HIDE_DEPRECATED_API
729 #ifndef U_HIDE_DEPRECATED_API
742 #ifndef U_HIDE_DEPRECATED_API
748 #endif // U_HIDE_DEPRECATED_API
758 #ifndef U_HIDE_DEPRECATED_API
764 #endif // U_HIDE_DEPRECATED_API
870 #define U_GC_CN_MASK U_MASK(U_GENERAL_OTHER_TYPES)
873 #define U_GC_LU_MASK U_MASK(U_UPPERCASE_LETTER)
875 #define U_GC_LL_MASK U_MASK(U_LOWERCASE_LETTER)
877 #define U_GC_LT_MASK U_MASK(U_TITLECASE_LETTER)
879 #define U_GC_LM_MASK U_MASK(U_MODIFIER_LETTER)
881 #define U_GC_LO_MASK U_MASK(U_OTHER_LETTER)
884 #define U_GC_MN_MASK U_MASK(U_NON_SPACING_MARK)
886 #define U_GC_ME_MASK U_MASK(U_ENCLOSING_MARK)
888 #define U_GC_MC_MASK U_MASK(U_COMBINING_SPACING_MARK)
891 #define U_GC_ND_MASK U_MASK(U_DECIMAL_DIGIT_NUMBER)
893 #define U_GC_NL_MASK U_MASK(U_LETTER_NUMBER)
895 #define U_GC_NO_MASK U_MASK(U_OTHER_NUMBER)
898 #define U_GC_ZS_MASK U_MASK(U_SPACE_SEPARATOR)
900 #define U_GC_ZL_MASK U_MASK(U_LINE_SEPARATOR)
902 #define U_GC_ZP_MASK U_MASK(U_PARAGRAPH_SEPARATOR)
905 #define U_GC_CC_MASK U_MASK(U_CONTROL_CHAR)
907 #define U_GC_CF_MASK U_MASK(U_FORMAT_CHAR)
909 #define U_GC_CO_MASK U_MASK(U_PRIVATE_USE_CHAR)
911 #define U_GC_CS_MASK U_MASK(U_SURROGATE)
914 #define U_GC_PD_MASK U_MASK(U_DASH_PUNCTUATION)
916 #define U_GC_PS_MASK U_MASK(U_START_PUNCTUATION)
918 #define U_GC_PE_MASK U_MASK(U_END_PUNCTUATION)
920 #define U_GC_PC_MASK U_MASK(U_CONNECTOR_PUNCTUATION)
922 #define U_GC_PO_MASK U_MASK(U_OTHER_PUNCTUATION)
925 #define U_GC_SM_MASK U_MASK(U_MATH_SYMBOL)
927 #define U_GC_SC_MASK U_MASK(U_CURRENCY_SYMBOL)
929 #define U_GC_SK_MASK U_MASK(U_MODIFIER_SYMBOL)
931 #define U_GC_SO_MASK U_MASK(U_OTHER_SYMBOL)
934 #define U_GC_PI_MASK U_MASK(U_INITIAL_PUNCTUATION)
936 #define U_GC_PF_MASK U_MASK(U_FINAL_PUNCTUATION)
940 #define U_GC_L_MASK \
941 (U_GC_LU_MASK|U_GC_LL_MASK|U_GC_LT_MASK|U_GC_LM_MASK|U_GC_LO_MASK)
944 #define U_GC_LC_MASK \
945 (U_GC_LU_MASK|U_GC_LL_MASK|U_GC_LT_MASK)
948 #define U_GC_M_MASK (U_GC_MN_MASK|U_GC_ME_MASK|U_GC_MC_MASK)
951 #define U_GC_N_MASK (U_GC_ND_MASK|U_GC_NL_MASK|U_GC_NO_MASK)
954 #define U_GC_Z_MASK (U_GC_ZS_MASK|U_GC_ZL_MASK|U_GC_ZP_MASK)
957 #define U_GC_C_MASK \
958 (U_GC_CN_MASK|U_GC_CC_MASK|U_GC_CF_MASK|U_GC_CO_MASK|U_GC_CS_MASK)
961 #define U_GC_P_MASK \
962 (U_GC_PD_MASK|U_GC_PS_MASK|U_GC_PE_MASK|U_GC_PC_MASK|U_GC_PO_MASK| \
963 U_GC_PI_MASK|U_GC_PF_MASK)
966 #define U_GC_S_MASK (U_GC_SM_MASK|U_GC_SC_MASK|U_GC_SK_MASK|U_GC_SO_MASK)
1026 #ifndef U_HIDE_DEPRECATED_API
1034 #endif // U_HIDE_DEPRECATED_API
1056 #ifndef U_HIDE_DEPRECATED_API
1064 #endif // U_HIDE_DEPRECATED_API
1888 #ifndef U_HIDE_DEPRECATED_API
1896 #endif // U_HIDE_DEPRECATED_API
1925 #ifndef U_HIDE_DEPRECATED_API
1933 #endif // U_HIDE_DEPRECATED_API
1950 #ifndef U_HIDE_DEPRECATED_API
1962 #ifndef U_HIDE_DEPRECATED_API
1968 #endif // U_HIDE_DEPRECATED_API
1985 U_SHORT_PROPERTY_NAME,
1986 U_LONG_PROPERTY_NAME,
1987 #ifndef U_HIDE_DEPRECATED_API
1993 #endif // U_HIDE_DEPRECATED_API
2027 #ifndef U_HIDE_DEPRECATED_API
2035 #endif // U_HIDE_DEPRECATED_API
2057 #ifndef U_HIDE_DEPRECATED_API
2065 #endif // U_HIDE_DEPRECATED_API
2081 U_JG_NO_JOINING_GROUP,
2190 #ifndef U_HIDE_DEPRECATED_API
2198 #endif // U_HIDE_DEPRECATED_API
2241 #ifndef U_HIDE_DEPRECATED_API
2249 #endif // U_HIDE_DEPRECATED_API
2273 U_WB_EXTENDNUMLET = 7,
2305 #ifndef U_HIDE_DEPRECATED_API
2313 #endif // U_HIDE_DEPRECATED_API
2343 U_SB_SCONTINUE = 14,
2344 #ifndef U_HIDE_DEPRECATED_API
2352 #endif // U_HIDE_DEPRECATED_API
2370 U_LB_ALPHABETIC = 2,
2371 U_LB_BREAK_BOTH = 3,
2372 U_LB_BREAK_AFTER = 4,
2373 U_LB_BREAK_BEFORE = 5,
2374 U_LB_MANDATORY_BREAK = 6,
2375 U_LB_CONTINGENT_BREAK = 7,
2376 U_LB_CLOSE_PUNCTUATION = 8,
2377 U_LB_COMBINING_MARK = 9,
2378 U_LB_CARRIAGE_RETURN = 10,
2379 U_LB_EXCLAMATION = 11,
2382 U_LB_IDEOGRAPHIC = 14,
2386 U_LB_INFIX_NUMERIC = 16,
2387 U_LB_LINE_FEED = 17,
2388 U_LB_NONSTARTER = 18,
2390 U_LB_OPEN_PUNCTUATION = 20,
2391 U_LB_POSTFIX_NUMERIC = 21,
2392 U_LB_PREFIX_NUMERIC = 22,
2393 U_LB_QUOTATION = 23,
2394 U_LB_COMPLEX_CONTEXT = 24,
2395 U_LB_SURROGATE = 25,
2397 U_LB_BREAK_SYMBOLS = 27,
2427 #ifndef U_HIDE_DEPRECATED_API
2435 #endif // U_HIDE_DEPRECATED_API
2455 #ifndef U_HIDE_DEPRECATED_API
2463 #endif // U_HIDE_DEPRECATED_API
2479 U_HST_NOT_APPLICABLE,
2482 U_HST_TRAILING_JAMO,
2485 #ifndef U_HIDE_DEPRECATED_API
2493 #endif // U_HIDE_DEPRECATED_API
2683 #ifndef U_HIDE_DRAFT_API
2712 #endif // U_HIDE_DRAFT_API
2939 #define U_NO_NUMERIC_VALUE ((double)-123456789.)
3449 #define U_GET_GC_MASK(c) U_MASK(u_charType(c))
3493 #if !UCONFIG_NO_NORMALIZATION
3579 char *buffer, int32_t bufferLength,
3582 #ifndef U_HIDE_DEPRECATED_API
3603 char *dest, int32_t destCapacity,
3714 U_CAPI const char* U_EXPORT2
3787 U_CAPI const char* U_EXPORT2
4137 #if !UCONFIG_NO_NORMALIZATION
uint8_t UVersionInfo[U_MAX_VERSION_LENGTH]
The binary form of a version on ICU APIs is an array of 4 uint8_t.
Binary property Ideographic.
Unicode 4.0.1 renames the "Cyrillic Supplementary" block to "Cyrillic Supplement".
Enumerated property Indic_Positional_Category.
Binary property Changes_When_Lowercased.
Binary property IDS_Binary_Operator (new in Unicode 3.2).
U_CAPI UBool u_isalnum(UChar32 c)
Determines whether the specified code point is an alphanumeric character (letter or digit) according ...
Binary property Case_Ignorable.
Enumerated property NFC_Quick_Check.
U_CAPI UBool u_isbase(UChar32 c)
Non-standard: Determines whether the specified code point is a base character.
One more than the highest normal UJoiningGroup value.
Miscellaneous property Script_Extensions (new in Unicode 6.0).
Same as UBLOCK_PRIVATE_USE_AREA.
First constant for enumerated/integer Unicode properties.
Binary property XID_Start.
Binary property Join_Control.
Binary property Logical_Order_Exception (new in Unicode 3.2).
struct UCPMap UCPMap
Abstract map from Unicode code points (U+0000..U+10FFFF) to integer values.
Binary property White_Space.
String property Titlecase_Mapping.
U_CAPI UBool u_isISOControl(UChar32 c)
Determines whether the specified code point is an ISO control code.
U_CAPI int32_t u_getIntPropertyValue(UChar32 c, UProperty which)
Get the property value for an enumerated or integer Unicode property for a code point.
#define U_CAPI
This is used to declare a function as a public ICU C API.
U_CAPI UBool u_isblank(UChar32 c)
Determines whether the specified code point is a "blank" or "horizontal space", a character that visi...
One more than the highest normal UPropertyNameChoice value.
U_CAPI UChar32 u_getBidiPairedBracket(UChar32 c)
Maps the specified character to its paired bracket character.
One more than the last constant for enumerated/integer Unicode properties.
Enumerated property Numeric_Type.
Binary property xdigit (a C/POSIX character class).
Binary property Alphabetic.
First constant for double Unicode properties.
C API: Bit set option bit constants for various string and character processing functions.
U_CAPI UBool u_isdefined(UChar32 c)
Determines whether the specified code point is "defined", which usually means that it is assigned a c...
UBool UEnumCharNamesFn(void *context, UChar32 code, UCharNameChoice nameChoice, const char *name, int32_t length)
Type of a callback function for u_enumCharNames() that gets called for each Unicode character with th...
Binary property of strings RGI_Emoji.
U_CAPI UChar32 u_totitle(UChar32 c)
The given character is mapped to its titlecase equivalent according to UnicodeData.txt; if none is defined, the character itself is returned.
U_CAPI UBool u_isspace(UChar32 c)
Determines if the specified character is a space character or not.
One more than the highest normal USentenceBreak value.
Binary property Emoji_Component.
Binary property of strings Emoji_Keycap_Sequence.
Cn "Other, Not Assigned (no characters in [UnicodeData.txt] have this property)" (same as U_UNASSIGNE...
U_CAPI UProperty u_getPropertyEnum(const char *alias)
Return the UProperty enum for a given property name, as specified in the Unicode database file Proper...
String property Simple_Case_Folding.
U_CAPI int32_t u_getFC_NFKC_Closure(UChar32 c, UChar *dest, int32_t destCapacity, UErrorCode *pErrorCode)
Get the FC_NFKC_Closure property string for a character.
Binary property NFC_Inert.
Binary property graph (a C/POSIX character class).
String property Bidi_Mirroring_Glyph.
One more than the last constant for bit-mask Unicode properties.
U_CAPI UBool u_isULowercase(UChar32 c)
Check if a code point has the Lowercase Unicode property.
Enumerated property Block.
Represents a nonexistent or invalid property or property value.
Renamed from the misspelled "inseperable" in Unicode 4.0.1/ICU 3.0.
Binary property Radical (new in Unicode 3.2).
UCharDirection
This specifies the language directional property of a character set.
Binary property IDS_Trinary_Operator (new in Unicode 3.2).
Binary property Grapheme_Link (new in Unicode 3.2).
Enumerated property Decomposition_Type.
Binary property Regional_Indicator.
U_CAPI UChar32 u_foldCase(UChar32 c, uint32_t options)
The given character is mapped to its case folding equivalent according to UnicodeData.txt and CaseFolding.txt; if the character has no case folding equivalent, the character itself is returned.
String property Case_Folding.
This file defines an abstract map from Unicode code points to integer values.
String property Simple_Uppercase_Mapping.
U_CAPI UBool u_isxdigit(UChar32 c)
Determines whether the specified code point is a hexadecimal digit.
U_CAPI UBool u_isgraph(UChar32 c)
Determines whether the specified code point is a "graphic" character (printable, excluding spaces)...
Enumerated property Bidi_Class.
Enumerated property General_Category.
Binary property Prepended_Concatenation_Mark.
U_CAPI UBool u_isJavaIDPart(UChar32 c)
Determines if the specified character is permissible in a Java identifier.
U_CAPI void u_charAge(UChar32 c, UVersionInfo versionArray)
Get the "age" of the code point.
String property Unicode_1_Name.
U_CAPI int32_t u_getIntPropertyMinValue(UProperty which)
Get the minimum value for an enumerated/integer/binary Unicode property.
U_CAPI void u_getUnicodeVersion(UVersionInfo versionArray)
Gets the Unicode version information.
UNumericType
Numeric Type constants.
U_CAPI UChar32 u_charMirror(UChar32 c)
Maps the specified character to a "mirror-image" character.
One more than the highest normal UBidiPairedBracketType value.
Binary property Pattern_White_Space (new in Unicode 4.1).
Enumerated property Vertical_Orientation.
UBool UCharEnumTypeRange(const void *context, UChar32 start, UChar32 limit, UCharCategory type)
Callback from u_enumCharTypes(), is called for each contiguous range of code points c (where start<=c...
Binary property Changes_When_Casefolded.
U_CAPI void u_enumCharTypes(UCharEnumTypeRange *enumRange, const void *context)
Enumerate efficiently all code points with their Unicode general categories.
Binary property NFD_Inert.
Binary property Diacritic.
Binary property Terminal_Punctuation.
U_CAPI UBool u_isMirrored(UChar32 c)
Determines whether the code point has the Bidi_Mirrored property.
U_CAPI const UCPMap * u_getIntPropertyMap(UProperty property, UErrorCode *pErrorCode)
Returns an immutable UCPMap for an enumerated/catalog/int-valued property.
One more than the highest normal UNumericType value.
U_CAPI UBool u_isUWhiteSpace(UChar32 c)
Check if a code point has the White_Space Unicode property.
Enumerated property NFD_Quick_Check.
U_CAPI int32_t u_digit(UChar32 ch, int8_t radix)
Returns the decimal digit value of the code point in the specified radix.
U_CAPI uint8_t u_getCombiningClass(UChar32 c)
Returns the combining class of the code point as specified in UnicodeData.txt.
#define U_CDECL_BEGIN
This is used to begin a declaration of a library private ICU C API.
Binary property STerm (new in Unicode 4.0.1).
Enumerated property Joining_Group.
Binary property ID_Continue.
Binary property Emoji_Presentation.
U_CAPI int32_t u_getPropertyValueEnum(UProperty property, const char *alias)
Return the property value integer for a given value name, as specified in the Unicode database file P...
Binary property blank (a C/POSIX character class).
Binary property Quotation_Mark.
#define U_DEPRECATED
This is used to declare a function as a deprecated public ICU C API.
Binary property Changes_When_NFKC_Casefolded.
U_CAPI UBlockCode ublock_getCode(UChar32 c)
Returns the Unicode allocation block that contains the character.
First constant for binary Unicode properties.
U_CAPI UBool u_isIDStart(UChar32 c)
Determines if the specified character is permissible as the first character in an identifier accordin...
Binary property Noncharacter_Code_Point.
U_CAPI UBool u_ispunct(UChar32 c)
Determines whether the specified code point is a punctuation character.
U_CAPI int32_t u_charName(UChar32 code, UCharNameChoice nameChoice, char *buffer, int32_t bufferLength, UErrorCode *pErrorCode)
Retrieve the name of a Unicode character.
Enumerated property East_Asian_Width.
ULineBreak
Line Break constants.
U_CAPI double u_getNumericValue(UChar32 c)
Get the numeric value for a Unicode code point as defined in the Unicode Character Database...
U_CAPI UBool u_isUUppercase(UChar32 c)
Check if a code point has the Uppercase Unicode property.
One more than the highest UCharDirection value.
U_CAPI UChar32 u_tolower(UChar32 c)
The given character is mapped to its lowercase equivalent according to UnicodeData.txt; if the character has no lowercase equivalent, the character itself is returned.
Binary property Full_Composition_Exclusion.
Bitmask property General_Category_Mask.
String property Simple_Titlecase_Mapping.
One more than the highest normal UGraphemeClusterBreak value.
Unicode 3.2 renames this block to "Combining Diacritical Marks for Symbols".
UDecompositionType
Decomposition Type constants.
One more than the highest normal ULineBreak value.
UHangulSyllableType
Hangul Syllable Type constants.
String property Simple_Lowercase_Mapping.
UIndicPositionalCategory
Indic Positional Category constants.
Binary property print (a C/POSIX character class).
Binary property Case_Sensitive.
Standard or synthetic character name.
Binary property Bidi_Mirrored.
UVerticalOrientation
Vertical Orientation constants.
Binary property NFKC_Inert.
U_CAPI void u_enumCharNames(UChar32 start, UChar32 limit, UEnumCharNamesFn *fn, void *context, UCharNameChoice nameChoice, UErrorCode *pErrorCode)
Enumerate all assigned Unicode characters between the start and limit code points (start inclusive...
Binary property Changes_When_Casemapped.
First constant for string Unicode properties.
Binary property Grapheme_Extend (new in Unicode 3.2).
int32_t UChar32
Define UChar32 as a type for single Unicode code points.
U_CAPI UBool u_isUAlphabetic(UChar32 c)
Check if a code point has the Alphabetic Unicode property.
UGraphemeClusterBreak
Grapheme Cluster Break constants.
New No_Block value in Unicode 4.
Binary property Extender.
Double property Numeric_Value.
Unicode character name (Name property).
U_CAPI const char * u_getPropertyName(UProperty property, UPropertyNameChoice nameChoice)
Return the Unicode name for a given property, as given in the Unicode database file PropertyAliases...
Binary property Grapheme_Base (new in Unicode 3.2).
Binary property NFKD_Inert.
U_CAPI UBool u_isIDIgnorable(UChar32 c)
Determines if the specified character should be regarded as an ignorable character in an identifier...
UCharCategory
Data for enumerated Unicode general category types.
Enumerated property Sentence_Break (new in Unicode 4.1).
Binary property Lowercase.
First constant for bit-mask Unicode properties.
Enumerated property Bidi_Paired_Bracket_Type (new in Unicode 6.3).
Binary property of strings Basic_Emoji.
U_CAPI UChar32 u_toupper(UChar32 c)
The given character is mapped to its uppercase equivalent according to UnicodeData.txt; if the character has no uppercase equivalent, the character itself is returned.
USentenceBreak
Sentence Break constants.
Binary property Extended_Pictographic.
Enumerated property Indic_Syllabic_Category.
Binary property Unified_Ideograph (new in Unicode 3.2).
Enumerated property Canonical_Combining_Class.
UCharNameChoice
Selector constants for u_charName().
One more than the last constant for binary Unicode properties.
Enumerated property Script.
Unicode 3.2 renames this block to "Greek and Coptic".
Binary property Hex_Digit.
String property Uppercase_Mapping.
UPropertyNameChoice
Selector constants for u_getPropertyName() and u_getPropertyValueName().
U_CAPI UBool u_isupper(UChar32 c)
Determines whether the specified code point has the general category "Lu" (uppercase letter)...
String property Lowercase_Mapping.
char16_t UChar
The base type for UTF-16 code units and pointers.
#define U_CDECL_END
This is used to end a declaration of a library private ICU C API.
Enumerated property NFKC_Quick_Check.
U_CAPI UBool u_stringHasBinaryProperty(const UChar *s, int32_t length, UProperty which)
Returns true if the property is true for the string.
UProperty
Selection constants for Unicode properties.
U_CAPI const USet * u_getBinaryPropertySet(UProperty property, UErrorCode *pErrorCode)
Returns a frozen USet for a binary property.
Enumerated property Hangul_Syllable_Type (new in Unicode 4).
Binary property alnum (a C/POSIX character class).
Binary property Variation_Selector (new in Unicode 4.0.1).
Binary property of strings RGI_Emoji_ZWJ_Sequence.
One more than the highest normal UHangulSyllableType value.
UBlockCode
Constants for Unicode blocks, see the Unicode Data file Blocks.txt.
Enumerated property Word_Break (new in Unicode 4.1).
Binary property Deprecated (new in Unicode 3.2).
Binary property Bidi_Control.
Binary property XID_Continue.
Same as UBLOCK_PRIVATE_USE.
UErrorCode
Standard ICU4C error code type, a substitute for exceptions.
Binary property Uppercase.
Binary property Changes_When_Uppercased.
UJoiningGroup
Joining Group constants.
struct USet USet
USet is the C API type corresponding to C++ class UnicodeSet.
One more than the highest normal UEastAsianWidth value.
U_CAPI UCharDirection u_charDirection(UChar32 c)
Returns the bidirectional category value for the code point, which is used in the Unicode bidirection...
One more than the highest normal UDecompositionType value.
UEastAsianWidth
East Asian Width constants.
Enumerated property Trail_Canonical_Combining_Class.
U_CAPI int8_t u_charType(UChar32 c)
Returns the general category value for the code point.
U_CAPI UBool u_hasBinaryProperty(UChar32 c, UProperty which)
Check a binary Unicode property for a code point.
Non-category for unassigned and non-character code points.
First constant for Unicode properties with unusual value types.
U_CAPI int32_t u_charDigitValue(UChar32 c)
Returns the decimal digit value of a decimal digit character.
U_CAPI int32_t u_getIntPropertyMaxValue(UProperty which)
Get the maximum value for an enumerated/integer/binary Unicode property.
UWordBreakValues
Word Break constants.
Binary property of strings RGI_Emoji_Modifier_Sequence.
U_CAPI UBool u_isJavaIDStart(UChar32 c)
Determines if the specified character is permissible as the first character in a Java identifier...
Enumerated property Joining_Type.
One more than the last constant for double Unicode properties.
Binary property Emoji_Modifier.
Basic definitions for ICU, for both C and C++ APIs.
U_CAPI UBool u_isWhitespace(UChar32 c)
Determines if the specified code point is a whitespace character according to Java/ICU.
U_CAPI UBool u_isJavaSpaceChar(UChar32 c)
Determine if the specified code point is a space character according to Java.
String property Bidi_Paired_Bracket (new in Unicode 6.3).
Enumerated property Lead_Canonical_Combining_Class.
Binary property ASCII_Hex_Digit.
UJoiningType
Joining Type constants.
Binary property Soft_Dotted (new in Unicode 3.2).
One more than the last constant for string Unicode properties.
Binary property Emoji_Modifier_Base.
Binary property Segment_Starter.
U_CAPI UChar32 u_forDigit(int32_t digit, int8_t radix)
Determines the character representation for a specific digit in the specified radix.
Binary property ID_Start.
Corrected name from NameAliases.txt.
Binary property Changes_When_Titlecased.
Enumerated property Line_Break.
One more than the highest normal UJoiningType value.
U_CAPI UBool u_isalpha(UChar32 c)
Determines whether the specified code point is a letter character.
U_CAPI const char * u_getPropertyValueName(UProperty property, int32_t value, UPropertyNameChoice nameChoice)
Return the Unicode name for a given property value, as given in the Unicode database file PropertyVal...
Enumerated property Grapheme_Cluster_Break (new in Unicode 4.1).
U_CAPI UBool u_iscntrl(UChar32 c)
Determines whether the specified code point is a control character (as defined by this function)...
Deprecated string property ISO_Comment.
Binary property of strings RGI_Emoji_Flag_Sequence.
U_CAPI UBool u_isIDPart(UChar32 c)
Determines if the specified character is permissible in an identifier according to Java...
U_CAPI UBool u_islower(UChar32 c)
Determines whether the specified code point has the general category "Ll" (lowercase letter)...
Binary property Default_Ignorable_Code_Point (new in Unicode 3.2).
One more than the highest normal UBlockCode value.
The Unicode_1_Name property value, which is of little practical value.
int32_t u_getISOComment(UChar32 c, char *dest, int32_t destCapacity, UErrorCode *pErrorCode)
Returns an empty string.
One higher than the last enum UCharCategory constant.
Binary property of strings RGI_Emoji_Tag_Sequence.
One more than the highest normal UWordBreakValues value.
Binary property Pattern_Syntax (new in Unicode 4.1).
One more than the last constant for Unicode properties with unusual value types.
U_CAPI UBool u_isprint(UChar32 c)
Determines whether the specified code point is a printable character.
UBidiPairedBracketType
Bidi Paired Bracket Type constants.
One more than the highest normal UCharNameChoice value.
UIndicSyllabicCategory
Indic Syllabic Category constants.
U_CAPI UBool u_isdigit(UChar32 c)
Determines whether the specified code point is a digit character according to Java.
int8_t UBool
The ICU boolean type, a signed-byte integer.
U_CAPI UChar32 u_charFromName(UCharNameChoice nameChoice, const char *name, UErrorCode *pErrorCode)
Find a Unicode character by its name and return its code point value.
Enumerated property NFKD_Quick_Check.
U_CAPI UBool u_istitle(UChar32 c)
Determines whether the specified code point is a titlecase letter.