The Uchar module provides low-level access to the Unicode Character Database.

Required Header

#include <utils_i18n.h>

Overview

The Uchar module provides low-level access to the Unicode Character Database.

Sample Code 1

Gets the value of the 'East Asian Width' enumerated property for a character, and the Unicode allocation block that contains the character.

    int ret = I18N_ERROR_NONE;
    i18n_uchar32 code_point = 0;
    int property_value = 0;
    i18n_uchar_u_east_asian_width_e east_asian_width = I18N_UCHAR_U_EA_NEUTRAL;
    i18n_uchar_ublock_code_e block_code = I18N_UCHAR_UBLOCK_NO_BLOCK;

    // How to get the east asian width type for 's'
    code_point = 0x73;    // 's'
    ret = i18n_uchar_get_int_property_value(code_point, I18N_UCHAR_EAST_ASIAN_WIDTH, &property_value);
    if (ret != I18N_ERROR_NONE) {
        dlog_print(DLOG_INFO, LOG_TAG, "Error occured!!\n");
    } else {
        east_asian_width = (i18n_uchar_u_east_asian_width_e)property_value;
        dlog_print(DLOG_INFO, LOG_TAG, "East Asian Width Type for ( %.4x ) is ( %d )\n", code_point, east_asian_width);
        // East Asian Width Type for ( 0073 ) is ( 4 ) which is I18N_UCHAR_U_EA_NARROW
    }

    // How to get the block code for 's'
    ret = i18n_uchar_get_ublock_code(code_point, &block_code);
    if (ret != I18N_ERROR_NONE) {
        dlog_print(DLOG_INFO, LOG_TAG, "Error occured!!\n");
    } else {
        dlog_print(DLOG_INFO, LOG_TAG, "block name for ( %.4x ) is ( %d )\n", code_point, block_code);
        // block code for ( 0073 ) is ( 1 ) which is I18N_UCHAR_UBLOCK_BASIC_LATIN
    }

    // How to get the east asian width type for 'sung' as ideographs
    code_point = 0x661F;    // 'sung' as ideographs
    ret = i18n_uchar_get_int_property_value(code_point, I18N_UCHAR_EAST_ASIAN_WIDTH, &property_value);
    if (ret != I18N_ERROR_NONE) {
        dlog_print(DLOG_INFO, LOG_TAG, "Error occured!!\n");
    } else {
        east_asian_width = (i18n_uchar_u_east_asian_width_e)property_value;
        dlog_print(DLOG_INFO, LOG_TAG, "East Asian Width Type for ( %.4x ) is ( %d )\n", code_point, east_asian_width);
        // East Asian Width Type for ( 661f ) is ( 5 ) which is I18N_UCHAR_U_EA_WIDE
    }

    // How to get the block code for 'sung' as ideographs
    ret = i18n_uchar_get_ublock_code(code_point, &block_code);
    if (ret != I18N_ERROR_NONE) {
        dlog_print(DLOG_INFO, LOG_TAG, "Error occured!!\n");
    } else {
        dlog_print(DLOG_INFO, LOG_TAG, "block name for ( %.4x ) is ( %d )\n", code_point, block_code);
        // block code for ( 661f ) is ( 71 ) which is I18N_UCHAR_UBLOCK_CJK_UNIFIED_IDEOGRAPHS
    }

    // How to get the east asian width type for 'sung' as hangul
    code_point = 0xC131;    // 'sung' as hangul
    ret = i18n_uchar_get_int_property_value(code_point, I18N_UCHAR_EAST_ASIAN_WIDTH, &property_value);
    if (ret != I18N_ERROR_NONE) {
        dlog_print(DLOG_INFO, LOG_TAG, "Error occured!!\n");
    } else {
        east_asian_width = (i18n_uchar_u_east_asian_width_e)property_value;
        dlog_print(DLOG_INFO, LOG_TAG, "East Asian Width Type for ( %.4x ) is ( %d )\n", code_point, east_asian_width);
        // East Asian Width Type for ( c131 ) is ( 5 ) which is I18N_UCHAR_U_EA_WIDE
    }

    // How to get the block code for 'sung' as hangul
    ret = i18n_uchar_get_ublock_code(code_point, &block_code);
    if (ret != I18N_ERROR_NONE) {
        dlog_print(DLOG_INFO, LOG_TAG, "Error occured!!\n");
    } else {
        dlog_print(DLOG_INFO, LOG_TAG, "block name for ( %.4x ) is ( %d )\n", code_point, block_code);
        // block code for ( c131 ) is ( 74 ) which is I18N_UCHAR_UBLOCK_HANGUL_SYLLABLES
    }

Functions
int	i18n_uchar_get_int_property_value (i18n_uchar32 c, i18n_uchar_uproperty_e which, int32_t *property_val)
	Gets the property value for an enumerated property for a code point.
int	i18n_uchar_get_ublock_code (i18n_uchar32 c, i18n_uchar_ublock_code_e *block_val)
	Gets the Unicode allocation block that contains the character.
Typedefs
typedef uint16_t	i18n_uchar
	i18n_uchar.
typedef int32_t	i18n_uchar32
	i18n_uchar32.
typedef int8_t	i18n_ubool
	i18n_ubool.
Defines
#define	I18N_U_MASK(x) ((uint32_t)1<<(x))
#define	I18N_U_GC_CN_MASK I18N_U_MASK(I18N_UCHAR_U_GENERAL_OTHER_TYPES)
#define	I18N_U_GC_LU_MASK I18N_U_MASK(I18N_UCHAR_U_UPPERCASE_LETTER)
#define	I18N_U_GC_LL_MASK I18N_U_MASK(I18N_UCHAR_U_LOWERCASE_LETTER)
#define	I18N_U_GC_LT_MASK I18N_U_MASK(I18N_UCHAR_U_TITLECASE_LETTER)
#define	I18N_U_GC_LM_MASK I18N_U_MASK(I18N_UCHAR_U_MODIFIER_LETTER)
#define	I18N_U_GC_LO_MASK I18N_U_MASK(I18N_UCHAR_U_OTHER_LETTER)
#define	I18N_U_GC_MN_MASK I18N_U_MASK(I18N_UCHAR_U_NON_SPACING_MARK)
#define	I18N_U_GC_ME_MASK I18N_U_MASK(I18N_UCHAR_U_ENCLOSING_MARK)
#define	I18N_U_GC_MC_MASK I18N_U_MASK(I18N_UCHAR_U_COMBINING_SPACING_MARK)
#define	I18N_U_GC_ND_MASK I18N_U_MASK(I18N_UCHAR_U_DECIMAL_DIGIT_NUMBER)
#define	I18N_U_GC_NL_MASK I18N_U_MASK(I18N_UCHAR_U_LETTER_NUMBER)
#define	I18N_U_GC_NO_MASK I18N_U_MASK(I18N_UCHAR_U_OTHER_NUMBER)
#define	I18N_U_GC_ZS_MASK I18N_U_MASK(I18N_UCHAR_U_SPACE_SEPARATOR)
#define	I18N_U_GC_ZL_MASK I18N_U_MASK(I18N_UCHAR_U_LINE_SEPARATOR)
#define	I18N_U_GC_ZP_MASK I18N_U_MASK(I18N_UCHAR_U_PARAGRAPH_SEPARATOR)
#define	I18N_U_GC_CC_MASK I18N_U_MASK(I18N_UCHAR_U_CONTROL_CHAR)
#define	I18N_U_GC_CF_MASK I18N_U_MASK(I18N_UCHAR_U_FORMAT_CHAR)
#define	I18N_U_GC_CO_MASK I18N_U_MASK(I18N_UCHAR_U_PRIVATE_USE_CHAR)
#define	I18N_U_GC_CS_MASK I18N_U_MASK(I18N_UCHAR_U_SURROGATE)
#define	I18N_U_GC_PD_MASK I18N_U_MASK(I18N_UCHAR_U_DASH_PUNCTUATION)
#define	I18N_U_GC_PS_MASK I18N_U_MASK(I18N_UCHAR_U_START_PUNCTUATION)
#define	I18N_U_GC_PE_MASK I18N_U_MASK(I18N_UCHAR_U_END_PUNCTUATION)
#define	I18N_U_GC_PC_MASK I18N_U_MASK(I18N_UCHAR_U_CONNECTOR_PUNCTUATION)
#define	I18N_U_GC_PO_MASK I18N_U_MASK(I18N_UCHAR_U_OTHER_PUNCTUATION)
#define	I18N_U_GC_SM_MASK I18N_U_MASK(I18N_UCHAR_U_MATH_SYMBOL)
#define	I18N_U_GC_SC_MASK I18N_U_MASK(I18N_UCHAR_U_CURRENCY_SYMBOL)
#define	I18N_U_GC_SK_MASK I18N_U_MASK(I18N_UCHAR_U_MODIFIER_SYMBOL)
#define	I18N_U_GC_SO_MASK I18N_U_MASK(I18N_UCHAR_U_OTHER_SYMBOL)
#define	I18N_U_GC_PI_MASK I18N_U_MASK(I18N_UCHAR_U_INITIAL_PUNCTUATION)
#define	I18N_U_GC_PF_MASK I18N_U_MASK(I18N_UCHAR_U_FINAL_PUNCTUATION)
#define	I18N_U_GC_L_MASK (I18N_U_GC_LU_MASK|I18N_U_GC_LL_MASK|I18N_U_GC_LT_MASK|I18N_U_GC_LM_MASK|I18N_U_GC_LO_MASK)
#define	I18N_U_GC_LC_MASK (I18N_U_GC_LU_MASK|I18N_U_GC_LL_MASK|I18N_U_GC_LT_MASK)
#define	I18N_U_GC_M_MASK (I18N_U_GC_MN_MASK|I18N_U_GC_ME_MASK|I18N_U_GC_MC_MASK)
#define	I18N_U_GC_N_MASK (I18N_U_GC_ND_MASK|I18N_U_GC_NL_MASK|I18N_U_GC_NO_MASK)
#define	I18N_U_GC_Z_MASK (I18N_U_GC_ZS_MASK|I18N_U_GC_ZL_MASK|I18N_U_GC_ZP_MASK)
#define	I18N_U_GC_C_MASK (I18N_U_GC_CN_MASK|I18N_U_GC_CC_MASK|I18N_U_GC_CF_MASK|I18N_U_GC_CO_MASK|I18N_U_GC_CS_MASK)
#define	I18N_U_GC_P_MASK (I18N_U_GC_PD_MASK|I18N_U_GC_PS_MASK|I18N_U_GC_PE_MASK|I18N_U_GC_PC_MASK|I18N_U_GC_PO_MASK|I18N_U_GC_PI_MASK|I18N_U_GC_PF_MASK)
#define	I18N_U_GC_S_MASK (I18N_U_GC_SM_MASK|I18N_U_GC_SC_MASK|I18N_U_GC_SK_MASK|I18N_U_GC_SO_MASK)
#define	I18N_U_NO_NUMERIC_VALUE ((double)-123456789.)
#define	I18N_U_GET_GC_MASK(c) I18N_U_MASK(u_charType(c))
#define	I18N_U_FOLD_CASE_DEFAULT 0
	Option value for case folding: use default mappings defined in CaseFolding.txt.
#define	I18N_U_FOLD_CASE_EXCLUDE_SPECIAL_I 1
	Option value for case folding: Use the modified set of mappings provided in CaseFolding.txt to handle dotted I and dotless i appropriately for Turkic languages (tr, az). Before Unicode 3.2, CaseFolding.txt contains mappings marked with 'I' that are to be included for default mappings and excluded for the Turkic-specific mappings. Unicode 3.2 CaseFolding.txt instead contains mappings marked with 'T' that are to be excluded for default mappings and included for the Turkic-specific mappings.
#define	I18N_USEARCH_DONE -1
	DONE is returned by i18n_usearch_previous() and i18n_usearch_next() after all valid matches have been returned, and by i18n_usearch_first() and i18n_usearch_last() if there are no matches at all.

Define Documentation

#define I18N_U_FOLD_CASE_DEFAULT 0

Option value for case folding: use default mappings defined in CaseFolding.txt.

Since :: 2.3.1

#define I18N_U_FOLD_CASE_EXCLUDE_SPECIAL_I 1

Option value for case folding:
Use the modified set of mappings provided in CaseFolding.txt to handle dotted I and dotless i appropriately for Turkic languages (tr, az).
Before Unicode 3.2, CaseFolding.txt contains mappings marked with 'I' that are to be included for default mappings and excluded for the Turkic-specific mappings.
Unicode 3.2 CaseFolding.txt instead contains mappings marked with 'T' that are to be excluded for default mappings and included for the Turkic-specific mappings.

Since :: 2.3.1

#define I18N_U_GC_C_MASK (I18N_U_GC_CN_MASK|I18N_U_GC_CC_MASK|I18N_U_GC_CF_MASK|I18N_U_GC_CO_MASK|I18N_U_GC_CS_MASK)

Mask constant for multiple i18n_uchar_category_e bits (C Others).

Since :: 2.3.1

#define I18N_U_GC_CC_MASK I18N_U_MASK(I18N_UCHAR_U_CONTROL_CHAR)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_CF_MASK I18N_U_MASK(I18N_UCHAR_U_FORMAT_CHAR)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_CN_MASK I18N_U_MASK(I18N_UCHAR_U_GENERAL_OTHER_TYPES)

U_GC_XX_MASK constants are bit flags corresponding to Unicode general category values.

Since :: 2.3.1

#define I18N_U_GC_CO_MASK I18N_U_MASK(I18N_UCHAR_U_PRIVATE_USE_CHAR)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_CS_MASK I18N_U_MASK(I18N_UCHAR_U_SURROGATE)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_L_MASK (I18N_U_GC_LU_MASK|I18N_U_GC_LL_MASK|I18N_U_GC_LT_MASK|I18N_U_GC_LM_MASK|I18N_U_GC_LO_MASK)

Mask constant for multiple i18n_uchar_category_e bits (L Letters).

Since :: 2.3.1

#define I18N_U_GC_LC_MASK (I18N_U_GC_LU_MASK|I18N_U_GC_LL_MASK|I18N_U_GC_LT_MASK)

Mask constant for multiple i18n_uchar_category_e bits (LC Cased Letters).

Since :: 2.3.1

#define I18N_U_GC_LL_MASK I18N_U_MASK(I18N_UCHAR_U_LOWERCASE_LETTER)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_LM_MASK I18N_U_MASK(I18N_UCHAR_U_MODIFIER_LETTER)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_LO_MASK I18N_U_MASK(I18N_UCHAR_U_OTHER_LETTER)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_LT_MASK I18N_U_MASK(I18N_UCHAR_U_TITLECASE_LETTER)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_LU_MASK I18N_U_MASK(I18N_UCHAR_U_UPPERCASE_LETTER)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_M_MASK (I18N_U_GC_MN_MASK|I18N_U_GC_ME_MASK|I18N_U_GC_MC_MASK)

Mask constant for multiple i18n_uchar_category_e bits (M Marks).

Since :: 2.3.1

#define I18N_U_GC_MC_MASK I18N_U_MASK(I18N_UCHAR_U_COMBINING_SPACING_MARK)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_ME_MASK I18N_U_MASK(I18N_UCHAR_U_ENCLOSING_MARK)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_MN_MASK I18N_U_MASK(I18N_UCHAR_U_NON_SPACING_MARK)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_N_MASK (I18N_U_GC_ND_MASK|I18N_U_GC_NL_MASK|I18N_U_GC_NO_MASK)

Mask constant for multiple i18n_uchar_category_e bits (N Numbers).

Since :: 2.3.1

#define I18N_U_GC_ND_MASK I18N_U_MASK(I18N_UCHAR_U_DECIMAL_DIGIT_NUMBER)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_NL_MASK I18N_U_MASK(I18N_UCHAR_U_LETTER_NUMBER)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_NO_MASK I18N_U_MASK(I18N_UCHAR_U_OTHER_NUMBER)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

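#define I18N_U_GC_P_MASK (I18N_U_GC_PD_MASK|I18N_U_GC_PS_MASK|I18N_U_GC_PE_MASK|I18N_U_GC_PC_MASK|I18N_U_GC_PO_MASK|I18N_U_GC_PI_MASK|I18N_U_GC_PF_MASK)

Mask constant for multiple i18n_uchar_category_e bits (P Punctuation).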

Since :: 2.3.1

#define I18N_U_GC_PC_MASK I18N_U_MASK(I18N_UCHAR_U_CONNECTOR_PUNCTUATION)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_PD_MASK I18N_U_MASK(I18N_UCHAR_U_DASH_PUNCTUATION)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_PE_MASK I18N_U_MASK(I18N_UCHAR_U_END_PUNCTUATION)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_PF_MASK I18N_U_MASK(I18N_UCHAR_U_FINAL_PUNCTUATION)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_PI_MASK I18N_U_MASK(I18N_UCHAR_U_INITIAL_PUNCTUATION)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_PO_MASK I18N_U_MASK(I18N_UCHAR_U_OTHER_PUNCTUATION)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_PS_MASK I18N_U_MASK(I18N_UCHAR_U_START_PUNCTUATION)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_S_MASK (I18N_U_GC_SM_MASK|I18N_U_GC_SC_MASK|I18N_U_GC_SK_MASK|I18N_U_GC_SO_MASK)

Mask constant for multiple i18n_uchar_category_e bits (S Symbols).

Since :: 2.3.1

#define I18N_U_GC_SC_MASK I18N_U_MASK(I18N_UCHAR_U_CURRENCY_SYMBOL)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_SK_MASK I18N_U_MASK(I18N_UCHAR_U_MODIFIER_SYMBOL)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_SM_MASK I18N_U_MASK(I18N_UCHAR_U_MATH_SYMBOL)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_SO_MASK I18N_U_MASK(I18N_UCHAR_U_OTHER_SYMBOL)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_Z_MASK (I18N_U_GC_ZS_MASK|I18N_U_GC_ZL_MASK|I18N_U_GC_ZP_MASK)

Mask constant for multiple i18n_uchar_category_e bits (Z Separators).

Since :: 2.3.1

#define I18N_U_GC_ZL_MASK I18N_U_MASK(I18N_UCHAR_U_LINE_SEPARATOR)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_ZP_MASK I18N_U_MASK(I18N_UCHAR_U_PARAGRAPH_SEPARATOR)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GC_ZS_MASK I18N_U_MASK(I18N_UCHAR_U_SPACE_SEPARATOR)

Mask constant for a i18n_uchar_category_e.

Since :: 2.3.1

#define I18N_U_GET_GC_MASK(c) I18N_U_MASK(u_charType(c))

Get a single-bit bit set for the general category of a character.

Since :: 2.3.1

#define I18N_U_MASK(x) ((uint32_t)1<<(x))

Get a single-bit bit set (a flag) from a bit number 0..31.

Since :: 2.3.1

#define I18N_U_NO_NUMERIC_VALUE ((double)-123456789.)

Special value that is returned by i18n_uchar_get_numeric_value() (not implemented yet) when no numeric value is defined for a code point.

Since :: 2.3.1

#define I18N_USEARCH_DONE -1

DONE is returned by i18n_usearch_previous() and i18n_usearch_next() after all valid matches have been returned, and by i18n_usearch_first() and i18n_usearch_last() if there are no matches at all.

Since :: 2.3.1

Typedef Documentation

typedef int8_t i18n_ubool

i18n_ubool.

Since :: 2.3.1

typedef uint16_t i18n_uchar

i18n_uchar.

Since :: 2.3.1

typedef int32_t i18n_uchar32

i18n_uchar32.

Since :: 2.3.1

Enumeration Type Documentation

enum i18n_uchar_category_e

Enumeration for Unicode general category types.

Since :: 2.3.1

Enumerator:

I18N_UCHAR_U_UNASSIGNED	Non-category for unassigned and non-character code points
I18N_UCHAR_U_GENERAL_OTHER_TYPES	Cn "Other, Not Assigned (no characters in [UnicodeData.txt] have this property)" (same as I18N_UCHAR_U_UNASSIGNED!)
I18N_UCHAR_U_UPPERCASE_LETTER	Lu
I18N_UCHAR_U_LOWERCASE_LETTER	Ll
I18N_UCHAR_U_TITLECASE_LETTER	Lt
I18N_UCHAR_U_MODIFIER_LETTER	Lm
I18N_UCHAR_U_OTHER_LETTER	Lo
I18N_UCHAR_U_NON_SPACING_MARK	Mn
I18N_UCHAR_U_ENCLOSING_MARK	Me
I18N_UCHAR_U_COMBINING_SPACING_MARK	Mc
I18N_UCHAR_U_DECIMAL_DIGIT_NUMBER	Nd
I18N_UCHAR_U_LETTER_NUMBER	Nl
I18N_UCHAR_U_OTHER_NUMBER	No
I18N_UCHAR_U_SPACE_SEPARATOR	Zs
I18N_UCHAR_U_LINE_SEPARATOR	Zl
I18N_UCHAR_U_PARAGRAPH_SEPARATOR	Zp
I18N_UCHAR_U_CONTROL_CHAR	Cc
I18N_UCHAR_U_FORMAT_CHAR	Cf
I18N_UCHAR_U_PRIVATE_USE_CHAR	Co
I18N_UCHAR_U_SURROGATE	Cs
I18N_UCHAR_U_DASH_PUNCTUATION	Pd
I18N_UCHAR_U_START_PUNCTUATION	Ps
I18N_UCHAR_U_END_PUNCTUATION	Pe
I18N_UCHAR_U_CONNECTOR_PUNCTUATION	Pc
I18N_UCHAR_U_OTHER_PUNCTUATION	Po
I18N_UCHAR_U_MATH_SYMBOL	Sm
I18N_UCHAR_U_CURRENCY_SYMBOL	Sc
I18N_UCHAR_U_MODIFIER_SYMBOL	Sk
I18N_UCHAR_U_OTHER_SYMBOL	So
I18N_UCHAR_U_INITIAL_PUNCTUATION	Pi
I18N_UCHAR_U_FINAL_PUNCTUATION	Pf
I18N_UCHAR_U_CHAR_CATEGORY_COUNT	One higher than the last enum i18n_uchar_category_e constant

enum i18n_uchar_direction_e

Enumeration for the language directional property of a character set.

Since :: 2.3.1

Enumerator:

I18N_UCHAR_U_LEFT_TO_RIGHT	L
I18N_UCHAR_U_RIGHT_TO_LEFT	R
I18N_UCHAR_U_EUROPEAN_NUMBER	EN
I18N_UCHAR_U_EUROPEAN_NUMBER_SEPARATOR	ES
I18N_UCHAR_U_EUROPEAN_NUMBER_TERMINATOR	ET
I18N_UCHAR_U_ARABIC_NUMBER	AN
I18N_UCHAR_U_COMMON_NUMBER_SEPARATOR	CS
I18N_UCHAR_U_BLOCK_SEPARATOR	B
I18N_UCHAR_U_SEGMENT_SEPARATOR	S
I18N_UCHAR_U_WHITE_SPACE_NEUTRAL	WS
I18N_UCHAR_U_OTHER_NEUTRAL	ON
I18N_UCHAR_U_LEFT_TO_RIGHT_EMBEDDING	LRE
I18N_UCHAR_U_LEFT_TO_RIGHT_OVERRIDE	LRO
I18N_UCHAR_U_RIGHT_TO_LEFT_ARABIC	AL
I18N_UCHAR_U_RIGHT_TO_LEFT_EMBEDDING	RLE
I18N_UCHAR_U_RIGHT_TO_LEFT_OVERRIDE	RLO
I18N_UCHAR_U_POP_DIRECTIONAL_FORMAT	PDF
I18N_UCHAR_U_DIR_NON_SPACING_MARK	NSM
I18N_UCHAR_U_BOUNDARY_NEUTRAL	BN
I18N_UCHAR_U_FIRST_STRONG_ISOLATE	FSI (Since 3.0)
I18N_UCHAR_U_LEFT_TO_RIGHT_ISOLATE	LRI (Since 3.0)
I18N_UCHAR_U_RIGHT_TO_LEFT_ISOLATE	RLI (Since 3.0)
I18N_UCHAR_U_POP_DIRECTIONAL_ISOLATE	PDI (Since 3.0)
I18N_UCHAR_U_CHAR_DIRECTION_COUNT	Count

enum i18n_uchar_u_bidi_paired_bracket_type_e

Bidi Paired Bracket Type constants.

Since :: 3.0

See also:: I18N_UCHAR_BIDI_PAIRED_BRACKET_TYPE

Enumerator:

I18N_UCHAR_U_BPT_NONE	Not a paired bracket.
I18N_UCHAR_U_BPT_OPEN	Open paired bracket.
I18N_UCHAR_U_BPT_CLOSE	Close paired bracket.
I18N_UCHAR_U_BPT_COUNT	Count

enum i18n_uchar_u_decomposition_type_e

Enumeration for Decomposition Type constants.

Since :: 2.3.1

Enumerator:

I18N_UCHAR_U_DT_NONE	[none]
I18N_UCHAR_U_DT_CANONICAL	[can]
I18N_UCHAR_U_DT_COMPAT	[com]
I18N_UCHAR_U_DT_CIRCLE	[enc]
I18N_UCHAR_U_DT_FINAL	[fin]
I18N_UCHAR_U_DT_FONT	[font]
I18N_UCHAR_U_DT_FRACTION	[fra]
I18N_UCHAR_U_DT_INITIAL	[init]
I18N_UCHAR_U_DT_ISOLATED	[iso]
I18N_UCHAR_U_DT_MEDIAL	[med]
I18N_UCHAR_U_DT_NARROW	[nar]
I18N_UCHAR_U_DT_NOBREAK	[nb]
I18N_UCHAR_U_DT_SMALL	[sml]
I18N_UCHAR_U_DT_SQUARE	[sqr]
I18N_UCHAR_U_DT_SUB	[sub]
I18N_UCHAR_U_DT_SUPER	[sup]
I18N_UCHAR_U_DT_VERTICAL	[vert]
I18N_UCHAR_U_DT_WIDE	[wide]
I18N_UCHAR_U_DT_COUNT	18

enum i18n_uchar_u_east_asian_width_e

Enumeration for East Asian Width constants.

Since :: 2.3.1

Enumerator:

I18N_UCHAR_U_EA_NEUTRAL	[N]
I18N_UCHAR_U_EA_AMBIGUOUS	[A]
I18N_UCHAR_U_EA_HALFWIDTH	[H]
I18N_UCHAR_U_EA_FULLWIDTH	[F]
I18N_UCHAR_U_EA_NARROW	[Na]
I18N_UCHAR_U_EA_WIDE	[W]

enum i18n_uchar_u_grapheme_cluster_break_e

Enumeration for Grapheme Cluster Break constants.

Since :: 2.3.1

Enumerator:

I18N_UCHAR_U_GCB_OTHER	[XX]
I18N_UCHAR_U_GCB_CONTROL	[CN]
I18N_UCHAR_U_GCB_CR	[CR]
I18N_UCHAR_U_GCB_EXTEND	[EX]
I18N_UCHAR_U_GCB_L	[L]
I18N_UCHAR_U_GCB_LF	[LF]
I18N_UCHAR_U_GCB_LV	[LV]
I18N_UCHAR_U_GCB_LVT	[LVT]
I18N_UCHAR_U_GCB_T	[T]
I18N_UCHAR_U_GCB_V	[V]
I18N_UCHAR_U_GCB_SPACING_MARK	[SM]
I18N_UCHAR_U_GCB_PREPEND	[PP]
I18N_UCHAR_UCHAR_U_GCB_COUNT

enum i18n_uchar_u_hangul_syllable_type_e

Enumeration for Hangul Syllable Type constants.

Since :: 2.3.1

Enumerator:

I18N_UCHAR_U_HST_NOT_APPLICABLE	[NA]
I18N_UCHAR_U_HST_LEADING_JAMO	[L]
I18N_UCHAR_U_HST_VOWEL_JAMO	[V]
I18N_UCHAR_U_HST_TRAILING_JAMO	[T]
I18N_UCHAR_U_HST_LV_SYLLABLE	[LV]
I18N_UCHAR_U_HST_LVT_SYLLABLE	[LVT]
I18N_UCHAR_U_HST_COUNT

enum i18n_uchar_u_joining_group_e

Enumeration for Joining Group constants.

Since :: 2.3.1

Enumerator:

I18N_UCHAR_U_JG_NO_JOINING_GROUP	No Joining Group
I18N_UCHAR_U_JG_AIN	Ain
I18N_UCHAR_U_JG_ALAPH	Alaph
I18N_UCHAR_U_JG_ALEF	Alef
I18N_UCHAR_U_JG_BEH	Beh
I18N_UCHAR_U_JG_BETH	Beth
I18N_UCHAR_U_JG_DAL	Dal
I18N_UCHAR_U_JG_DALATH_RISH	Dalath Rish
I18N_UCHAR_U_JG_E	E
I18N_UCHAR_U_JG_FEH	Feh
I18N_UCHAR_U_JG_FINAL_SEMKATH	Final Semkath
I18N_UCHAR_U_JG_GAF	Gaf
I18N_UCHAR_U_JG_GAMAL	Gamal
I18N_UCHAR_U_JG_HAH	Hah
I18N_UCHAR_U_JG_TEH_MARBUTA_GOAL	Teh Marbuta Goal
I18N_UCHAR_U_JG_HAMZA_ON_HEH_GOAL	Hamza On Heh Goal
I18N_UCHAR_U_JG_HE	He
I18N_UCHAR_U_JG_HEH	Heh
I18N_UCHAR_U_JG_HEH_GOAL	Heh Goal
I18N_UCHAR_U_JG_HETH	Heth
I18N_UCHAR_U_JG_KAF	Kaf
I18N_UCHAR_U_JG_KAPH	Kaph
I18N_UCHAR_U_JG_KNOTTED_HEH	Knotted Heh
I18N_UCHAR_U_JG_LAM	Lam
I18N_UCHAR_U_JG_LAMADH	Lamadh
I18N_UCHAR_U_JG_MEEM	Meem
I18N_UCHAR_U_JG_MIM	Mim
I18N_UCHAR_U_JG_NOON	Noon
I18N_UCHAR_U_JG_NUN	Nun
I18N_UCHAR_U_JG_PE	Pe
I18N_UCHAR_U_JG_QAF	Qaf
I18N_UCHAR_U_JG_QAPH	Qaph
I18N_UCHAR_U_JG_REH	Reh
I18N_UCHAR_U_JG_REVERSED_PE	Reversed Pe
I18N_UCHAR_U_JG_SAD	Sad
I18N_UCHAR_U_JG_SADHE	Sadhe
I18N_UCHAR_U_JG_SEEN	Seen
I18N_UCHAR_U_JG_SEMKATH	Semkath
I18N_UCHAR_U_JG_SHIN	Shin
I18N_UCHAR_U_JG_SWASH_KAF	Swash Kaf
I18N_UCHAR_U_JG_SYRIAC_WAW	Syriac Waw
I18N_UCHAR_U_JG_TAH	Tah
I18N_UCHAR_U_JG_TAW	Taw
I18N_UCHAR_U_JG_TEH_MARBUTA	Teh Marbuta
I18N_UCHAR_U_JG_TETH	Teth
I18N_UCHAR_U_JG_WAW	Waw
I18N_UCHAR_U_JG_YEH	Yeh
I18N_UCHAR_U_JG_YEH_BARREE	Yeh Barree
I18N_UCHAR_U_JG_YEH_WITH_TAIL	Yeh With Tail
I18N_UCHAR_U_JG_YUDH	Yudh
I18N_UCHAR_U_JG_YUDH_HE	Yudh He
I18N_UCHAR_U_JG_ZAIN	Zain
I18N_UCHAR_U_JG_FE	Fe
I18N_UCHAR_U_JG_KHAPH	Khaph
I18N_UCHAR_U_JG_ZHAIN	Zhain
I18N_UCHAR_U_JG_BURUSHASKI_YEH_BARREE	Burushaski Yeh Barree
I18N_UCHAR_U_JG_FARSI_YEH	Farsi Yeh
I18N_UCHAR_U_JG_NYA	Nya
I18N_UCHAR_U_JG_ROHINGYA_YEH	Rohingya Yeh
I18N_UCHAR_U_JG_MANICHAEAN_ALEPH	Manichaean Aleph (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_AYIN	Manichaean Ayin (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_BETH	Manichaean Beth (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_DALETH	Manichaean Daleth (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_DHAMEDH	Manichaean Dhamedh (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_FIVE	Manichaean Five (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_GIMEL	Manichaean Gimel (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_HETH	Manichaean Heth (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_HUNDRED	Manichaean Hundred (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_KAPH	Manichaean Kaph (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_LAMEDH	Manichaean Lamedh (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_MEM	Manichaean Mem (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_NUN	Manichaean Nun (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_ONE	Manichaean One (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_PE	Manichaean Pe (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_QOPH	Manichaean Qoph (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_RESH	Manichaean Resh (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_SADHE	Manichaean Sadhe (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_SAMEKH	Manichaean Samekh (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_TAW	Manichaean Taw (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_TEN	Manichaean Ten (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_TETH	Manichaean Teth (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_THAMEDH	Manichaean Thamedh (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_TWENTY	Manichaean Twenty (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_WAW	Manichaean Waw (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_YODH	Manichaean Yodh (Since 3.0)
I18N_UCHAR_U_JG_MANICHAEAN_ZAYIN	Manichaean Zayin (Since 3.0)
I18N_UCHAR_U_JG_STRAIGHT_WAW	Straight Waw (Since 3.0)
I18N_UCHAR_U_JG_COUNT	Count

enum i18n_uchar_u_joining_type_e

Enumeration for Joining Type constants.

Since :: 2.3.1

Enumerator:

I18N_UCHAR_U_JT_NON_JOINING	[U]
I18N_UCHAR_U_JT_JOIN_CAUSING	[C]
I18N_UCHAR_U_JT_DUAL_JOINING	[D]
I18N_UCHAR_U_JT_LEFT_JOINING	[L]
I18N_UCHAR_U_JT_RIGHT_JOINING	[R]
I18N_UCHAR_U_JT_TRANSPARENT	[T]
I18N_UCHAR_U_JT_COUNT	6

enum i18n_uchar_u_line_break_e

Enumeration for Line Break constants.

Since :: 2.3.1

Enumerator:

I18N_UCHAR_U_LB_UNKNOWN	[XX]
I18N_UCHAR_U_LB_AMBIGUOUS	[AI]
I18N_UCHAR_U_LB_ALPHABETIC	[AL]
I18N_UCHAR_U_LB_BREAK_BOTH	[B2]
I18N_UCHAR_U_LB_BREAK_AFTER	[BA]
I18N_UCHAR_U_LB_BREAK_BEFORE	[BB]
I18N_UCHAR_U_LB_MANDATORY_BREAK	[BK]
I18N_UCHAR_U_LB_CONTINGENT_BREAK	[CB]
I18N_UCHAR_U_LB_CLOSE_PUNCTUATION	[CL]
I18N_UCHAR_U_LB_COMBINING_MARK	[CM]
I18N_UCHAR_U_LB_CARRIAGE_RETURN	[CR]
I18N_UCHAR_U_LB_EXCLAMATION	[EX]
I18N_UCHAR_U_LB_GLUE	[GL]
I18N_UCHAR_U_LB_HYPHEN	[HY]
I18N_UCHAR_U_LB_IDEOGRAPHIC	[ID]
I18N_UCHAR_U_LB_INSEPARABLE	[IN]
I18N_UCHAR_U_LB_INFIX_NUMERIC	[IS]
I18N_UCHAR_U_LB_LINE_FEED	[LF]
I18N_UCHAR_U_LB_NONSTARTER	[NS]
I18N_UCHAR_U_LB_NUMERIC	[NU]
I18N_UCHAR_U_LB_OPEN_PUNCTUATION	[OP]
I18N_UCHAR_U_LB_POSTFIX_NUMERIC	[PO]
I18N_UCHAR_U_LB_PREFIX_NUMERIC	[PR]
I18N_UCHAR_U_LB_QUOTATION	[QU]
I18N_UCHAR_U_LB_COMPLEX_CONTEXT	[SA]
I18N_UCHAR_U_LB_SURROGATE	[SG]
I18N_UCHAR_U_LB_SPACE	[SP]
I18N_UCHAR_U_LB_BREAK_SYMBOLS	[SY]
I18N_UCHAR_U_LB_ZWSPACE	[ZW]
I18N_UCHAR_U_LB_NEXT_LINE	[NL]
I18N_UCHAR_U_LB_WORD_JOINER	[WJ]
I18N_UCHAR_U_LB_H2	[H2]
I18N_UCHAR_U_LB_H3	[H3]
I18N_UCHAR_U_LB_JL	[JL]
I18N_UCHAR_U_LB_JT	[JT]
I18N_UCHAR_U_LB_JV	[JV]
I18N_UCHAR_U_LB_CLOSE_PARENTHESIS	[CP]

enum i18n_uchar_u_numeric_type_e

Enumeration for Numeric Type constants.

Since :: 2.3.1

Enumerator:

I18N_UCHAR_U_NT_NONE	[None]
I18N_UCHAR_U_NT_DECIMAL	[de]
I18N_UCHAR_U_NT_DIGIT	[di]
I18N_UCHAR_U_NT_NUMERIC	[nu]
I18N_UCHAR_U_NT_COUNT

enum i18n_uchar_u_sentence_break_e

Enumeration for Sentence Break constants.

Since :: 2.3.1

Enumerator:

I18N_UCHAR_U_SB_OTHER	[XX]
I18N_UCHAR_U_SB_ATERM	[AT]
I18N_UCHAR_U_SB_CLOSE	[CL]
I18N_UCHAR_U_SB_FORMAT	[FO]
I18N_UCHAR_U_SB_LOWER	[LO]
I18N_UCHAR_U_SB_NUMERIC	[NU]
I18N_UCHAR_U_SB_OLETTER	[LE]
I18N_UCHAR_U_SB_SEP	[SE]
I18N_UCHAR_U_SB_SP	[SP]
I18N_UCHAR_U_SB_STERM	[ST]
I18N_UCHAR_U_SB_UPPER	[UP]
I18N_UCHAR_U_SB_CR	[CR]
I18N_UCHAR_U_SB_EXTEND	[EX]
I18N_UCHAR_U_SB_LF	[LF]
I18N_UCHAR_U_SB_SCONTINUE	[SC]
I18N_UCHAR_U_SB_COUNT

enum i18n_uchar_u_word_break_values_e

Enumeration for Word Break constants.

Since :: 2.3.1

Enumerator:

I18N_UCHAR_U_WB_OTHER	[XX]
I18N_UCHAR_U_WB_ALETTER	[LE]
I18N_UCHAR_U_WB_FORMAT	[FO]
I18N_UCHAR_U_WB_KATAKANA	[KA]
I18N_UCHAR_U_WB_MIDLETTER	[ML]
I18N_UCHAR_U_WB_MIDNUM	[MN]
I18N_UCHAR_U_WB_NUMERIC	[NU]
I18N_UCHAR_U_WB_EXTENDNUMLET	[EX]
I18N_UCHAR_U_WB_CR	[CR]
I18N_UCHAR_U_WB_EXTEND	[Extend]
I18N_UCHAR_U_WB_LF	[LF]
I18N_UCHAR_U_WB_MIDNUMLET	[MB]
I18N_UCHAR_U_WB_NEWLINE	[NL]
I18N_UCHAR_U_WB_REGIONAL_INDICATOR	[RI] (Since 3.0)
I18N_UCHAR_U_WB_HEBREW_LETTER	[HL] (Since 3.0)
I18N_UCHAR_U_WB_SINGLE_QUOTE	[SQ] (Since 3.0)
I18N_UCHAR_U_WB_DOUBLE_QUOTE	[DQ] (Since 3.0)
I18N_UCHAR_U_WB_COUNT

enum i18n_uchar_ublock_code_e

Constants for Unicode blocks, see the Unicode Data file Blocks.txt.

Since :: 2.3.1

Enumerator:

I18N_UCHAR_UBLOCK_NO_BLOCK	No Block
I18N_UCHAR_UBLOCK_BASIC_LATIN	Basic Latin
I18N_UCHAR_UBLOCK_LATIN_1_SUPPLEMENT	Latin-1 Supplement
I18N_UCHAR_UBLOCK_LATIN_EXTENDED_A	Latin Extended A
I18N_UCHAR_UBLOCK_LATIN_EXTENDED_B	Latin Extended B
I18N_UCHAR_UBLOCK_IPA_EXTENSIONS	IPA Extensions
I18N_UCHAR_UBLOCK_SPACING_MODIFIER_LETTERS	Spacing Modifier Letters
I18N_UCHAR_UBLOCK_COMBINING_DIACRITICAL_MARKS	Combining Diacritical Marks
I18N_UCHAR_UBLOCK_GREEK	Greek
I18N_UCHAR_UBLOCK_CYRILLIC	Cyrillic
I18N_UCHAR_UBLOCK_ARMENIAN	Armenian
I18N_UCHAR_UBLOCK_HEBREW	Hebrew
I18N_UCHAR_UBLOCK_ARABIC	Arabic
I18N_UCHAR_UBLOCK_SYRIAC	Syriac
I18N_UCHAR_UBLOCK_THAANA	Thaana
I18N_UCHAR_UBLOCK_DEVANAGARI	Devanagari
I18N_UCHAR_UBLOCK_BENGALI	Bengali
I18N_UCHAR_UBLOCK_GURMUKHI	Gurmukhi
I18N_UCHAR_UBLOCK_GUJARATI	Gujarati
I18N_UCHAR_UBLOCK_ORIYA	Oriya
I18N_UCHAR_UBLOCK_TAMIL	Tamil
I18N_UCHAR_UBLOCK_TELUGU	Telugu
I18N_UCHAR_UBLOCK_KANNADA	Kannada
I18N_UCHAR_UBLOCK_MALAYALAM	Malayalam
I18N_UCHAR_UBLOCK_SINHALA	Sinhala
I18N_UCHAR_UBLOCK_THAI	Thai
I18N_UCHAR_UBLOCK_LAO	Lao
I18N_UCHAR_UBLOCK_TIBETAN	Tibetan
I18N_UCHAR_UBLOCK_MYANMAR	Myanmar
I18N_UCHAR_UBLOCK_GEORGIAN	Georgian
I18N_UCHAR_UBLOCK_HANGUL_JAMO	Hangul Jamo
I18N_UCHAR_UBLOCK_ETHIOPIC	Ethiopic
I18N_UCHAR_UBLOCK_CHEROKEE	Cherokee
I18N_UCHAR_UBLOCK_UNIFIED_CANADIAN_ABORIGINAL_SYLLABICS	Unified Canadian Aboriginal Syllabics
I18N_UCHAR_UBLOCK_OGHAM	Ogham
I18N_UCHAR_UBLOCK_RUNIC	Runic
I18N_UCHAR_UBLOCK_KHMER	Khmer
I18N_UCHAR_UBLOCK_MONGOLIAN	Mongolian
I18N_UCHAR_UBLOCK_LATIN_EXTENDED_ADDITIONAL	Latin Extended Additional
I18N_UCHAR_UBLOCK_GREEK_EXTENDED	Greek Extended
I18N_UCHAR_UBLOCK_GENERAL_PUNCTUATION	General Punctuation
I18N_UCHAR_UBLOCK_SUPERSCRIPTS_AND_SUBSCRIPTS	Superscripts And Subscripts
I18N_UCHAR_UBLOCK_CURRENCY_SYMBOLS	Currency Symbols
I18N_UCHAR_UBLOCK_COMBINING_MARKS_FOR_SYMBOLS	Combining Marks For Symbols
I18N_UCHAR_UBLOCK_LETTERLIKE_SYMBOLS	Letterlike Symbols
I18N_UCHAR_UBLOCK_NUMBER_FORMS	Number Forms
I18N_UCHAR_UBLOCK_ARROWS	Arrows
I18N_UCHAR_UBLOCK_MATHEMATICAL_OPERATORS	Mathematical Operators
I18N_UCHAR_UBLOCK_MISCELLANEOUS_TECHNICAL	Miscellaneous Technical
I18N_UCHAR_UBLOCK_CONTROL_PICTURES	Control Pictures
I18N_UCHAR_UBLOCK_OPTICAL_CHARACTER_RECOGNITION	Optical Character Recognition
I18N_UCHAR_UBLOCK_ENCLOSED_ALPHANUMERICS	Enclosed Alphanumerics
I18N_UCHAR_UBLOCK_BOX_DRAWING	Box Drawing
I18N_UCHAR_UBLOCK_BLOCK_ELEMENTS	Block Elements
I18N_UCHAR_UBLOCK_GEOMETRIC_SHAPES	Geometric Shapes
I18N_UCHAR_UBLOCK_MISCELLANEOUS_SYMBOLS	Miscellaneous Symbols
I18N_UCHAR_UBLOCK_DINGBATS	Dingbats
I18N_UCHAR_UBLOCK_BRAILLE_PATTERNS	Braille Patterns
I18N_UCHAR_UBLOCK_CJK_RADICALS_SUPPLEMENT	CJK Radicals Supplement
I18N_UCHAR_UBLOCK_KANGXI_RADICALS	Kangxi Radicals
I18N_UCHAR_UBLOCK_IDEOGRAPHIC_DESCRIPTION_CHARACTERS	Ideographic Description Characters
I18N_UCHAR_UBLOCK_CJK_SYMBOLS_AND_PUNCTUATION	CJK Symbols And Punctuation
I18N_UCHAR_UBLOCK_HIRAGANA	Hiragana
I18N_UCHAR_UBLOCK_KATAKANA	Katakana
I18N_UCHAR_UBLOCK_BOPOMOFO	Bopomofo
I18N_UCHAR_UBLOCK_HANGUL_COMPATIBILITY_JAMO	Hangul Compatibility Jamo
I18N_UCHAR_UBLOCK_KANBUN	Kanbun
I18N_UCHAR_UBLOCK_BOPOMOFO_EXTENDED	Bopomofo Extended
I18N_UCHAR_UBLOCK_ENCLOSED_CJK_LETTERS_AND_MONTHS	Enclosed CJK Letters And Months
I18N_UCHAR_UBLOCK_CJK_COMPATIBILITY	CJK Compatibility
I18N_UCHAR_UBLOCK_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_A	CJK Unified Ideographs Extension A
I18N_UCHAR_UBLOCK_CJK_UNIFIED_IDEOGRAPHS	CJK Unified Ideographs
I18N_UCHAR_UBLOCK_YI_SYLLABLES	Yi Syllables
I18N_UCHAR_UBLOCK_YI_RADICALS	Yi Radicals
I18N_UCHAR_UBLOCK_HANGUL_SYLLABLES	Hangul Syllables
I18N_UCHAR_UBLOCK_HIGH_SURROGATES	High Surrogates
I18N_UCHAR_UBLOCK_HIGH_PRIVATE_USE_SURROGATES	High Private Use Surrogates
I18N_UCHAR_UBLOCK_LOW_SURROGATES	Low Surrogates
I18N_UCHAR_UBLOCK_PRIVATE_USE_AREA	Private Use Area
I18N_UCHAR_UBLOCK_PRIVATE_USE	Private Use
I18N_UCHAR_UBLOCK_CJK_COMPATIBILITY_IDEOGRAPHS	CJK Compatibility Ideographs
I18N_UCHAR_UBLOCK_ALPHABETIC_PRESENTATION_FORMS	Alphabetic Presentation Forms
I18N_UCHAR_UBLOCK_ARABIC_PRESENTATION_FORMS_A	Arabic Presentation Forms A
I18N_UCHAR_UBLOCK_COMBINING_HALF_MARKS	Combining Half Marks
I18N_UCHAR_UBLOCK_CJK_COMPATIBILITY_FORMS	CJK Compatibility Forms
I18N_UCHAR_UBLOCK_SMALL_FORM_VARIANTS	Small Form Variants
I18N_UCHAR_UBLOCK_ARABIC_PRESENTATION_FORMS_B	Arabic Presentation Forms B
I18N_UCHAR_UBLOCK_SPECIALS	Specials
I18N_UCHAR_UBLOCK_HALFWIDTH_AND_FULLWIDTH_FORMS	Halfwidth And Fullwidth Forms
I18N_UCHAR_UBLOCK_OLD_ITALIC	Old Italic
I18N_UCHAR_UBLOCK_GOTHIC	Gothic
I18N_UCHAR_UBLOCK_DESERET	Deseret
I18N_UCHAR_UBLOCK_BYZANTINE_MUSICAL_SYMBOLS	Byzantine Musical Symbols
I18N_UCHAR_UBLOCK_MUSICAL_SYMBOLS	Musical Symbols
I18N_UCHAR_UBLOCK_MATHEMATICAL_ALPHANUMERIC_SYMBOLS	Mathematical Alphanumeric Symbols
I18N_UCHAR_UBLOCK_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_B	CJK Unified Ideographs Extension B
I18N_UCHAR_UBLOCK_CJK_COMPATIBILITY_IDEOGRAPHS_SUPPLEMENT	CJK Compatibility Ideographs Supplement
I18N_UCHAR_UBLOCK_TAGS	Tags
I18N_UCHAR_UBLOCK_CYRILLIC_SUPPLEMENT	Cyrillic Supplement
I18N_UCHAR_UBLOCK_CYRILLIC_SUPPLEMENTARY	Cyrillic Supplementary
I18N_UCHAR_UBLOCK_TAGALOG	Tagalog
I18N_UCHAR_UBLOCK_HANUNOO	Hanunoo
I18N_UCHAR_UBLOCK_BUHID	Buhid
I18N_UCHAR_UBLOCK_TAGBANWA	Tagbanwa
I18N_UCHAR_UBLOCK_MISCELLANEOUS_MATHEMATICAL_SYMBOLS_A	Miscellaneous Mathematical Symbols A
I18N_UCHAR_UBLOCK_SUPPLEMENTAL_ARROWS_A	Supplemental Arrows A
I18N_UCHAR_UBLOCK_SUPPLEMENTAL_ARROWS_B	Supplemental Arrows B
I18N_UCHAR_UBLOCK_MISCELLANEOUS_MATHEMATICAL_SYMBOLS_B	Miscellaneous Mathematical Symbols B
I18N_UCHAR_UBLOCK_SUPPLEMENTAL_MATHEMATICAL_OPERATORS	Supplemental Mathematical Operators
I18N_UCHAR_UBLOCK_KATAKANA_PHONETIC_EXTENSIONS	Katakana Phonetic Extensions
I18N_UCHAR_UBLOCK_VARIATION_SELECTORS	Variation Selectors
I18N_UCHAR_UBLOCK_SUPPLEMENTARY_PRIVATE_USE_AREA_A	Supplementary Private Use Area A
I18N_UCHAR_UBLOCK_SUPPLEMENTARY_PRIVATE_USE_AREA_B	Supplementary Private Use Area B
I18N_UCHAR_UBLOCK_LIMBU	Limbu
I18N_UCHAR_UBLOCK_TAI_LE	Tai Le
I18N_UCHAR_UBLOCK_KHMER_SYMBOLS	Khmer Symbols
I18N_UCHAR_UBLOCK_PHONETIC_EXTENSIONS	Phonetic Extensions
I18N_UCHAR_UBLOCK_MISCELLANEOUS_SYMBOLS_AND_ARROWS	Miscellaneous Symbols And Arrows
I18N_UCHAR_UBLOCK_YIJING_HEXAGRAM_SYMBOLS	Yijing Hexagram Symbols
I18N_UCHAR_UBLOCK_LINEAR_B_SYLLABARY	Linear B Syllabary
I18N_UCHAR_UBLOCK_LINEAR_B_IDEOGRAMS	Linear B Ideograms
I18N_UCHAR_UBLOCK_AEGEAN_NUMBERS	Aegean Numbers
I18N_UCHAR_UBLOCK_UGARITIC	Ugaritic
I18N_UCHAR_UBLOCK_SHAVIAN	Shavian
I18N_UCHAR_UBLOCK_OSMANYA	Osmanya
I18N_UCHAR_UBLOCK_CYPRIOT_SYLLABARY	Cypriot Syllabary
I18N_UCHAR_UBLOCK_TAI_XUAN_JING_SYMBOLS	Tai Xuan Jing Symbols
I18N_UCHAR_UBLOCK_VARIATION_SELECTORS_SUPPLEMENT	Variation Selectors Supplement
I18N_UCHAR_UBLOCK_ANCIENT_GREEK_MUSICAL_NOTATION	Ancient Greek Musical Notation
I18N_UCHAR_UBLOCK_ANCIENT_GREEK_NUMBERS	Ancient Greek Numbers
I18N_UCHAR_UBLOCK_ARABIC_SUPPLEMENT	Arabic Supplement
I18N_UCHAR_UBLOCK_BUGINESE	Buginese
I18N_UCHAR_UBLOCK_CJK_STROKES	CJK Strokes
I18N_UCHAR_UBLOCK_COMBINING_DIACRITICAL_MARKS_SUPPLEMENT	Combining Diacritical Marks Supplement
I18N_UCHAR_UBLOCK_COPTIC	Coptic
I18N_UCHAR_UBLOCK_ETHIOPIC_EXTENDED	Ethiopic Extended
I18N_UCHAR_UBLOCK_ETHIOPIC_SUPPLEMENT	Ethiopic Supplement
I18N_UCHAR_UBLOCK_GEORGIAN_SUPPLEMENT	Georgian Supplement
I18N_UCHAR_UBLOCK_GLAGOLITIC	Glagolitic
I18N_UCHAR_UBLOCK_KHAROSHTHI	Kharoshthi
I18N_UCHAR_UBLOCK_MODIFIER_TONE_LETTERS	Modifier Tone Letters
I18N_UCHAR_UBLOCK_NEW_TAI_LUE	New Tai Lue
I18N_UCHAR_UBLOCK_OLD_PERSIAN	Old Persian
I18N_UCHAR_UBLOCK_PHONETIC_EXTENSIONS_SUPPLEMENT	Phonetic Extensions Supplement
I18N_UCHAR_UBLOCK_SUPPLEMENTAL_PUNCTUATION	Supplemental Punctuation
I18N_UCHAR_UBLOCK_SYLOTI_NAGRI	Syloti Nagri
I18N_UCHAR_UBLOCK_TIFINAGH	Tifinagh
I18N_UCHAR_UBLOCK_VERTICAL_FORMS	Vertical Forms
I18N_UCHAR_UBLOCK_NKO	Nko
I18N_UCHAR_UBLOCK_BALINESE	Balinese
I18N_UCHAR_UBLOCK_LATIN_EXTENDED_C	Latin Extended C
I18N_UCHAR_UBLOCK_LATIN_EXTENDED_D	Latin Extended D
I18N_UCHAR_UBLOCK_PHAGS_PA	Phags Pa
I18N_UCHAR_UBLOCK_PHOENICIAN	Phoenician
I18N_UCHAR_UBLOCK_CUNEIFORM	Cuneiform
I18N_UCHAR_UBLOCK_CUNEIFORM_NUMBERS_AND_PUNCTUATION	Cuneiform Numbers And Punctuation
I18N_UCHAR_UBLOCK_COUNTING_ROD_NUMERALS	Counting Rod Numerals
I18N_UCHAR_UBLOCK_SUNDANESE	Sundanese
I18N_UCHAR_UBLOCK_LEPCHA	Lepcha
I18N_UCHAR_UBLOCK_OL_CHIKI	Ol Chiki
I18N_UCHAR_UBLOCK_CYRILLIC_EXTENDED_A	Cyrillic Extended A
I18N_UCHAR_UBLOCK_VAI	Vai
I18N_UCHAR_UBLOCK_CYRILLIC_EXTENDED_B	Cyrillic Extended B
I18N_UCHAR_UBLOCK_SAURASHTRA	Saurashtra
I18N_UCHAR_UBLOCK_KAYAH_LI	Kayah Li
I18N_UCHAR_UBLOCK_REJANG	Rejang
I18N_UCHAR_UBLOCK_CHAM	Cham
I18N_UCHAR_UBLOCK_ANCIENT_SYMBOLS	Ancient Symbols
I18N_UCHAR_UBLOCK_PHAISTOS_DISC	Phaistos Disc
I18N_UCHAR_UBLOCK_LYCIAN	Lycian
I18N_UCHAR_UBLOCK_CARIAN	Carian
I18N_UCHAR_UBLOCK_LYDIAN	Lydian
I18N_UCHAR_UBLOCK_MAHJONG_TILES	Mahjong Tiles
I18N_UCHAR_UBLOCK_DOMINO_TILES	Domino Tiles
I18N_UCHAR_UBLOCK_SAMARITAN	Samaritan
I18N_UCHAR_UBLOCK_UNIFIED_CANADIAN_ABORIGINAL_SYLLABICS_EXTENDED	Unified Canadian Aboriginal Syllabics Extended
I18N_UCHAR_UBLOCK_TAI_THAM	Tai Tham
I18N_UCHAR_UBLOCK_VEDIC_EXTENSIONS	Vedic Extensions
I18N_UCHAR_UBLOCK_LISU	Lisu
I18N_UCHAR_UBLOCK_BAMUM	Bamum
I18N_UCHAR_UBLOCK_COMMON_INDIC_NUMBER_FORMS	Common Indic Number Forms
I18N_UCHAR_UBLOCK_DEVANAGARI_EXTENDED	Devanagari Extended
I18N_UCHAR_UBLOCK_HANGUL_JAMO_EXTENDED_A	Hangul Jamo Extended A
I18N_UCHAR_UBLOCK_JAVANESE	Javanese
I18N_UCHAR_UBLOCK_MYANMAR_EXTENDED_A	Myanmar Extended A
I18N_UCHAR_UBLOCK_TAI_VIET	Tai Viet
I18N_UCHAR_UBLOCK_MEETEI_MAYEK	Meetei Mayek
I18N_UCHAR_UBLOCK_HANGUL_JAMO_EXTENDED_B	Hangul Jamo Extended B
I18N_UCHAR_UBLOCK_IMPERIAL_ARAMAIC	Imperial Aramaic
I18N_UCHAR_UBLOCK_OLD_SOUTH_ARABIAN	Old South Arabian
I18N_UCHAR_UBLOCK_AVESTAN	Avestan
I18N_UCHAR_UBLOCK_INSCRIPTIONAL_PARTHIAN	Inscriptional Parthian
I18N_UCHAR_UBLOCK_INSCRIPTIONAL_PAHLAVI	Inscriptional Pahlavi
I18N_UCHAR_UBLOCK_OLD_TURKIC	Old Turkic
I18N_UCHAR_UBLOCK_RUMI_NUMERAL_SYMBOLS	Rumi Numeral Symbols
I18N_UCHAR_UBLOCK_KAITHI	Kaithi
I18N_UCHAR_UBLOCK_EGYPTIAN_HIEROGLYPHS	Egyptian Hieroglyphs
I18N_UCHAR_UBLOCK_ENCLOSED_ALPHANUMERIC_SUPPLEMENT	Enclosed Alphanumeric Supplement
I18N_UCHAR_UBLOCK_ENCLOSED_IDEOGRAPHIC_SUPPLEMENT	Enclosed Ideographic Supplement
I18N_UCHAR_UBLOCK_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_C	CJK Unified Ideographs Extension C
I18N_UCHAR_UBLOCK_MANDAIC	Mandaic
I18N_UCHAR_UBLOCK_BATAK	Batak
I18N_UCHAR_UBLOCK_ETHIOPIC_EXTENDED_A	Ethiopic Extended A
I18N_UCHAR_UBLOCK_BRAHMI	Brahmi
I18N_UCHAR_UBLOCK_BAMUM_SUPPLEMENT	Bamum Supplement
I18N_UCHAR_UBLOCK_KANA_SUPPLEMENT	Kana Supplement
I18N_UCHAR_UBLOCK_PLAYING_CARDS	Playing Cards
I18N_UCHAR_UBLOCK_MISCELLANEOUS_SYMBOLS_AND_PICTOGRAPHS	Miscellaneous Symbols And Pictographs
I18N_UCHAR_UBLOCK_EMOTICONS	Emoticons
I18N_UCHAR_UBLOCK_TRANSPORT_AND_MAP_SYMBOLS	Transport And Map Symbols
I18N_UCHAR_UBLOCK_ALCHEMICAL_SYMBOLS	Alchemical Symbols
I18N_UCHAR_UBLOCK_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_D	CJK Unified Ideographs Extension D
I18N_UCHAR_UBLOCK_BASSA_VAH	Bassa Vah (Since 3.0)
I18N_UCHAR_UBLOCK_CAUCASIAN_ALBANIAN	Caucasian Albanian (Since 3.0)
I18N_UCHAR_UBLOCK_COPTIC_EPACT_NUMBERS	Coptic Epact Numbers (Since 3.0)
I18N_UCHAR_UBLOCK_COMBINING_DIACRITICAL_MARKS_EXTENDED	Combining Diacritical Marks Extended (Since 3.0)
I18N_UCHAR_UBLOCK_DUPLOYAN	Duployan (Since 3.0)
I18N_UCHAR_UBLOCK_ELBASAN	Elbasan (Since 3.0)
I18N_UCHAR_UBLOCK_GEOMETRIC_SHAPES_EXTENDED	Geometric Shapes Extended (Since 3.0)
I18N_UCHAR_UBLOCK_GRANTHA	Grantha (Since 3.0)
I18N_UCHAR_UBLOCK_KHOJKI	Khojki (Since 3.0)
I18N_UCHAR_UBLOCK_KHUDAWADI	Khudawadi (Since 3.0)
I18N_UCHAR_UBLOCK_LATIN_EXTENDED_E	Latin Extended E (Since 3.0)
I18N_UCHAR_UBLOCK_LINEAR_A	Linear A (Since 3.0)
I18N_UCHAR_UBLOCK_MAHAJANI	Mahajani (Since 3.0)
I18N_UCHAR_UBLOCK_MANICHAEAN	Manichaean (Since 3.0)
I18N_UCHAR_UBLOCK_MENDE_KIKAKUI	Mende Kikakui (Since 3.0)
I18N_UCHAR_UBLOCK_MODI	Modi (Since 3.0)
I18N_UCHAR_UBLOCK_MRO	Mro (Since 3.0)
I18N_UCHAR_UBLOCK_MYANMAR_EXTENDED_B	Myanmar Extended B (Since 3.0)
I18N_UCHAR_UBLOCK_NABATAEAN	Nabataean (Since 3.0)
I18N_UCHAR_UBLOCK_OLD_NORTH_ARABIAN	Old North Arabian (Since 3.0)
I18N_UCHAR_UBLOCK_OLD_PERMIC	Old Permic (Since 3.0)
I18N_UCHAR_UBLOCK_ORNAMENTAL_DINGBATS	Ornamental Dingbats (Since 3.0)
I18N_UCHAR_UBLOCK_PAHAWH_HMONG	Pahawh Hmong (Since 3.0)
I18N_UCHAR_UBLOCK_PALMYRENE	Palmyrene (Since 3.0)
I18N_UCHAR_UBLOCK_PAU_CIN_HAU	Pau Cin Hau (Since 3.0)
I18N_UCHAR_UBLOCK_PSALTER_PAHLAVI	Psalter Pahlavi (Since 3.0)
I18N_UCHAR_UBLOCK_SHORTHAND_FORMAT_CONTROLS	Shorthand Format Controls (Since 3.0)
I18N_UCHAR_UBLOCK_SIDDHAM	Siddham (Since 3.0)
I18N_UCHAR_UBLOCK_SINHALA_ARCHAIC_NUMBERS	Sinhala Archaic Numbers (Since 3.0)
I18N_UCHAR_UBLOCK_SUPPLEMENTAL_ARROWS_C	Supplemental Arrows C (Since 3.0)
I18N_UCHAR_UBLOCK_TIRHUTA	Tirhuta (Since 3.0)
I18N_UCHAR_UBLOCK_WARANG_CITI	Warang Citi (Since 3.0)
I18N_UCHAR_UBLOCK_COUNT	Count
I18N_UCHAR_UBLOCK_INVALID_CODE	Invalid Code

enum i18n_uchar_uproperty_e

Enumeration of constants for Unicode properties. The properties APIs are intended to reflect Unicode properties as defined in the Unicode Character Database (UCD) and Unicode Technical Reports (UTR). For details about the properties see http://www.unicode.org/ucd/ . For names of Unicode properties see the UCD file PropertyAliases.txt.

Since :: 2.3.1

Enumerator:

I18N_UCHAR_ALPHABETIC	Binary property Alphabetic. Lu+Ll+Lt+Lm+Lo+Nl+Other_Alphabetic
I18N_UCHAR_BINARY_START	First constant for binary Unicode properties.
I18N_UCHAR_ASCII_HEX_DIGIT	Binary property ASCII_Hex_Digit. 0-9 A-F a-f
I18N_UCHAR_BIDI_CONTROL	Binary property Bidi_Control. Format controls which have specific functions in the Bidi Algorithm.
I18N_UCHAR_BIDI_MIRRORED	Binary property Bidi_Mirrored. Characters that may change display in RTL text. See Bidi Algorithm, UTR 9.
I18N_UCHAR_DASH	Binary property Dash. Variations of dashes.
I18N_UCHAR_DEFAULT_IGNORABLE_CODE_POINT	Binary property Default_Ignorable_Code_Point (new in Unicode 3.2). Ignorable in most processing. <2060..206F, FFF0..FFFB, E0000..E0FFF>+Other_Default_Ignorable_Code_Point+(Cf+Cc+Cs-White_Space)
I18N_UCHAR_DEPRECATED	Binary property Deprecated (new in Unicode 3.2). The usage of deprecated characters is strongly discouraged.
I18N_UCHAR_DIACRITIC	Binary property Diacritic. Characters that linguistically modify the meaning of another character to which they apply.
I18N_UCHAR_EXTENDER	Binary property Extender. Extend the value or shape of a preceding alphabetic character, e.g. length and iteration marks.
I18N_UCHAR_FULL_COMPOSITION_EXCLUSION	Binary property Full_Composition_Exclusion. CompositionExclusions.txt+Singleton Decompositions+Non-Starter Decompositions.
I18N_UCHAR_GRAPHEME_BASE	Binary property Grapheme_Base (new in Unicode 3.2). For programmatic determination of grapheme cluster boundaries. [0..10FFFF]-Cc-Cf-Cs-Co-Cn-Zl-Zp-Grapheme_Link-Grapheme_Extend-CGJ
I18N_UCHAR_GRAPHEME_EXTEND	Binary property Grapheme_Extend (new in Unicode 3.2). For programmatic determination of grapheme cluster boundaries. Me+Mn+Mc+Other_Grapheme_Extend-Grapheme_Link-CGJ
I18N_UCHAR_GRAPHEME_LINK	Binary property Grapheme_Link (new in Unicode 3.2). For programmatic determination of grapheme cluster boundaries.
I18N_UCHAR_HEX_DIGIT	Binary property Hex_Digit. Characters commonly used for hexadecimal numbers.
I18N_UCHAR_HYPHEN	Binary property Hyphen. Dashes used to mark connections between pieces of words, plus the Katakana middle dot.
I18N_UCHAR_ID_CONTINUE	Binary property ID_Continue. Characters that can continue an identifier. DerivedCoreProperties.txt also says "NOTE: Cf characters should be filtered out." ID_Start+Mn+Mc+Nd+Pc
I18N_UCHAR_ID_START	Binary property ID_Start. Characters that can start an identifier. Lu+Ll+Lt+Lm+Lo+Nl
I18N_UCHAR_IDEOGRAPHIC	Binary property Ideographic. CJKV ideographs.
I18N_UCHAR_IDS_BINARY_OPERATOR	Binary property IDS_Binary_Operator (new in Unicode 3.2). For programmatic determination of Ideographic Description Sequences.
I18N_UCHAR_IDS_TRINARY_OPERATOR	Binary property IDS_Trinary_Operator (new in Unicode 3.2). For programmatic determination of Ideographic Description Sequences.
I18N_UCHAR_JOIN_CONTROL	Binary property Join_Control. Format controls for cursive joining and ligation.
I18N_UCHAR_LOGICAL_ORDER_EXCEPTION	Binary property Logical_Order_Exception (new in Unicode 3.2). Characters that do not use logical order and require special handling in most processing.
I18N_UCHAR_LOWERCASE	Binary property Lowercase. Ll+Other_Lowercase
I18N_UCHAR_MATH	Binary property Math. Sm+Other_Math
I18N_UCHAR_NONCHARACTER_CODE_POINT	Binary property Noncharacter_Code_Point. Code points that are explicitly defined as illegal for the encoding of characters.
I18N_UCHAR_QUOTATION_MARK	Binary property Quotation_Mark.
I18N_UCHAR_RADICAL	Binary property Radical (new in Unicode 3.2). For programmatic determination of Ideographic Description Sequences.
I18N_UCHAR_SOFT_DOTTED	Binary property Soft_Dotted (new in Unicode 3.2). Characters with a "soft dot", like i or j. An accent placed on these characters causes the dot to disappear.
I18N_UCHAR_TERMINAL_PUNCTUATION	Binary property Terminal_Punctuation. Punctuation characters that generally mark the end of textual units.
I18N_UCHAR_UNIFIED_IDEOGRAPH	Binary property Unified_Ideograph (new in Unicode 3.2). For programmatic determination of Ideographic Description Sequences.
I18N_UCHAR_UPPERCASE	Binary property Uppercase. Lu+Other_Uppercase
I18N_UCHAR_WHITE_SPACE	Binary property White_Space. Space characters+TAB+CR+LF-ZWSP-ZWNBSP
I18N_UCHAR_XID_CONTINUE	Binary property XID_Continue. ID_Continue modified to allow closure under normalization forms NFKC and NFKD.
I18N_UCHAR_XID_START	Binary property XID_Start. ID_Start modified to allow closure under normalization forms NFKC and NFKD.
I18N_UCHAR_CASE_SENSITIVE	Binary property Case_Sensitive. Either the source of a case mapping or in the target of a case mapping. Not the same as the general category Cased_Letter.
I18N_UCHAR_S_TERM	Binary property STerm (new in Unicode 4.0.1).
I18N_UCHAR_VARIATION_SELECTOR	Binary property Variation_Selector (new in Unicode 4.0.1). Indicates all those characters that qualify as Variation Selectors.
I18N_UCHAR_NFD_INERT	Binary property NFD_Inert. ICU-specific property for characters that are inert under NFD, i.e., they do not interact with adjacent characters.
I18N_UCHAR_NFKD_INERT	Binary property NFKD_Inert. ICU-specific property for characters that are inert under NFKD, i.e., they do not interact with adjacent characters.
I18N_UCHAR_NFC_INERT	Binary property NFC_Inert. ICU-specific property for characters that are inert under NFC, i.e., they do not interact with adjacent characters.
I18N_UCHAR_NFKC_INERT	Binary property NFKC_Inert. ICU-specific property for characters that are inert under NFKC, i.e., they do not interact with adjacent characters.
I18N_UCHAR_SEGMENT_STARTER	Binary Property Segment_Starter. Property for characters that are starters in terms of Unicode normalization and combining character sequences. They have ccc=0 and do not occur in non-initial position of the canonical decomposition of any character (like a-umlaut in NFD and a Jamo T in an NFD(Hangul LVT)).
I18N_UCHAR_PATTERN_SYNTAX	Binary property Pattern_Syntax (new in Unicode 4.1).
I18N_UCHAR_PATTERN_WHITE_SPACE	Binary property Pattern_White_Space (new in Unicode 4.1).
I18N_UCHAR_POSIX_ALNUM	Binary property alnum (a C/POSIX character class).
I18N_UCHAR_POSIX_BLANK	Binary property blank (a C/POSIX character class).
I18N_UCHAR_POSIX_GRAPH	Binary property graph (a C/POSIX character class).
I18N_UCHAR_POSIX_PRINT	Binary property print (a C/POSIX character class).
I18N_UCHAR_POSIX_XDIGIT	Binary property xdigit (a C/POSIX character class).
I18N_UCHAR_CASED	Binary property Cased. For Lowercase, Uppercase and Titlecase characters.
I18N_UCHAR_CASE_IGNORABLE	Binary property Case_Ignorable. Used in context-sensitive case mappings.
I18N_UCHAR_CHANGES_WHEN_LOWERCASED	Binary property Changes_When_Lowercased.
I18N_UCHAR_CHANGES_WHEN_UPPERCASED	Binary property Changes_When_Uppercased.
I18N_UCHAR_CHANGES_WHEN_TITLECASED	Binary property Changes_When_Titlecased.
I18N_UCHAR_CHANGES_WHEN_CASEFOLDED	Binary property Changes_When_Casefolded.
I18N_UCHAR_CHANGES_WHEN_CASEMAPPED	Binary property Changes_When_Casemapped.
I18N_UCHAR_CHANGES_WHEN_NFKC_CASEFOLDED	Binary property Changes_When_NFKC_Casefolded.
I18N_UCHAR_BINARY_LIMIT	One more than the last constant for binary Unicode properties.
I18N_UCHAR_BIDI_CLASS	Enumerated property Bidi_Class. Same as u_charDirection, returns i18n_uchar_direction_e values.
I18N_UCHAR_INT_START	First constant for enumerated/integer Unicode properties.
I18N_UCHAR_BLOCK	Enumerated property Block. Returns i18n_uchar_ublock_code_e values.
I18N_UCHAR_CANONICAL_COMBINING_CLASS	Enumerated property Canonical_Combining_Class. Returns 8-bit numeric values.
I18N_UCHAR_DECOMPOSITION_TYPE	Enumerated property Decomposition_Type. Returns i18n_uchar_u_decomposition_type_e values.
I18N_UCHAR_EAST_ASIAN_WIDTH	Enumerated property East_Asian_Width. Returns i18n_uchar_u_east_asian_width_e values.
I18N_UCHAR_GENERAL_CATEGORY	Enumerated property General_Category. Returns i18n_uchar_category_e values.
I18N_UCHAR_JOINING_GROUP	Enumerated property Joining_Group. Returns i18n_uchar_u_joining_group_e values.
I18N_UCHAR_JOINING_TYPE	Enumerated property Joining_Type. Returns i18n_uchar_u_joining_type_e values.
I18N_UCHAR_LINE_BREAK	Enumerated property Line_Break. Returns i18n_uchar_u_line_break_e values.
I18N_UCHAR_NUMERIC_TYPE	Enumerated property Numeric_Type. Returns i18n_uchar_u_numeric_type_e values.
I18N_UCHAR_SCRIPT	Enumerated property Script. Returns i18n_uscript_code_e values.
I18N_UCHAR_HANGUL_SYLLABLE_TYPE	Enumerated property Hangul_Syllable_Type, new in Unicode 4. Returns i18n_uchar_u_hangul_syllable_type_e values.
I18N_UCHAR_NFD_QUICK_CHECK	Enumerated property NFD_Quick_Check. Returns i18n_unormalization_check_result_e values.
I18N_UCHAR_NFKD_QUICK_CHECK	Enumerated property NFKD_Quick_Check. Returns i18n_unormalization_check_result_e values.
I18N_UCHAR_NFC_QUICK_CHECK	Enumerated property NFC_Quick_Check. Returns i18n_unormalization_check_result_e values.
I18N_UCHAR_NFKC_QUICK_CHECK	Enumerated property NFKC_Quick_Check. Returns i18n_unormalization_check_result_e values.
I18N_UCHAR_LEAD_CANONICAL_COMBINING_CLASS	Enumerated property Lead_Canonical_Combining_Class. Returns 8-bit numeric values.
I18N_UCHAR_TRAIL_CANONICAL_COMBINING_CLASS	Enumerated property Trail_Canonical_Combining_Class. Returns 8-bit numeric values.
I18N_UCHAR_GRAPHEME_CLUSTER_BREAK	Enumerated property Grapheme_Cluster_Break (new in Unicode 4.1). Returns i18n_uchar_u_grapheme_cluster_break_e values.
I18N_UCHAR_SENTENCE_BREAK	Enumerated property Sentence_Break (new in Unicode 4.1). Returns i18n_uchar_u_sentence_break_e values.
I18N_UCHAR_WORD_BREAK	Enumerated property Word_Break (new in Unicode 4.1). Returns i18n_uchar_u_word_break_values_e values.
I18N_UCHAR_BIDI_PAIRED_BRACKET_TYPE	Enumerated property Bidi_Paired_Bracket_Type. Returns i18n_uchar_u_bidi_paired_bracket_type_e values.
I18N_UCHAR_INT_LIMIT	One more than the last constant for enumerated/integer Unicode properties.
I18N_UCHAR_GENERAL_CATEGORY_MASK	Bitmask property General_Category_Mask. Mask values should be cast to uint32_t.
I18N_UCHAR_MASK_START	First constant for bit-mask Unicode properties.
I18N_UCHAR_MASK_LIMIT	One more than the last constant for bit-mask Unicode properties.
I18N_UCHAR_NUMERIC_VALUE	Double property Numeric_Value.
I18N_UCHAR_DOUBLE_START	First constant for double Unicode properties.
I18N_UCHAR_DOUBLE_LIMIT	One more than the last constant for double Unicode properties.
I18N_UCHAR_AGE	String property Age.
I18N_UCHAR_STRING_START	First constant for string Unicode properties.
I18N_UCHAR_BIDI_MIRRORING_GLYPH	String property Bidi_Mirroring_Glyph.
I18N_UCHAR_CASE_FOLDING	String property Case_Folding.
I18N_UCHAR_LOWERCASE_MAPPING	String property Lowercase_Mapping.
I18N_UCHAR_NAME	String property Name.
I18N_UCHAR_SIMPLE_CASE_FOLDING	String property Simple_Case_Folding.
I18N_UCHAR_SIMPLE_LOWERCASE_MAPPING	String property Simple_Lowercase_Mapping.
I18N_UCHAR_SIMPLE_TITLECASE_MAPPING	String property Simple_Titlecase_Mapping.
I18N_UCHAR_SIMPLE_UPPERCASE_MAPPING	String property Simple_Uppercase_Mapping.
I18N_UCHAR_TITLECASE_MAPPING	String property Titlecase_Mapping.
I18N_UCHAR_UPPERCASE_MAPPING	String property Uppercase_Mapping.
I18N_UCHAR_BIDI_PAIRED_BRACKET	String property Bidi_Paired_Bracket.
I18N_UCHAR_STRING_LIMIT	One more than the last constant for string Unicode properties.
I18N_UCHAR_SCRIPT_EXTENSIONS	Provisional property Script_Extensions (new in Unicode 6.0).
I18N_UCHAR_OTHER_PROPERTY_START	First constant for Unicode properties with unusual value types.
I18N_UCHAR_OTHER_PROPERTY_LIMIT	One more than the last constant for Unicode properties with unusual value types.
I18N_UCHAR_INVALID_CODE	Represents a nonexistent or invalid property or property value.

enum i18n_uscript_code_e

Constants for ISO 15924 script codes.

Since :: 2.4

Enumerator:

I18N_USCRIPT_COMMON	Zyyy
I18N_USCRIPT_INHERITED	Zinh, "Code for inherited script", for non-spacing combining marks; also Qaai
I18N_USCRIPT_ARABIC	Arab
I18N_USCRIPT_ARMENIAN	Armn
I18N_USCRIPT_BENGALI	Beng
I18N_USCRIPT_BOPOMOFO	Bopo
I18N_USCRIPT_CHEROKEE	Cher
I18N_USCRIPT_COPTIC	Copt
I18N_USCRIPT_CYRILLIC	Cyrl
I18N_USCRIPT_DESERET	Dsrt
I18N_USCRIPT_DEVANAGARI	Deva
I18N_USCRIPT_ETHIOPIC	Ethi
I18N_USCRIPT_GEORGIAN	Geor
I18N_USCRIPT_GOTHIC	Goth
I18N_USCRIPT_GREEK	Grek
I18N_USCRIPT_GUJARATI	Gujr
I18N_USCRIPT_GURMUKHI	Guru
I18N_USCRIPT_HAN	Hani
I18N_USCRIPT_HANGUL	Hang
I18N_USCRIPT_HEBREW	Hebr
I18N_USCRIPT_HIRAGANA	Hira
I18N_USCRIPT_KANNADA	Knda
I18N_USCRIPT_KATAKANA	Kana
I18N_USCRIPT_KHMER	Khmr
I18N_USCRIPT_LAO	Laoo
I18N_USCRIPT_LATIN	Latn
I18N_USCRIPT_MALAYALAM	Mlym
I18N_USCRIPT_MONGOLIAN	Mong
I18N_USCRIPT_MYANMAR	Mymr
I18N_USCRIPT_OGHAM	Ogam
I18N_USCRIPT_OLD_ITALIC	Ital
I18N_USCRIPT_ORIYA	Orya
I18N_USCRIPT_RUNIC	Runr
I18N_USCRIPT_SINHALA	Sinh
I18N_USCRIPT_SYRIAC	Syrc
I18N_USCRIPT_TAMIL	Taml
I18N_USCRIPT_TELUGU	Telu
I18N_USCRIPT_THAANA	Thaa
I18N_USCRIPT_THAI	Thai
I18N_USCRIPT_TIBETAN	Tibt
I18N_USCRIPT_CANADIAN_ABORIGINAL	Cans, Canadian_Aboriginal script.
I18N_USCRIPT_UCAS	Canadian_Aboriginal script (alias).
I18N_USCRIPT_YI	Yiii
I18N_USCRIPT_TAGALOG	Tglg
I18N_USCRIPT_HANUNOO	Hano
I18N_USCRIPT_BUHID	Buhd
I18N_USCRIPT_TAGBANWA	Tagb
I18N_USCRIPT_BRAILLE	Brai
I18N_USCRIPT_CYPRIOT	Cprt
I18N_USCRIPT_LIMBU	Limb
I18N_USCRIPT_LINEAR_B	Linb
I18N_USCRIPT_OSMANYA	Osma
I18N_USCRIPT_SHAVIAN	Shaw
I18N_USCRIPT_TAI_LE	Tale
I18N_USCRIPT_UGARITIC	Ugar
I18N_USCRIPT_KATAKANA_OR_HIRAGANA	Hrkt
I18N_USCRIPT_BUGINESE	Bugi
I18N_USCRIPT_GLAGOLITIC	Glag
I18N_USCRIPT_KHAROSHTHI	Khar
I18N_USCRIPT_SYLOTI_NAGRI	Sylo
I18N_USCRIPT_NEW_TAI_LUE	Talu
I18N_USCRIPT_TIFINAGH	Tfng
I18N_USCRIPT_OLD_PERSIAN	Xpeo
I18N_USCRIPT_BALINESE	Bali
I18N_USCRIPT_BATAK	Batk
I18N_USCRIPT_BLISSYMBOLS	Blis
I18N_USCRIPT_BRAHMI	Brah
I18N_USCRIPT_CHAM	Cham
I18N_USCRIPT_CIRTH	Cirt
I18N_USCRIPT_OLD_CHURCH_SLAVONIC_CYRILLIC	Cyrs
I18N_USCRIPT_DEMOTIC_EGYPTIAN	Egyd
I18N_USCRIPT_HIERATIC_EGYPTIAN	Egyh
I18N_USCRIPT_EGYPTIAN_HIEROGLYPHS	Egyp
I18N_USCRIPT_KHUTSURI	Geok
I18N_USCRIPT_SIMPLIFIED_HAN	Hans
I18N_USCRIPT_TRADITIONAL_HAN	Hant
I18N_USCRIPT_PAHAWH_HMONG	Hmng
I18N_USCRIPT_OLD_HUNGARIAN	Hung
I18N_USCRIPT_HARAPPAN_INDUS	Inds
I18N_USCRIPT_JAVANESE	Java
I18N_USCRIPT_KAYAH_LI	Kali
I18N_USCRIPT_LATIN_FRAKTUR	Latf
I18N_USCRIPT_LATIN_GAELIC	Latg
I18N_USCRIPT_LEPCHA	Lepc
I18N_USCRIPT_LINEAR_A	Lina
I18N_USCRIPT_MANDAIC	Mand
I18N_USCRIPT_MAYAN_HIEROGLYPHS	Maya
I18N_USCRIPT_MEROITIC_HIEROGLYPHS	Mero
I18N_USCRIPT_NKO	Nkoo
I18N_USCRIPT_ORKHON	Orkh
I18N_USCRIPT_OLD_PERMIC	Perm
I18N_USCRIPT_PHAGS_PA	Phag
I18N_USCRIPT_PHOENICIAN	Phnx
I18N_USCRIPT_PHONETIC_POLLARD	Plrd
I18N_USCRIPT_RONGORONGO	Roro
I18N_USCRIPT_SARATI	Sara
I18N_USCRIPT_ESTRANGELO_SYRIAC	Syre
I18N_USCRIPT_WESTERN_SYRIAC	Syrj
I18N_USCRIPT_EASTERN_SYRIAC	Syrn
I18N_USCRIPT_TENGWAR	Teng
I18N_USCRIPT_VAI	Vaii
I18N_USCRIPT_VISIBLE_SPEECH	Visp
I18N_USCRIPT_CUNEIFORM	Xsux
I18N_USCRIPT_UNWRITTEN_LANGUAGES	Zxxx
I18N_USCRIPT_UNKNOWN	Zzzz, Unknown="Code for uncoded script", for unassigned code points
I18N_USCRIPT_CARIAN	Cari
I18N_USCRIPT_JAPANESE	Jpan
I18N_USCRIPT_LANNA	Lana
I18N_USCRIPT_LYCIAN	Lyci
I18N_USCRIPT_LYDIAN	Lydi
I18N_USCRIPT_OL_CHIKI	Olck
I18N_USCRIPT_REJANG	Rjng
I18N_USCRIPT_SAURASHTRA	Saur
I18N_USCRIPT_SIGN_WRITING	Sgnw
I18N_USCRIPT_SUNDANESE	Sund
I18N_USCRIPT_MOON	Moon
I18N_USCRIPT_MEITEI_MAYEK	Mtei
I18N_USCRIPT_IMPERIAL_ARAMAIC	Armi
I18N_USCRIPT_AVESTAN	Avst
I18N_USCRIPT_CHAKMA	Cakm
I18N_USCRIPT_KOREAN	Kore
I18N_USCRIPT_KAITHI	Kthi
I18N_USCRIPT_MANICHAEAN	Mani
I18N_USCRIPT_INSCRIPTIONAL_PAHLAVI	Phli
I18N_USCRIPT_PSALTER_PAHLAVI	Phlp
I18N_USCRIPT_BOOK_PAHLAVI	Phlv
I18N_USCRIPT_INSCRIPTIONAL_PARTHIAN	Prti
I18N_USCRIPT_SAMARITAN	Samr
I18N_USCRIPT_TAI_VIET	Tavt
I18N_USCRIPT_MATHEMATICAL_NOTATION	Zmth
I18N_USCRIPT_SYMBOLS	Zsym
I18N_USCRIPT_BAMUM	Bamu
I18N_USCRIPT_LISU	Lisu
I18N_USCRIPT_NAKHI_GEBA	Nkgb
I18N_USCRIPT_OLD_SOUTH_ARABIAN	Sarb
I18N_USCRIPT_BASSA_VAH	Bass
I18N_USCRIPT_DUPLOYAN_SHORTAND	Dupl
I18N_USCRIPT_ELBASAN	Elba
I18N_USCRIPT_GRANTHA	Gran
I18N_USCRIPT_KPELLE	Kpel
I18N_USCRIPT_LOMA	Loma
I18N_USCRIPT_MENDE	Mend
I18N_USCRIPT_MEROITIC_CURSIVE	Merc
I18N_USCRIPT_OLD_NORTH_ARABIAN	Narb
I18N_USCRIPT_NABATAEAN	Nbat
I18N_USCRIPT_PALMYRENE	Palm
I18N_USCRIPT_SINDHI	Sind
I18N_USCRIPT_WARANG_CITI	Wara
I18N_USCRIPT_AFAKA	Afak
I18N_USCRIPT_JURCHEN	Jurc
I18N_USCRIPT_MRO	Mroo
I18N_USCRIPT_NUSHU	Nshu
I18N_USCRIPT_SHARADA	Shrd
I18N_USCRIPT_SORA_SOMPENG	Sora
I18N_USCRIPT_TAKRI	Takr
I18N_USCRIPT_TANGUT	Tang
I18N_USCRIPT_WOLEAI	Wole
I18N_USCRIPT_ANATOLIAN_HIEROGLYPHS	Hluw
I18N_USCRIPT_KHOJKI	Khoj
I18N_USCRIPT_TIRHUTA	Tirh
I18N_USCRIPT_CODE_LIMIT	Count of i18n_uscript_code_e enumerators

Function Documentation

int i18n_uchar_get_int_property_value	(	i18n_uchar32	c,
		i18n_uchar_uproperty_e	which,
		int32_t *	property_val
	)

Gets the property value for an enumerated or integer Unicode property for a code point. Also returns binary and mask property values.

    int property_value;
    i18n_uchar_u_east_asian_width_e east_asian_width;
    i18n_uchar_get_int_property_value(c, I18N_UCHAR_EAST_ASIAN_WIDTH, &property_value);
    east_asian_width = (i18n_uchar_u_east_asian_width_e)property_value;

    int property_value;
    bool is_ideographic;
    i18n_uchar_get_int_property_value(c, I18N_UCHAR_IDEOGRAPHIC, &property_value);
    is_ideographic = (bool)property_value;

Since :: 2.3.1

Parameters:

[in]	c	The code point to test.
[in]	which	The i18n_uchar_uproperty_e selector constant, identifies which property to check. Must be I18N_UCHAR_BINARY_START<=which<I18N_UCHAR_BINARY_LIMIT or I18N_UCHAR_INT_START<=which<I18N_UCHAR_INT_LIMIT or I18N_UCHAR_MASK_START<=which<I18N_UCHAR_MASK_LIMIT.
[out]	property_val	The numeric value that is directly the property value or, for enumerated properties, corresponds to the numeric value of the enumerated constant of the respective property value enumeration type (cast to enum type if necessary). Returns `0` or `1` (for false/true) for binary Unicode properties. Returns a bit-mask for mask properties. Returns `0` if 'which' is out of bounds or if the Unicode version does not have data for the property at all, or not for this code point.

Return values:

I18N_ERROR_NONE	Successful
I18N_ERROR_INVALID_PARAMETER	Invalid function parameter

int i18n_uchar_get_ublock_code	(	i18n_uchar32	c,
		i18n_uchar_ublock_code_e *	block_val
	)

Gets the Unicode allocation block that contains the character.

Since :: 2.3.1

Parameters:

[in]	c	The code point to test
[out]	block_val	The block value for the code point

Return values:

I18N_ERROR_NONE	Successful
I18N_ERROR_INVALID_PARAMETER	Invalid function parameter

Required Header

Overview

Sample Code 1

Functions

Typedefs

Defines

Define Documentation

Typedef Documentation

Enumeration Type Documentation

Function Documentation