Tizen Native API  3.0

The Uchar module provides low-level access to the Unicode Character Database.

Required Header

#include <utils_i18n.h>

Overview

The Uchar module provides low-level access to the Unicode Character Database.

Sample Code 1

Gets the value of the enumerated 'East Asian Width' property for a character, and the Unicode allocation block that contains the character.

    int ret = I18N_ERROR_NONE;
    i18n_uchar32 code_point = 0;
    int property_value = 0;
    i18n_uchar_u_east_asian_width_e east_asian_width = I18N_UCHAR_U_EA_NEUTRAL;
    i18n_uchar_ublock_code_e block_code = I18N_UCHAR_UBLOCK_NO_BLOCK;

    // How to get the east asian width type for 's'
    code_point = 0x73;    // 's'
    ret = i18n_uchar_get_int_property_value(code_point, I18N_UCHAR_EAST_ASIAN_WIDTH, &property_value);
    if (ret != I18N_ERROR_NONE) {
        dlog_print(DLOG_INFO, LOG_TAG, "Error occured!!\n");
    } else {
        east_asian_width = (i18n_uchar_u_east_asian_width_e)property_value;
        dlog_print(DLOG_INFO, LOG_TAG, "East Asian Width Type for ( %.4x ) is ( %d )\n", code_point, east_asian_width);
        // East Asian Width Type for ( 0073 ) is ( 4 ) which is I18N_UCHAR_U_EA_NARROW
    }

    // How to get the block code for 's'
    ret = i18n_uchar_get_ublock_code(code_point, &block_code);
    if (ret != I18N_ERROR_NONE) {
        dlog_print(DLOG_INFO, LOG_TAG, "Error occured!!\n");
    } else {
        dlog_print(DLOG_INFO, LOG_TAG, "block name for ( %.4x ) is ( %d )\n", code_point, block_code);
        // block code for ( 0073 ) is ( 1 ) which is I18N_UCHAR_UBLOCK_BASIC_LATIN
    }

    // How to get the east asian width type for 'sung' as ideographs
    code_point = 0x661F;    // 'sung' as ideographs
    ret = i18n_uchar_get_int_property_value(code_point, I18N_UCHAR_EAST_ASIAN_WIDTH, &property_value);
    if (ret != I18N_ERROR_NONE) {
        dlog_print(DLOG_INFO, LOG_TAG, "Error occured!!\n");
    } else {
        east_asian_width = (i18n_uchar_u_east_asian_width_e)property_value;
        dlog_print(DLOG_INFO, LOG_TAG, "East Asian Width Type for ( %.4x ) is ( %d )\n", code_point, east_asian_width);
        // East Asian Width Type for ( 661f ) is ( 5 ) which is I18N_UCHAR_U_EA_WIDE
    }

    // How to get the block code for 'sung' as ideographs
    ret = i18n_uchar_get_ublock_code(code_point, &block_code);
    if (ret != I18N_ERROR_NONE) {
        dlog_print(DLOG_INFO, LOG_TAG, "Error occured!!\n");
    } else {
        dlog_print(DLOG_INFO, LOG_TAG, "block name for ( %.4x ) is ( %d )\n", code_point, block_code);
        // block code for ( 661f ) is ( 71 ) which is I18N_UCHAR_UBLOCK_CJK_UNIFIED_IDEOGRAPHS
    }

    // How to get the east asian width type for 'sung' as hangul
    code_point = 0xC131;    // 'sung' as hangul
    ret = i18n_uchar_get_int_property_value(code_point, I18N_UCHAR_EAST_ASIAN_WIDTH, &property_value);
    if (ret != I18N_ERROR_NONE) {
        dlog_print(DLOG_INFO, LOG_TAG, "Error occured!!\n");
    } else {
        east_asian_width = (i18n_uchar_u_east_asian_width_e)property_value;
        dlog_print(DLOG_INFO, LOG_TAG, "East Asian Width Type for ( %.4x ) is ( %d )\n", code_point, east_asian_width);
        // East Asian Width Type for ( c131 ) is ( 5 ) which is I18N_UCHAR_U_EA_WIDE
    }

    // How to get the block code for 'sung' as hangul
    ret = i18n_uchar_get_ublock_code(code_point, &block_code);
    if (ret != I18N_ERROR_NONE) {
        dlog_print(DLOG_INFO, LOG_TAG, "Error occured!!\n");
    } else {
        dlog_print(DLOG_INFO, LOG_TAG, "block name for ( %.4x ) is ( %d )\n", code_point, block_code);
        // block code for ( c131 ) is ( 74 ) which is I18N_UCHAR_UBLOCK_HANGUL_SYLLABLES
    }

Functions

int i18n_uchar_get_int_property_value (i18n_uchar32 c, i18n_uchar_uproperty_e which, int32_t *property_val)
 Gets the property value for an enumerated property for a code point.
int i18n_uchar_get_ublock_code (i18n_uchar32 c, i18n_uchar_ublock_code_e *block_val)
 Gets the Unicode allocation block that contains the character.

Typedefs

typedef uint16_t i18n_uchar
 i18n_uchar.
typedef int32_t i18n_uchar32
 i18n_uchar32.
typedef int8_t i18n_ubool
 i18n_ubool.

Defines

#define I18N_U_MASK(x)   ((uint32_t)1<<(x))
#define I18N_U_GC_CN_MASK   I18N_U_MASK(I18N_UCHAR_U_GENERAL_OTHER_TYPES)
#define I18N_U_GC_LU_MASK   I18N_U_MASK(I18N_UCHAR_U_UPPERCASE_LETTER)
#define I18N_U_GC_LL_MASK   I18N_U_MASK(I18N_UCHAR_U_LOWERCASE_LETTER)
#define I18N_U_GC_LT_MASK   I18N_U_MASK(I18N_UCHAR_U_TITLECASE_LETTER)
#define I18N_U_GC_LM_MASK   I18N_U_MASK(I18N_UCHAR_U_MODIFIER_LETTER)
#define I18N_U_GC_LO_MASK   I18N_U_MASK(I18N_UCHAR_U_OTHER_LETTER)
#define I18N_U_GC_MN_MASK   I18N_U_MASK(I18N_UCHAR_U_NON_SPACING_MARK)
#define I18N_U_GC_ME_MASK   I18N_U_MASK(I18N_UCHAR_U_ENCLOSING_MARK)
#define I18N_U_GC_MC_MASK   I18N_U_MASK(I18N_UCHAR_U_COMBINING_SPACING_MARK)
#define I18N_U_GC_ND_MASK   I18N_U_MASK(I18N_UCHAR_U_DECIMAL_DIGIT_NUMBER)
#define I18N_U_GC_NL_MASK   I18N_U_MASK(I18N_UCHAR_U_LETTER_NUMBER)
#define I18N_U_GC_NO_MASK   I18N_U_MASK(I18N_UCHAR_U_OTHER_NUMBER)
#define I18N_U_GC_ZS_MASK   I18N_U_MASK(I18N_UCHAR_U_SPACE_SEPARATOR)
#define I18N_U_GC_ZL_MASK   I18N_U_MASK(I18N_UCHAR_U_LINE_SEPARATOR)
#define I18N_U_GC_ZP_MASK   I18N_U_MASK(I18N_UCHAR_U_PARAGRAPH_SEPARATOR)
#define I18N_U_GC_CC_MASK   I18N_U_MASK(I18N_UCHAR_U_CONTROL_CHAR)
#define I18N_U_GC_CF_MASK   I18N_U_MASK(I18N_UCHAR_U_FORMAT_CHAR)
#define I18N_U_GC_CO_MASK   I18N_U_MASK(I18N_UCHAR_U_PRIVATE_USE_CHAR)
#define I18N_U_GC_CS_MASK   I18N_U_MASK(I18N_UCHAR_U_SURROGATE)
#define I18N_U_GC_PD_MASK   I18N_U_MASK(I18N_UCHAR_U_DASH_PUNCTUATION)
#define I18N_U_GC_PS_MASK   I18N_U_MASK(I18N_UCHAR_U_START_PUNCTUATION)
#define I18N_U_GC_PE_MASK   I18N_U_MASK(I18N_UCHAR_U_END_PUNCTUATION)
#define I18N_U_GC_PC_MASK   I18N_U_MASK(I18N_UCHAR_U_CONNECTOR_PUNCTUATION)
#define I18N_U_GC_PO_MASK   I18N_U_MASK(I18N_UCHAR_U_OTHER_PUNCTUATION)
#define I18N_U_GC_SM_MASK   I18N_U_MASK(I18N_UCHAR_U_MATH_SYMBOL)
#define I18N_U_GC_SC_MASK   I18N_U_MASK(I18N_UCHAR_U_CURRENCY_SYMBOL)
#define I18N_U_GC_SK_MASK   I18N_U_MASK(I18N_UCHAR_U_MODIFIER_SYMBOL)
#define I18N_U_GC_SO_MASK   I18N_U_MASK(I18N_UCHAR_U_OTHER_SYMBOL)
#define I18N_U_GC_PI_MASK   I18N_U_MASK(I18N_UCHAR_U_INITIAL_PUNCTUATION)
#define I18N_U_GC_PF_MASK   I18N_U_MASK(I18N_UCHAR_U_FINAL_PUNCTUATION)
#define I18N_U_GC_L_MASK   (I18N_U_GC_LU_MASK|I18N_U_GC_LL_MASK|I18N_U_GC_LT_MASK|I18N_U_GC_LM_MASK|I18N_U_GC_LO_MASK)
#define I18N_U_GC_LC_MASK   (I18N_U_GC_LU_MASK|I18N_U_GC_LL_MASK|I18N_U_GC_LT_MASK)
#define I18N_U_GC_M_MASK   (I18N_U_GC_MN_MASK|I18N_U_GC_ME_MASK|I18N_U_GC_MC_MASK)
#define I18N_U_GC_N_MASK   (I18N_U_GC_ND_MASK|I18N_U_GC_NL_MASK|I18N_U_GC_NO_MASK)
#define I18N_U_GC_Z_MASK   (I18N_U_GC_ZS_MASK|I18N_U_GC_ZL_MASK|I18N_U_GC_ZP_MASK)
#define I18N_U_GC_C_MASK   (I18N_U_GC_CN_MASK|I18N_U_GC_CC_MASK|I18N_U_GC_CF_MASK|I18N_U_GC_CO_MASK|I18N_U_GC_CS_MASK)
#define I18N_U_GC_P_MASK   (I18N_U_GC_PD_MASK|I18N_U_GC_PS_MASK|I18N_U_GC_PE_MASK|I18N_U_GC_PC_MASK|I18N_U_GC_PO_MASK|I18N_U_GC_PI_MASK|I18N_U_GC_PF_MASK)
#define I18N_U_GC_S_MASK   (I18N_U_GC_SM_MASK|I18N_U_GC_SC_MASK|I18N_U_GC_SK_MASK|I18N_U_GC_SO_MASK)
#define I18N_U_NO_NUMERIC_VALUE   ((double)-123456789.)
#define I18N_U_GET_GC_MASK(c)   I18N_U_MASK(u_charType(c))
#define I18N_U_FOLD_CASE_DEFAULT   0
 Option value for case folding: use default mappings defined in CaseFolding.txt.
#define I18N_U_FOLD_CASE_EXCLUDE_SPECIAL_I   1
 Option value for case folding:
Use the modified set of mappings provided in CaseFolding.txt to handle dotted I and dotless i appropriately for Turkic languages (tr, az).
Before Unicode 3.2, CaseFolding.txt contains mappings marked with 'I' that are to be included for default mappings and excluded for the Turkic-specific mappings.
Unicode 3.2 CaseFolding.txt instead contains mappings marked with 'T' that are to be excluded for default mappings and included for the Turkic-specific mappings.
#define I18N_USEARCH_DONE   -1
 DONE is returned by i18n_usearch_previous() and i18n_usearch_next() after all valid matches have been returned, and by i18n_usearch_first() and i18n_usearch_last() if there are no matches at all.

Define Documentation

#define I18N_U_FOLD_CASE_DEFAULT   0

Option value for case folding: use default mappings defined in CaseFolding.txt.

Since :
2.3.1

Option value for case folding:
Use the modified set of mappings provided in CaseFolding.txt to handle dotted I and dotless i appropriately for Turkic languages (tr, az).
Before Unicode 3.2, CaseFolding.txt contains mappings marked with 'I' that are to be included for default mappings and excluded for the Turkic-specific mappings.
Unicode 3.2 CaseFolding.txt instead contains mappings marked with 'T' that are to be excluded for default mappings and included for the Turkic-specific mappings.

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1

I18N_U_GC_XX_MASK constants are bit flags corresponding to Unicode general category values.

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1

Mask constant for multiple i18n_uchar_category_e bits (LC Cased Letters).

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1

Mask constant for multiple i18n_uchar_category_e bits (M Marks).

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1

Mask constant for multiple i18n_uchar_category_e bits (N Numbers).

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1

Mask constant for multiple i18n_uchar_category_e bits (S Symbols).

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1

Mask constant for multiple i18n_uchar_category_e bits (Z Separators).

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1

Mask constant for a i18n_uchar_category_e.

Since :
2.3.1
#define I18N_U_GET_GC_MASK (   c)    I18N_U_MASK(u_charType(c))

Get a single-bit bit set for the general category of a character.

Since :
2.3.1
#define I18N_U_MASK (   x)    ((uint32_t)1<<(x))

Get a single-bit bit set (a flag) from a bit number 0..31.

Since :
2.3.1
#define I18N_U_NO_NUMERIC_VALUE   ((double)-123456789.)

Special value that is returned by i18n_uchar_get_numeric_value() (not implemented yet) when no numeric value is defined for a code point.

Since :
2.3.1
#define I18N_USEARCH_DONE   -1

DONE is returned by i18n_usearch_previous() and i18n_usearch_next() after all valid matches have been returned, and by i18n_usearch_first() and i18n_usearch_last() if there are no matches at all.

Since :
2.3.1

Typedef Documentation

typedef int8_t i18n_ubool

i18n_ubool.

Since :
2.3.1
typedef uint16_t i18n_uchar

i18n_uchar.

Since :
2.3.1
typedef int32_t i18n_uchar32

i18n_uchar32.

Since :
2.3.1

Enumeration Type Documentation

Enumeration for Unicode general category types.

Since :
2.3.1
Enumerator:
I18N_UCHAR_U_UNASSIGNED 

Non-category for unassigned and non-character code points

I18N_UCHAR_U_GENERAL_OTHER_TYPES 

Cn "Other, Not Assigned (no characters in [UnicodeData.txt] have this property)" (same as I18N_UCHAR_U_UNASSIGNED!)

I18N_UCHAR_U_UPPERCASE_LETTER 

Lu

I18N_UCHAR_U_LOWERCASE_LETTER 

Ll

I18N_UCHAR_U_TITLECASE_LETTER 

Lt

I18N_UCHAR_U_MODIFIER_LETTER 

Lm

I18N_UCHAR_U_OTHER_LETTER 

Lo

I18N_UCHAR_U_NON_SPACING_MARK 

Mn

I18N_UCHAR_U_ENCLOSING_MARK 

Me

I18N_UCHAR_U_COMBINING_SPACING_MARK 

Mc

I18N_UCHAR_U_DECIMAL_DIGIT_NUMBER 

Nd

I18N_UCHAR_U_LETTER_NUMBER 

Nl

I18N_UCHAR_U_OTHER_NUMBER 

No

I18N_UCHAR_U_SPACE_SEPARATOR 

Zs

I18N_UCHAR_U_LINE_SEPARATOR 

Zl

I18N_UCHAR_U_PARAGRAPH_SEPARATOR 

Zp

I18N_UCHAR_U_CONTROL_CHAR 

Cc

I18N_UCHAR_U_FORMAT_CHAR 

Cf

I18N_UCHAR_U_PRIVATE_USE_CHAR 

Co

I18N_UCHAR_U_SURROGATE 

Cs

I18N_UCHAR_U_DASH_PUNCTUATION 

Pd

I18N_UCHAR_U_START_PUNCTUATION 

Ps

I18N_UCHAR_U_END_PUNCTUATION 

Pe

I18N_UCHAR_U_CONNECTOR_PUNCTUATION 

Pc

I18N_UCHAR_U_OTHER_PUNCTUATION 

Po

I18N_UCHAR_U_MATH_SYMBOL 

Sm

I18N_UCHAR_U_CURRENCY_SYMBOL 

Sc

I18N_UCHAR_U_MODIFIER_SYMBOL 

Sk

I18N_UCHAR_U_OTHER_SYMBOL 

So

I18N_UCHAR_U_INITIAL_PUNCTUATION 

Pi

I18N_UCHAR_U_FINAL_PUNCTUATION 

Pf

I18N_UCHAR_U_CHAR_CATEGORY_COUNT 

One higher than the last enum i18n_uchar_category_e constant

Enumeration for the language directional property of a character set.

Since :
2.3.1
Enumerator:
I18N_UCHAR_U_LEFT_TO_RIGHT 

L

I18N_UCHAR_U_RIGHT_TO_LEFT 

R

I18N_UCHAR_U_EUROPEAN_NUMBER 

EN

I18N_UCHAR_U_EUROPEAN_NUMBER_SEPARATOR 

ES

I18N_UCHAR_U_EUROPEAN_NUMBER_TERMINATOR 

ET

I18N_UCHAR_U_ARABIC_NUMBER 

AN

I18N_UCHAR_U_COMMON_NUMBER_SEPARATOR 

CS

I18N_UCHAR_U_BLOCK_SEPARATOR 

B

I18N_UCHAR_U_SEGMENT_SEPARATOR 

S

I18N_UCHAR_U_WHITE_SPACE_NEUTRAL 

WS

I18N_UCHAR_U_OTHER_NEUTRAL 

ON

I18N_UCHAR_U_LEFT_TO_RIGHT_EMBEDDING 

LRE

I18N_UCHAR_U_LEFT_TO_RIGHT_OVERRIDE 

LRO

I18N_UCHAR_U_RIGHT_TO_LEFT_ARABIC 

AL

I18N_UCHAR_U_RIGHT_TO_LEFT_EMBEDDING 

RLE

I18N_UCHAR_U_RIGHT_TO_LEFT_OVERRIDE 

RLO

I18N_UCHAR_U_POP_DIRECTIONAL_FORMAT 

PDF

I18N_UCHAR_U_DIR_NON_SPACING_MARK 

NSM

I18N_UCHAR_U_BOUNDARY_NEUTRAL 

BN

I18N_UCHAR_U_FIRST_STRONG_ISOLATE 

FSI (Since 3.0)

I18N_UCHAR_U_LEFT_TO_RIGHT_ISOLATE 

LRI (Since 3.0)

I18N_UCHAR_U_RIGHT_TO_LEFT_ISOLATE 

RLI (Since 3.0)

I18N_UCHAR_U_POP_DIRECTIONAL_ISOLATE 

PDI (Since 3.0)

I18N_UCHAR_U_CHAR_DIRECTION_COUNT 

Count

Bidi Paired Bracket Type constants.

Since :
3.0
See also:
I18N_UCHAR_BIDI_PAIRED_BRACKET_TYPE
Enumerator:
I18N_UCHAR_U_BPT_NONE 

Not a paired bracket.

I18N_UCHAR_U_BPT_OPEN 

Open paired bracket.

I18N_UCHAR_U_BPT_CLOSE 

Close paired bracket.

I18N_UCHAR_U_BPT_COUNT 

Count

Enumeration for Decomposition Type constants.

Since :
2.3.1
Enumerator:
I18N_UCHAR_U_DT_NONE 

[none]

I18N_UCHAR_U_DT_CANONICAL 

[can]

I18N_UCHAR_U_DT_COMPAT 

[com]

I18N_UCHAR_U_DT_CIRCLE 

[enc]

I18N_UCHAR_U_DT_FINAL 

[fin]

I18N_UCHAR_U_DT_FONT 

[font]

I18N_UCHAR_U_DT_FRACTION 

[fra]

I18N_UCHAR_U_DT_INITIAL 

[init]

I18N_UCHAR_U_DT_ISOLATED 

[iso]

I18N_UCHAR_U_DT_MEDIAL 

[med]

I18N_UCHAR_U_DT_NARROW 

[nar]

I18N_UCHAR_U_DT_NOBREAK 

[nb]

I18N_UCHAR_U_DT_SMALL 

[sml]

I18N_UCHAR_U_DT_SQUARE 

[sqr]

I18N_UCHAR_U_DT_SUB 

[sub]

I18N_UCHAR_U_DT_SUPER 

[sup]

I18N_UCHAR_U_DT_VERTICAL 

[vert]

I18N_UCHAR_U_DT_WIDE 

[wide]

I18N_UCHAR_U_DT_COUNT 

18

Enumeration for East Asian Width constants.

Since :
2.3.1
Enumerator:
I18N_UCHAR_U_EA_NEUTRAL 

[N]

I18N_UCHAR_U_EA_AMBIGUOUS 

[A]

I18N_UCHAR_U_EA_HALFWIDTH 

[H]

I18N_UCHAR_U_EA_FULLWIDTH 

[F]

I18N_UCHAR_U_EA_NARROW 

[Na]

I18N_UCHAR_U_EA_WIDE 

[W]

Enumeration for Grapheme Cluster Break constants.

Since :
2.3.1
Enumerator:
I18N_UCHAR_U_GCB_OTHER 

[XX]

I18N_UCHAR_U_GCB_CONTROL 

[CN]

I18N_UCHAR_U_GCB_CR 

[CR]

I18N_UCHAR_U_GCB_EXTEND 

[EX]

I18N_UCHAR_U_GCB_L 

[L]

I18N_UCHAR_U_GCB_LF 

[LF]

I18N_UCHAR_U_GCB_LV 

[LV]

I18N_UCHAR_U_GCB_LVT 

[LVT]

I18N_UCHAR_U_GCB_T 

[T]

I18N_UCHAR_U_GCB_V 

[V]

I18N_UCHAR_U_GCB_SPACING_MARK 

[SM]

I18N_UCHAR_U_GCB_PREPEND 

[PP]

I18N_UCHAR_UCHAR_U_GCB_COUNT 

Enumeration for Hangul Syllable Type constants.

Since :
2.3.1
Enumerator:
I18N_UCHAR_U_HST_NOT_APPLICABLE 

[NA]

I18N_UCHAR_U_HST_LEADING_JAMO 

[L]

I18N_UCHAR_U_HST_VOWEL_JAMO 

[V]

I18N_UCHAR_U_HST_TRAILING_JAMO 

[T]

I18N_UCHAR_U_HST_LV_SYLLABLE 

[LV]

I18N_UCHAR_U_HST_LVT_SYLLABLE 

[LVT]

I18N_UCHAR_U_HST_COUNT 

Enumeration for Joining Group constants.

Since :
2.3.1
Enumerator:
I18N_UCHAR_U_JG_NO_JOINING_GROUP 

No Joining Group

I18N_UCHAR_U_JG_AIN 

Ain

I18N_UCHAR_U_JG_ALAPH 

Alaph

I18N_UCHAR_U_JG_ALEF 

Alef

I18N_UCHAR_U_JG_BEH 

Beh

I18N_UCHAR_U_JG_BETH 

Beth

I18N_UCHAR_U_JG_DAL 

Dal

I18N_UCHAR_U_JG_DALATH_RISH 

Dalath Rish

I18N_UCHAR_U_JG_E 

E

I18N_UCHAR_U_JG_FEH 

Feh

I18N_UCHAR_U_JG_FINAL_SEMKATH 

Final Semkath

I18N_UCHAR_U_JG_GAF 

Gaf

I18N_UCHAR_U_JG_GAMAL 

Gamal

I18N_UCHAR_U_JG_HAH 

Hah

I18N_UCHAR_U_JG_TEH_MARBUTA_GOAL 

Teh Marbuta Goal

I18N_UCHAR_U_JG_HAMZA_ON_HEH_GOAL 

Hamza On Heh Goal

I18N_UCHAR_U_JG_HE 

He

I18N_UCHAR_U_JG_HEH 

Heh

I18N_UCHAR_U_JG_HEH_GOAL 

Heh Goal

I18N_UCHAR_U_JG_HETH 

Heth

I18N_UCHAR_U_JG_KAF 

Kaf

I18N_UCHAR_U_JG_KAPH 

Kaph

I18N_UCHAR_U_JG_KNOTTED_HEH 

Knotted Heh

I18N_UCHAR_U_JG_LAM 

Lam

I18N_UCHAR_U_JG_LAMADH 

Lamadh

I18N_UCHAR_U_JG_MEEM 

Meem

I18N_UCHAR_U_JG_MIM 

Mim

I18N_UCHAR_U_JG_NOON 

Noon

I18N_UCHAR_U_JG_NUN 

Nun

I18N_UCHAR_U_JG_PE 

Pe

I18N_UCHAR_U_JG_QAF 

Qaf

I18N_UCHAR_U_JG_QAPH 

Qaph

I18N_UCHAR_U_JG_REH 

Reh

I18N_UCHAR_U_JG_REVERSED_PE 

Reversed Pe

I18N_UCHAR_U_JG_SAD 

Sad

I18N_UCHAR_U_JG_SADHE 

Sadhe

I18N_UCHAR_U_JG_SEEN 

Seen

I18N_UCHAR_U_JG_SEMKATH 

Semkath

I18N_UCHAR_U_JG_SHIN 

Shin

I18N_UCHAR_U_JG_SWASH_KAF 

Swash Kaf

I18N_UCHAR_U_JG_SYRIAC_WAW 

Syriac Waw

I18N_UCHAR_U_JG_TAH 

Tah

I18N_UCHAR_U_JG_TAW 

Taw

I18N_UCHAR_U_JG_TEH_MARBUTA 

Teh Marbuta

I18N_UCHAR_U_JG_TETH 

Teth

I18N_UCHAR_U_JG_WAW 

Waw

I18N_UCHAR_U_JG_YEH 

Yeh

I18N_UCHAR_U_JG_YEH_BARREE 

Yeh Barree

I18N_UCHAR_U_JG_YEH_WITH_TAIL 

Yeh With Tail

I18N_UCHAR_U_JG_YUDH 

Yudh

I18N_UCHAR_U_JG_YUDH_HE 

Yudh He

I18N_UCHAR_U_JG_ZAIN 

Zain

I18N_UCHAR_U_JG_FE 

Fe

I18N_UCHAR_U_JG_KHAPH 

Khaph

I18N_UCHAR_U_JG_ZHAIN 

Zhain

I18N_UCHAR_U_JG_BURUSHASKI_YEH_BARREE 

Burushaski Yeh Barree

I18N_UCHAR_U_JG_FARSI_YEH 

Farsi Yeh

I18N_UCHAR_U_JG_NYA 

Nya

I18N_UCHAR_U_JG_ROHINGYA_YEH 

Rohingya Yeh

I18N_UCHAR_U_JG_MANICHAEAN_ALEPH 

Manichaean Aleph (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_AYIN 

Manichaean Ayin (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_BETH 

Manichaean Beth (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_DALETH 

Manichaean Daleth (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_DHAMEDH 

Manichaean Dhamedh (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_FIVE 

Manichaean Five (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_GIMEL 

Manichaean Gimel (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_HETH 

Manichaean Heth (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_HUNDRED 

Manichaean Hundred (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_KAPH 

Manichaean Kaph (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_LAMEDH 

Manichaean Lamedh (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_MEM 

Manichaean Mem (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_NUN 

Manichaean Nun (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_ONE 

Manichaean One (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_PE 

Manichaean Pe (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_QOPH 

Manichaean Qoph (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_RESH 

Manichaean Resh (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_SADHE 

Manichaean Sadhe (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_SAMEKH 

Manichaean Samekh (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_TAW 

Manichaean Taw (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_TEN 

Manichaean Ten (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_TETH 

Manichaean Teth (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_THAMEDH 

Manichaean Thamedh (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_TWENTY 

Manichaean Twenty (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_WAW 

Manichaean Waw (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_YODH 

Manichaean Yodh (Since 3.0)

I18N_UCHAR_U_JG_MANICHAEAN_ZAYIN 

Manichaean Zayin (Since 3.0)

I18N_UCHAR_U_JG_STRAIGHT_WAW 

Straight Waw (Since 3.0)

I18N_UCHAR_U_JG_COUNT 

Count

Enumeration for Joining Type constants.

Since :
2.3.1
Enumerator:
I18N_UCHAR_U_JT_NON_JOINING 

[U]

I18N_UCHAR_U_JT_JOIN_CAUSING 

[C]

I18N_UCHAR_U_JT_DUAL_JOINING 

[D]

I18N_UCHAR_U_JT_LEFT_JOINING 

[L]

I18N_UCHAR_U_JT_RIGHT_JOINING 

[R]

I18N_UCHAR_U_JT_TRANSPARENT 

[T]

I18N_UCHAR_U_JT_COUNT 

6

Enumeration for Line Break constants.

Since :
2.3.1
Enumerator:
I18N_UCHAR_U_LB_UNKNOWN 

[XX]

I18N_UCHAR_U_LB_AMBIGUOUS 

[AI]

I18N_UCHAR_U_LB_ALPHABETIC 

[AL]

I18N_UCHAR_U_LB_BREAK_BOTH 

[B2]

I18N_UCHAR_U_LB_BREAK_AFTER 

[BA]

I18N_UCHAR_U_LB_BREAK_BEFORE 

[BB]

I18N_UCHAR_U_LB_MANDATORY_BREAK 

[BK]

I18N_UCHAR_U_LB_CONTINGENT_BREAK 

[CB]

I18N_UCHAR_U_LB_CLOSE_PUNCTUATION 

[CL]

I18N_UCHAR_U_LB_COMBINING_MARK 

[CM]

I18N_UCHAR_U_LB_CARRIAGE_RETURN 

[CR]

I18N_UCHAR_U_LB_EXCLAMATION 

[EX]

I18N_UCHAR_U_LB_GLUE 

[GL]

I18N_UCHAR_U_LB_HYPHEN 

[HY]

I18N_UCHAR_U_LB_IDEOGRAPHIC 

[ID]

I18N_UCHAR_U_LB_INSEPARABLE 

[IN]

I18N_UCHAR_U_LB_INFIX_NUMERIC 

[IS]

I18N_UCHAR_U_LB_LINE_FEED 

[LF]

I18N_UCHAR_U_LB_NONSTARTER 

[NS]

I18N_UCHAR_U_LB_NUMERIC 

[NU]

I18N_UCHAR_U_LB_OPEN_PUNCTUATION 

[OP]

I18N_UCHAR_U_LB_POSTFIX_NUMERIC 

[PO]

I18N_UCHAR_U_LB_PREFIX_NUMERIC 

[PR]

I18N_UCHAR_U_LB_QUOTATION 

[QU]

I18N_UCHAR_U_LB_COMPLEX_CONTEXT 

[SA]

I18N_UCHAR_U_LB_SURROGATE 

[SG]

I18N_UCHAR_U_LB_SPACE 

[SP]

I18N_UCHAR_U_LB_BREAK_SYMBOLS 

[SY]

I18N_UCHAR_U_LB_ZWSPACE 

[ZW]

I18N_UCHAR_U_LB_NEXT_LINE 

[NL]

I18N_UCHAR_U_LB_WORD_JOINER 

[WJ]

I18N_UCHAR_U_LB_H2 

[H2]

I18N_UCHAR_U_LB_H3 

[H3]

I18N_UCHAR_U_LB_JL 

[JL]

I18N_UCHAR_U_LB_JT 

[JT]

I18N_UCHAR_U_LB_JV 

[JV]

I18N_UCHAR_U_LB_CLOSE_PARENTHESIS 

[CP]

Enumeration for Numeric Type constants.

Since :
2.3.1
Enumerator:
I18N_UCHAR_U_NT_NONE 

[None]

I18N_UCHAR_U_NT_DECIMAL 

[de]

I18N_UCHAR_U_NT_DIGIT 

[di]

I18N_UCHAR_U_NT_NUMERIC 

[nu]

I18N_UCHAR_U_NT_COUNT 

Enumeration for Sentence Break constants.

Since :
2.3.1
Enumerator:
I18N_UCHAR_U_SB_OTHER 

[XX]

I18N_UCHAR_U_SB_ATERM 

[AT]

I18N_UCHAR_U_SB_CLOSE 

[CL]

I18N_UCHAR_U_SB_FORMAT 

[FO]

I18N_UCHAR_U_SB_LOWER 

[LO]

I18N_UCHAR_U_SB_NUMERIC 

[NU]

I18N_UCHAR_U_SB_OLETTER 

[LE]

I18N_UCHAR_U_SB_SEP 

[SE]

I18N_UCHAR_U_SB_SP 

[SP]

I18N_UCHAR_U_SB_STERM 

[ST]

I18N_UCHAR_U_SB_UPPER 

[UP]

I18N_UCHAR_U_SB_CR 

[CR]

I18N_UCHAR_U_SB_EXTEND 

[EX]

I18N_UCHAR_U_SB_LF 

[LF]

I18N_UCHAR_U_SB_SCONTINUE 

[SC]

I18N_UCHAR_U_SB_COUNT 

Enumeration for Word Break constants.

Since :
2.3.1
Enumerator:
I18N_UCHAR_U_WB_OTHER 

[XX]

I18N_UCHAR_U_WB_ALETTER 

[LE]

I18N_UCHAR_U_WB_FORMAT 

[FO]

I18N_UCHAR_U_WB_KATAKANA 

[KA]

I18N_UCHAR_U_WB_MIDLETTER 

[ML]

I18N_UCHAR_U_WB_MIDNUM 

[MN]

I18N_UCHAR_U_WB_NUMERIC 

[NU]

I18N_UCHAR_U_WB_EXTENDNUMLET 

[EX]

I18N_UCHAR_U_WB_CR 

[CR]

I18N_UCHAR_U_WB_EXTEND 

[Extend]

I18N_UCHAR_U_WB_LF 

[LF]

I18N_UCHAR_U_WB_MIDNUMLET 

[MB]

I18N_UCHAR_U_WB_NEWLINE 

[NL]

I18N_UCHAR_U_WB_REGIONAL_INDICATOR 

[RI] (Since 3.0)

I18N_UCHAR_U_WB_HEBREW_LETTER 

[HL] (Since 3.0)

I18N_UCHAR_U_WB_SINGLE_QUOTE 

[SQ] (Since 3.0)

I18N_UCHAR_U_WB_DOUBLE_QUOTE 

[DQ] (Since 3.0)

I18N_UCHAR_U_WB_COUNT 

Constants for Unicode blocks, see the Unicode Data file Blocks.txt.

Since :
2.3.1
Enumerator:
I18N_UCHAR_UBLOCK_NO_BLOCK 

No Block

I18N_UCHAR_UBLOCK_BASIC_LATIN 

Basic Latin

I18N_UCHAR_UBLOCK_LATIN_1_SUPPLEMENT 

Latin-1 Supplement

I18N_UCHAR_UBLOCK_LATIN_EXTENDED_A 

Latin Extended A

I18N_UCHAR_UBLOCK_LATIN_EXTENDED_B 

Latin Extended B

I18N_UCHAR_UBLOCK_IPA_EXTENSIONS 

IPA Extensions

I18N_UCHAR_UBLOCK_SPACING_MODIFIER_LETTERS 

Spacing Modifier Letters

I18N_UCHAR_UBLOCK_COMBINING_DIACRITICAL_MARKS 

Combining Diacritical Marks

I18N_UCHAR_UBLOCK_GREEK 

Greek

I18N_UCHAR_UBLOCK_CYRILLIC 

Cyrillic

I18N_UCHAR_UBLOCK_ARMENIAN 

Armenian

I18N_UCHAR_UBLOCK_HEBREW 

Hebrew

I18N_UCHAR_UBLOCK_ARABIC 

Arabic

I18N_UCHAR_UBLOCK_SYRIAC 

Syriac

I18N_UCHAR_UBLOCK_THAANA 

Thaana

I18N_UCHAR_UBLOCK_DEVANAGARI 

Devanagari

I18N_UCHAR_UBLOCK_BENGALI 

Bengali

I18N_UCHAR_UBLOCK_GURMUKHI 

Gurmukhi

I18N_UCHAR_UBLOCK_GUJARATI 

Gujarati

I18N_UCHAR_UBLOCK_ORIYA 

Oriya

I18N_UCHAR_UBLOCK_TAMIL 

Tamil

I18N_UCHAR_UBLOCK_TELUGU 

Telugu

I18N_UCHAR_UBLOCK_KANNADA 

Kannada

I18N_UCHAR_UBLOCK_MALAYALAM 

Malayalam

I18N_UCHAR_UBLOCK_SINHALA 

Sinhala

I18N_UCHAR_UBLOCK_THAI 

Thai

I18N_UCHAR_UBLOCK_LAO 

Lao

I18N_UCHAR_UBLOCK_TIBETAN 

Tibetan

I18N_UCHAR_UBLOCK_MYANMAR 

Myanmar

I18N_UCHAR_UBLOCK_GEORGIAN 

Georgian

I18N_UCHAR_UBLOCK_HANGUL_JAMO 

Hangul Jamo

I18N_UCHAR_UBLOCK_ETHIOPIC 

Ethiopic

I18N_UCHAR_UBLOCK_CHEROKEE 

Cherokee

I18N_UCHAR_UBLOCK_UNIFIED_CANADIAN_ABORIGINAL_SYLLABICS 

Unified Canadian Aboriginal Syllabics

I18N_UCHAR_UBLOCK_OGHAM 

Ogham

I18N_UCHAR_UBLOCK_RUNIC 

Runic

I18N_UCHAR_UBLOCK_KHMER 

Khmer

I18N_UCHAR_UBLOCK_MONGOLIAN 

Mongolian

I18N_UCHAR_UBLOCK_LATIN_EXTENDED_ADDITIONAL 

Latin Extended Additional

I18N_UCHAR_UBLOCK_GREEK_EXTENDED 

Greek Extended

I18N_UCHAR_UBLOCK_GENERAL_PUNCTUATION 

General Punctuation

I18N_UCHAR_UBLOCK_SUPERSCRIPTS_AND_SUBSCRIPTS 

Superscripts And Subscripts

I18N_UCHAR_UBLOCK_CURRENCY_SYMBOLS 

Currency Symbols

I18N_UCHAR_UBLOCK_COMBINING_MARKS_FOR_SYMBOLS 

Combining Marks For Symbols

I18N_UCHAR_UBLOCK_LETTERLIKE_SYMBOLS 

Letterlike Symbols

I18N_UCHAR_UBLOCK_NUMBER_FORMS 

Number Forms

I18N_UCHAR_UBLOCK_ARROWS 

Arrows

I18N_UCHAR_UBLOCK_MATHEMATICAL_OPERATORS 

Mathematical Operators

I18N_UCHAR_UBLOCK_MISCELLANEOUS_TECHNICAL 

Miscellaneous Technical

I18N_UCHAR_UBLOCK_CONTROL_PICTURES 

Control Pictures

I18N_UCHAR_UBLOCK_OPTICAL_CHARACTER_RECOGNITION 

Optical Character Recognition

I18N_UCHAR_UBLOCK_ENCLOSED_ALPHANUMERICS 

Enclosed Alphanumerics

I18N_UCHAR_UBLOCK_BOX_DRAWING 

Box Drawing

I18N_UCHAR_UBLOCK_BLOCK_ELEMENTS 

Block Elements

I18N_UCHAR_UBLOCK_GEOMETRIC_SHAPES 

Geometric Shapes

I18N_UCHAR_UBLOCK_MISCELLANEOUS_SYMBOLS 

Miscellaneous Symbols

I18N_UCHAR_UBLOCK_DINGBATS 

Dingbats

I18N_UCHAR_UBLOCK_BRAILLE_PATTERNS 

Braille Patterns

I18N_UCHAR_UBLOCK_CJK_RADICALS_SUPPLEMENT 

CJK Radicals Supplement

I18N_UCHAR_UBLOCK_KANGXI_RADICALS 

Kangxi Radicals

I18N_UCHAR_UBLOCK_IDEOGRAPHIC_DESCRIPTION_CHARACTERS 

Ideographic Description Characters

I18N_UCHAR_UBLOCK_CJK_SYMBOLS_AND_PUNCTUATION 

CJK Symbols And Punctuation

I18N_UCHAR_UBLOCK_HIRAGANA 

Hiragana

I18N_UCHAR_UBLOCK_KATAKANA 

Katakana

I18N_UCHAR_UBLOCK_BOPOMOFO 

Bopomofo

I18N_UCHAR_UBLOCK_HANGUL_COMPATIBILITY_JAMO 

Hangul Compatibility Jamo

I18N_UCHAR_UBLOCK_KANBUN 

Kanbun

I18N_UCHAR_UBLOCK_BOPOMOFO_EXTENDED 

Bopomofo Extended

I18N_UCHAR_UBLOCK_ENCLOSED_CJK_LETTERS_AND_MONTHS 

Enclosed CJK Letters And Months

I18N_UCHAR_UBLOCK_CJK_COMPATIBILITY 

CJK Compatibility

I18N_UCHAR_UBLOCK_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_A 

CJK Unified Ideographs Extension A

I18N_UCHAR_UBLOCK_CJK_UNIFIED_IDEOGRAPHS 

CJK Unified Ideographs

I18N_UCHAR_UBLOCK_YI_SYLLABLES 

Yi Syllables

I18N_UCHAR_UBLOCK_YI_RADICALS 

Yi Radicals

I18N_UCHAR_UBLOCK_HANGUL_SYLLABLES 

Hangul Syllables

I18N_UCHAR_UBLOCK_HIGH_SURROGATES 

High Surrogates

I18N_UCHAR_UBLOCK_HIGH_PRIVATE_USE_SURROGATES 

High Private Use Surrogates

I18N_UCHAR_UBLOCK_LOW_SURROGATES 

Low Surrogates

I18N_UCHAR_UBLOCK_PRIVATE_USE_AREA 

Private Use Area

I18N_UCHAR_UBLOCK_PRIVATE_USE 

Private Use

I18N_UCHAR_UBLOCK_CJK_COMPATIBILITY_IDEOGRAPHS 

CJK Compatibility Ideographs

I18N_UCHAR_UBLOCK_ALPHABETIC_PRESENTATION_FORMS 

Alphabetic Presentation Forms

I18N_UCHAR_UBLOCK_ARABIC_PRESENTATION_FORMS_A 

Arabic Presentation Forms A

I18N_UCHAR_UBLOCK_COMBINING_HALF_MARKS 

Combining Half Marks

I18N_UCHAR_UBLOCK_CJK_COMPATIBILITY_FORMS 

CJK Compatibility Forms

I18N_UCHAR_UBLOCK_SMALL_FORM_VARIANTS 

Small Form Variants

I18N_UCHAR_UBLOCK_ARABIC_PRESENTATION_FORMS_B 

Arabic Presentation Forms B

I18N_UCHAR_UBLOCK_SPECIALS 

Specials

I18N_UCHAR_UBLOCK_HALFWIDTH_AND_FULLWIDTH_FORMS 

Halfwidth And Fullwidth Forms

I18N_UCHAR_UBLOCK_OLD_ITALIC 

Old Italic

I18N_UCHAR_UBLOCK_GOTHIC 

Gothic

I18N_UCHAR_UBLOCK_DESERET 

Deseret

I18N_UCHAR_UBLOCK_BYZANTINE_MUSICAL_SYMBOLS 

Byzantine Musical Symbols

I18N_UCHAR_UBLOCK_MUSICAL_SYMBOLS 

Musical Symbols

I18N_UCHAR_UBLOCK_MATHEMATICAL_ALPHANUMERIC_SYMBOLS 

Mathematical Alphanumeric Symbols

I18N_UCHAR_UBLOCK_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_B 

CJK Unified Ideographs Extension B

I18N_UCHAR_UBLOCK_CJK_COMPATIBILITY_IDEOGRAPHS_SUPPLEMENT 

CJK Compatibility Ideographs Supplement

I18N_UCHAR_UBLOCK_TAGS 

Tags

I18N_UCHAR_UBLOCK_CYRILLIC_SUPPLEMENT 

Cyrillic Supplement

I18N_UCHAR_UBLOCK_CYRILLIC_SUPPLEMENTARY 

Cyrillic Supplementary

I18N_UCHAR_UBLOCK_TAGALOG 

Tagalog

I18N_UCHAR_UBLOCK_HANUNOO 

Hanunoo

I18N_UCHAR_UBLOCK_BUHID 

Buhid

I18N_UCHAR_UBLOCK_TAGBANWA 

Tagbanwa

I18N_UCHAR_UBLOCK_MISCELLANEOUS_MATHEMATICAL_SYMBOLS_A 

Miscellaneous Mathematical Symbols A

I18N_UCHAR_UBLOCK_SUPPLEMENTAL_ARROWS_A 

Supplemental Arrows A

I18N_UCHAR_UBLOCK_SUPPLEMENTAL_ARROWS_B 

Supplemental Arrows B

I18N_UCHAR_UBLOCK_MISCELLANEOUS_MATHEMATICAL_SYMBOLS_B 

Miscellaneous Mathematical Symbols B

I18N_UCHAR_UBLOCK_SUPPLEMENTAL_MATHEMATICAL_OPERATORS 

Supplemental Mathematical Operators

I18N_UCHAR_UBLOCK_KATAKANA_PHONETIC_EXTENSIONS 

Katakana Phonetic Extensions

I18N_UCHAR_UBLOCK_VARIATION_SELECTORS 

Variation Selectors

I18N_UCHAR_UBLOCK_SUPPLEMENTARY_PRIVATE_USE_AREA_A 

Supplementary Private Use Area A

I18N_UCHAR_UBLOCK_SUPPLEMENTARY_PRIVATE_USE_AREA_B 

Supplementary Private Use Area B

I18N_UCHAR_UBLOCK_LIMBU 

Limbu

I18N_UCHAR_UBLOCK_TAI_LE 

Tai Le

I18N_UCHAR_UBLOCK_KHMER_SYMBOLS 

Khmer Symbols

I18N_UCHAR_UBLOCK_PHONETIC_EXTENSIONS 

Phonetic Extensions

I18N_UCHAR_UBLOCK_MISCELLANEOUS_SYMBOLS_AND_ARROWS 

Miscellaneous Symbols And Arrows

I18N_UCHAR_UBLOCK_YIJING_HEXAGRAM_SYMBOLS 

Yijing Hexagram Symbols

I18N_UCHAR_UBLOCK_LINEAR_B_SYLLABARY 

Linear B Syllabary

I18N_UCHAR_UBLOCK_LINEAR_B_IDEOGRAMS 

Linear B Ideograms

I18N_UCHAR_UBLOCK_AEGEAN_NUMBERS 

Aegean Numbers

I18N_UCHAR_UBLOCK_UGARITIC 

Ugaritic

I18N_UCHAR_UBLOCK_SHAVIAN 

Shavian

I18N_UCHAR_UBLOCK_OSMANYA 

Osmanya

I18N_UCHAR_UBLOCK_CYPRIOT_SYLLABARY 

Cypriot Syllabary

I18N_UCHAR_UBLOCK_TAI_XUAN_JING_SYMBOLS 

Tai Xuan Jing Symbols

I18N_UCHAR_UBLOCK_VARIATION_SELECTORS_SUPPLEMENT 

Variation Selectors Supplement

I18N_UCHAR_UBLOCK_ANCIENT_GREEK_MUSICAL_NOTATION 

Ancient Greek Musical Notation

I18N_UCHAR_UBLOCK_ANCIENT_GREEK_NUMBERS 

Ancient Greek Numbers

I18N_UCHAR_UBLOCK_ARABIC_SUPPLEMENT 

Arabic Supplement

I18N_UCHAR_UBLOCK_BUGINESE 

Buginese

I18N_UCHAR_UBLOCK_CJK_STROKES 

CJK Strokes

I18N_UCHAR_UBLOCK_COMBINING_DIACRITICAL_MARKS_SUPPLEMENT 

Combining Diacritical Marks Supplement

I18N_UCHAR_UBLOCK_COPTIC 

Coptic

I18N_UCHAR_UBLOCK_ETHIOPIC_EXTENDED 

Ethiopic Extended

I18N_UCHAR_UBLOCK_ETHIOPIC_SUPPLEMENT 

Ethiopic Supplement

I18N_UCHAR_UBLOCK_GEORGIAN_SUPPLEMENT 

Georgian Supplement

I18N_UCHAR_UBLOCK_GLAGOLITIC 

Glagolitic

I18N_UCHAR_UBLOCK_KHAROSHTHI 

Kharoshthi

I18N_UCHAR_UBLOCK_MODIFIER_TONE_LETTERS 

Modifier Tone Letters

I18N_UCHAR_UBLOCK_NEW_TAI_LUE 

New Tai Lue

I18N_UCHAR_UBLOCK_OLD_PERSIAN 

Old Persian

I18N_UCHAR_UBLOCK_PHONETIC_EXTENSIONS_SUPPLEMENT 

Phonetic Extensions Supplement

I18N_UCHAR_UBLOCK_SUPPLEMENTAL_PUNCTUATION 

Supplemental Punctuation

I18N_UCHAR_UBLOCK_SYLOTI_NAGRI 

Syloti Nagri

I18N_UCHAR_UBLOCK_TIFINAGH 

Tifinagh

I18N_UCHAR_UBLOCK_VERTICAL_FORMS 

Vertical Forms

I18N_UCHAR_UBLOCK_NKO 

Nko

I18N_UCHAR_UBLOCK_BALINESE 

Balinese

I18N_UCHAR_UBLOCK_LATIN_EXTENDED_C 

Latin Extended C

I18N_UCHAR_UBLOCK_LATIN_EXTENDED_D 

Latin Extended D

I18N_UCHAR_UBLOCK_PHAGS_PA 

Phags Pa

I18N_UCHAR_UBLOCK_PHOENICIAN 

Phoenician

I18N_UCHAR_UBLOCK_CUNEIFORM 

Cuneiform

I18N_UCHAR_UBLOCK_CUNEIFORM_NUMBERS_AND_PUNCTUATION 

Cuneiform Numbers And Punctuation

I18N_UCHAR_UBLOCK_COUNTING_ROD_NUMERALS 

Counting Rod Numerals

I18N_UCHAR_UBLOCK_SUNDANESE 

Sundanese

I18N_UCHAR_UBLOCK_LEPCHA 

Lepcha

I18N_UCHAR_UBLOCK_OL_CHIKI 

Ol Chiki

I18N_UCHAR_UBLOCK_CYRILLIC_EXTENDED_A 

Cyrillic Extended A

I18N_UCHAR_UBLOCK_VAI 

Vai

I18N_UCHAR_UBLOCK_CYRILLIC_EXTENDED_B 

Cyrillic Extended B

I18N_UCHAR_UBLOCK_SAURASHTRA 

Saurashtra

I18N_UCHAR_UBLOCK_KAYAH_LI 

Kayah Li

I18N_UCHAR_UBLOCK_REJANG 

Rejang

I18N_UCHAR_UBLOCK_CHAM 

Cham

I18N_UCHAR_UBLOCK_ANCIENT_SYMBOLS 

Ancient Symbols

I18N_UCHAR_UBLOCK_PHAISTOS_DISC 

Phaistos Disc

I18N_UCHAR_UBLOCK_LYCIAN 

Lycian

I18N_UCHAR_UBLOCK_CARIAN 

Carian

I18N_UCHAR_UBLOCK_LYDIAN 

Lydian

I18N_UCHAR_UBLOCK_MAHJONG_TILES 

Mahjong Tiles

I18N_UCHAR_UBLOCK_DOMINO_TILES 

Domino Tiles

I18N_UCHAR_UBLOCK_SAMARITAN 

Samaritan

I18N_UCHAR_UBLOCK_UNIFIED_CANADIAN_ABORIGINAL_SYLLABICS_EXTENDED 

Unified Canadian Aboriginal Syllabics Extended

I18N_UCHAR_UBLOCK_TAI_THAM 

Tai Tham

I18N_UCHAR_UBLOCK_VEDIC_EXTENSIONS 

Vedic Extensions

I18N_UCHAR_UBLOCK_LISU 

Lisu

I18N_UCHAR_UBLOCK_BAMUM 

Bamum

I18N_UCHAR_UBLOCK_COMMON_INDIC_NUMBER_FORMS 

Common Indic Number Forms

I18N_UCHAR_UBLOCK_DEVANAGARI_EXTENDED 

Devanagari Extended

I18N_UCHAR_UBLOCK_HANGUL_JAMO_EXTENDED_A 

Hangul Jamo Extended A

I18N_UCHAR_UBLOCK_JAVANESE 

Javanese

I18N_UCHAR_UBLOCK_MYANMAR_EXTENDED_A 

Myanmar Extended A

I18N_UCHAR_UBLOCK_TAI_VIET 

Tai Viet

I18N_UCHAR_UBLOCK_MEETEI_MAYEK 

Meetei Mayek

I18N_UCHAR_UBLOCK_HANGUL_JAMO_EXTENDED_B 

Hangul Jamo Extended B

I18N_UCHAR_UBLOCK_IMPERIAL_ARAMAIC 

Imperial Aramaic

I18N_UCHAR_UBLOCK_OLD_SOUTH_ARABIAN 

Old South Arabian

I18N_UCHAR_UBLOCK_AVESTAN 

Avestan

I18N_UCHAR_UBLOCK_INSCRIPTIONAL_PARTHIAN 

Inscriptional Parthian

I18N_UCHAR_UBLOCK_INSCRIPTIONAL_PAHLAVI 

Inscriptional Pahlavi

I18N_UCHAR_UBLOCK_OLD_TURKIC 

Old Turkic

I18N_UCHAR_UBLOCK_RUMI_NUMERAL_SYMBOLS 

Rumi Numeral Symbols

I18N_UCHAR_UBLOCK_KAITHI 

Kaithi

I18N_UCHAR_UBLOCK_EGYPTIAN_HIEROGLYPHS 

Egyptian Hieroglyphs

I18N_UCHAR_UBLOCK_ENCLOSED_ALPHANUMERIC_SUPPLEMENT 

Enclosed Alphanumeric Supplement

I18N_UCHAR_UBLOCK_ENCLOSED_IDEOGRAPHIC_SUPPLEMENT 

Enclosed Ideographic Supplement

I18N_UCHAR_UBLOCK_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_C 

CJK Unified Ideographs Extension C

I18N_UCHAR_UBLOCK_MANDAIC 

Mandaic

I18N_UCHAR_UBLOCK_BATAK 

Batak

I18N_UCHAR_UBLOCK_ETHIOPIC_EXTENDED_A 

Ethiopic Extended A

I18N_UCHAR_UBLOCK_BRAHMI 

Brahmi

I18N_UCHAR_UBLOCK_BAMUM_SUPPLEMENT 

Bamum Supplement

I18N_UCHAR_UBLOCK_KANA_SUPPLEMENT 

Kana Supplement

I18N_UCHAR_UBLOCK_PLAYING_CARDS 

Playing Cards

I18N_UCHAR_UBLOCK_MISCELLANEOUS_SYMBOLS_AND_PICTOGRAPHS 

Miscellaneous Symbols And Pictographs

I18N_UCHAR_UBLOCK_EMOTICONS 

Emoticons

I18N_UCHAR_UBLOCK_TRANSPORT_AND_MAP_SYMBOLS 

Transport And Map Symbols

I18N_UCHAR_UBLOCK_ALCHEMICAL_SYMBOLS 

Alchemical Symbols

I18N_UCHAR_UBLOCK_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_D 

CJK Unified Ideographs Extension D

I18N_UCHAR_UBLOCK_BASSA_VAH 

Bassa Vah (Since 3.0)

I18N_UCHAR_UBLOCK_CAUCASIAN_ALBANIAN 

Caucasian Albanian (Since 3.0)

I18N_UCHAR_UBLOCK_COPTIC_EPACT_NUMBERS 

Coptic Epact Numbers (Since 3.0)

I18N_UCHAR_UBLOCK_COMBINING_DIACRITICAL_MARKS_EXTENDED 

Combining Diacritical Marks Extended (Since 3.0)

I18N_UCHAR_UBLOCK_DUPLOYAN 

Duployan (Since 3.0)

I18N_UCHAR_UBLOCK_ELBASAN 

Elbasan (Since 3.0)

I18N_UCHAR_UBLOCK_GEOMETRIC_SHAPES_EXTENDED 

Geometric Shapes Extended (Since 3.0)

I18N_UCHAR_UBLOCK_GRANTHA 

Grantha (Since 3.0)

I18N_UCHAR_UBLOCK_KHOJKI 

Khojki (Since 3.0)

I18N_UCHAR_UBLOCK_KHUDAWADI 

Khudawadi (Since 3.0)

I18N_UCHAR_UBLOCK_LATIN_EXTENDED_E 

Latin Extended E (Since 3.0)

I18N_UCHAR_UBLOCK_LINEAR_A 

Linear A (Since 3.0)

I18N_UCHAR_UBLOCK_MAHAJANI 

Mahajani (Since 3.0)

I18N_UCHAR_UBLOCK_MANICHAEAN 

Manichaean (Since 3.0)

I18N_UCHAR_UBLOCK_MENDE_KIKAKUI 

Mende Kikakui (Since 3.0)

I18N_UCHAR_UBLOCK_MODI 

Modi (Since 3.0)

I18N_UCHAR_UBLOCK_MRO 

Mro (Since 3.0)

I18N_UCHAR_UBLOCK_MYANMAR_EXTENDED_B 

Myanmar Extended B (Since 3.0)

I18N_UCHAR_UBLOCK_NABATAEAN 

Nabataean (Since 3.0)

I18N_UCHAR_UBLOCK_OLD_NORTH_ARABIAN 

Old North Arabian (Since 3.0)

I18N_UCHAR_UBLOCK_OLD_PERMIC 

Old Permic (Since 3.0)

I18N_UCHAR_UBLOCK_ORNAMENTAL_DINGBATS 

Ornamental Dingbats (Since 3.0)

I18N_UCHAR_UBLOCK_PAHAWH_HMONG 

Pahawh Hmong (Since 3.0)

I18N_UCHAR_UBLOCK_PALMYRENE 

Palmyrene (Since 3.0)

I18N_UCHAR_UBLOCK_PAU_CIN_HAU 

Pau Cin Hau (Since 3.0)

I18N_UCHAR_UBLOCK_PSALTER_PAHLAVI 

Psalter Pahlavi (Since 3.0)

I18N_UCHAR_UBLOCK_SHORTHAND_FORMAT_CONTROLS 

Shorthand Format Controls (Since 3.0)

I18N_UCHAR_UBLOCK_SIDDHAM 

Siddham (Since 3.0)

I18N_UCHAR_UBLOCK_SINHALA_ARCHAIC_NUMBERS 

Sinhala Archaic Numbers (Since 3.0)

I18N_UCHAR_UBLOCK_SUPPLEMENTAL_ARROWS_C 

Supplemental Arrows C (Since 3.0)

I18N_UCHAR_UBLOCK_TIRHUTA 

Tirhuta (Since 3.0)

I18N_UCHAR_UBLOCK_WARANG_CITI 

Warang Citi (Since 3.0)

I18N_UCHAR_UBLOCK_COUNT 

Count

I18N_UCHAR_UBLOCK_INVALID_CODE 

Invalid Code

Enumeration of constants for Unicode properties. The properties APIs are intended to reflect Unicode properties as defined in the Unicode Character Database (UCD) and Unicode Technical Reports (UTR). For details about the properties see http://www.unicode.org/ucd/ . For names of Unicode properties see the UCD file PropertyAliases.txt.

Since :
2.3.1
Enumerator:
I18N_UCHAR_ALPHABETIC 

Binary property Alphabetic.
Lu+Ll+Lt+Lm+Lo+Nl+Other_Alphabetic

I18N_UCHAR_BINARY_START 

First constant for binary Unicode properties.

I18N_UCHAR_ASCII_HEX_DIGIT 

Binary property ASCII_Hex_Digit.
0-9 A-F a-f

I18N_UCHAR_BIDI_CONTROL 

Binary property Bidi_Control.
Format controls which have specific functions in the Bidi Algorithm.

I18N_UCHAR_BIDI_MIRRORED 

Binary property Bidi_Mirrored.
Characters that may change display in RTL text. See Bidi Algorithm, UTR 9.

I18N_UCHAR_DASH 

Binary property Dash.
Variations of dashes.

I18N_UCHAR_DEFAULT_IGNORABLE_CODE_POINT 

Binary property Default_Ignorable_Code_Point (new in Unicode 3.2).
Ignorable in most processing. <2060..206F, FFF0..FFFB, E0000..E0FFF>+Other_Default_Ignorable_Code_Point+(Cf+Cc+Cs-White_Space)

I18N_UCHAR_DEPRECATED 

Binary property Deprecated (new in Unicode 3.2).
The usage of deprecated characters is strongly discouraged.

I18N_UCHAR_DIACRITIC 

Binary property Diacritic.
Characters that linguistically modify the meaning of another character to which they apply.

I18N_UCHAR_EXTENDER 

Binary property Extender.
Extend the value or shape of a preceding alphabetic character, e.g. length and iteration marks.

I18N_UCHAR_FULL_COMPOSITION_EXCLUSION 

Binary property Full_Composition_Exclusion.
CompositionExclusions.txt+Singleton Decompositions+ Non-Starter Decompositions.

I18N_UCHAR_GRAPHEME_BASE 

Binary property Grapheme_Base (new in Unicode 3.2).
For programmatic determination of grapheme cluster boundaries. [0..10FFFF]-Cc-Cf-Cs-Co-Cn-Zl-Zp-Grapheme_Link-Grapheme_Extend-CGJ

I18N_UCHAR_GRAPHEME_EXTEND 

Binary property Grapheme_Extend (new in Unicode 3.2).
For programmatic determination of grapheme cluster boundaries. Me+Mn+Mc+Other_Grapheme_Extend-Grapheme_Link-CGJ

I18N_UCHAR_GRAPHEME_LINK 

Binary property Grapheme_Link (new in Unicode 3.2).
For programmatic determination of grapheme cluster boundaries.

I18N_UCHAR_HEX_DIGIT 

Binary property Hex_Digit.
Characters commonly used for hexadecimal numbers.

I18N_UCHAR_HYPHEN 

Binary property Hyphen.
Dashes used to mark connections between pieces of words, plus the Katakana middle dot.

I18N_UCHAR_ID_CONTINUE 

Binary property ID_Continue.
Characters that can continue an identifier. DerivedCoreProperties.txt also says "NOTE: Cf characters should be filtered out." ID_Start+Mn+Mc+Nd+Pc

I18N_UCHAR_ID_START 

Binary property ID_Start.
Characters that can start an identifier. Lu+Ll+Lt+Lm+Lo+Nl

I18N_UCHAR_IDEOGRAPHIC 

Binary property Ideographic.
CJKV ideographs.

I18N_UCHAR_IDS_BINARY_OPERATOR 

Binary property IDS_Binary_Operator (new in Unicode 3.2).
For programmatic determination of Ideographic Description Sequences.

I18N_UCHAR_IDS_TRINARY_OPERATOR 

Binary property IDS_Trinary_Operator (new in Unicode 3.2).
For programmatic determination of Ideographic Description Sequences.

I18N_UCHAR_JOIN_CONTROL 

Binary property Join_Control.
Format controls for cursive joining and ligation.

I18N_UCHAR_LOGICAL_ORDER_EXCEPTION 

Binary property Logical_Order_Exception (new in Unicode 3.2).
Characters that do not use logical order and require special handling in most processing.

I18N_UCHAR_LOWERCASE 

Binary property Lowercase.
Ll+Other_Lowercase

I18N_UCHAR_MATH 

Binary property Math.
Sm+Other_Math

I18N_UCHAR_NONCHARACTER_CODE_POINT 

Binary property Noncharacter_Code_Point.
Code points that are explicitly defined as illegal for the encoding of characters.

I18N_UCHAR_QUOTATION_MARK 

Binary property Quotation_Mark.

I18N_UCHAR_RADICAL 

Binary property Radical (new in Unicode 3.2).
For programmatic determination of Ideographic Description Sequences.

I18N_UCHAR_SOFT_DOTTED 

Binary property Soft_Dotted (new in Unicode 3.2).
Characters with a "soft dot", like i or j. An accent placed on these characters causes the dot to disappear.

I18N_UCHAR_TERMINAL_PUNCTUATION 

Binary property Terminal_Punctuation.
Punctuation characters that generally mark the end of textual units.

I18N_UCHAR_UNIFIED_IDEOGRAPH 

Binary property Unified_Ideograph (new in Unicode 3.2).
For programmatic determination of Ideographic Description Sequences.

I18N_UCHAR_UPPERCASE 

Binary property Uppercase.
Lu+Other_Uppercase

I18N_UCHAR_WHITE_SPACE 

Binary property White_Space.
Space characters+TAB+CR+LF-ZWSP-ZWNBSP

I18N_UCHAR_XID_CONTINUE 

Binary property XID_Continue.
ID_Continue modified to allow closure under normalization forms NFKC and NFKD.

I18N_UCHAR_XID_START 

Binary property XID_Start.
ID_Start modified to allow closure under normalization forms NFKC and NFKD.

I18N_UCHAR_CASE_SENSITIVE 

Binary property Case_Sensitive.
Characters that are either the source of a case mapping or in the target of a case mapping. Not the same as the general category Cased_Letter.

I18N_UCHAR_S_TERM 

Binary property STerm (new in Unicode 4.0.1).

I18N_UCHAR_VARIATION_SELECTOR 

Binary property Variation_Selector (new in Unicode 4.0.1).
Indicates all those characters that qualify as Variation Selectors.

I18N_UCHAR_NFD_INERT 

Binary property NFD_Inert.
ICU-specific property for characters that are inert under NFD, i.e., they do not interact with adjacent characters.

I18N_UCHAR_NFKD_INERT 

Binary property NFKD_Inert.
ICU-specific property for characters that are inert under NFKD, i.e., they do not interact with adjacent characters.

I18N_UCHAR_NFC_INERT 

Binary property NFC_Inert.
ICU-specific property for characters that are inert under NFC, i.e., they do not interact with adjacent characters.

I18N_UCHAR_NFKC_INERT 

Binary property NFKC_Inert.
ICU-specific property for characters that are inert under NFKC, i.e., they do not interact with adjacent characters.

I18N_UCHAR_SEGMENT_STARTER 

Binary property Segment_Starter.
Property for characters that are starters in terms of Unicode normalization and combining character sequences. They have ccc=0 and do not occur in non-initial position of the canonical decomposition of any character (like a-umlaut in NFD and a Jamo T in an NFD(Hangul LVT)).

I18N_UCHAR_PATTERN_SYNTAX 

Binary property Pattern_Syntax (new in Unicode 4.1).

I18N_UCHAR_PATTERN_WHITE_SPACE 

Binary property Pattern_White_Space (new in Unicode 4.1).

I18N_UCHAR_POSIX_ALNUM 

Binary property alnum (a C/POSIX character class).

I18N_UCHAR_POSIX_BLANK 

Binary property blank (a C/POSIX character class).

I18N_UCHAR_POSIX_GRAPH 

Binary property graph (a C/POSIX character class).

I18N_UCHAR_POSIX_PRINT 

Binary property print (a C/POSIX character class).

I18N_UCHAR_POSIX_XDIGIT 

Binary property xdigit (a C/POSIX character class).

I18N_UCHAR_CASED 

Binary property Cased.
For Lowercase, Uppercase and Titlecase characters.

I18N_UCHAR_CASE_IGNORABLE 

Binary property Case_Ignorable.
Used in context-sensitive case mappings.

I18N_UCHAR_CHANGES_WHEN_LOWERCASED 

Binary property Changes_When_Lowercased.

I18N_UCHAR_CHANGES_WHEN_UPPERCASED 

Binary property Changes_When_Uppercased.

I18N_UCHAR_CHANGES_WHEN_TITLECASED 

Binary property Changes_When_Titlecased.

I18N_UCHAR_CHANGES_WHEN_CASEFOLDED 

Binary property Changes_When_Casefolded.

I18N_UCHAR_CHANGES_WHEN_CASEMAPPED 

Binary property Changes_When_Casemapped.

I18N_UCHAR_CHANGES_WHEN_NFKC_CASEFOLDED 

Binary property Changes_When_NFKC_Casefolded.

I18N_UCHAR_BINARY_LIMIT 

One more than the last constant for binary Unicode properties.

I18N_UCHAR_BIDI_CLASS 

Enumerated property Bidi_Class.
Same as u_charDirection, returns i18n_uchar_direction_e values.

I18N_UCHAR_INT_START 

First constant for enumerated/integer Unicode properties.

I18N_UCHAR_BLOCK 

Enumerated property Block.
Returns i18n_uchar_ublock_code_e values.

I18N_UCHAR_CANONICAL_COMBINING_CLASS 

Enumerated property Canonical_Combining_Class.
Returns 8-bit numeric values.

I18N_UCHAR_DECOMPOSITION_TYPE 

Enumerated property Decomposition_Type.
Returns i18n_uchar_u_decomposition_type_e values.

I18N_UCHAR_EAST_ASIAN_WIDTH 

Enumerated property East_Asian_Width.
Returns i18n_uchar_u_east_asian_width_e values.

I18N_UCHAR_GENERAL_CATEGORY 

Enumerated property General_Category.
Returns i18n_uchar_category_e values.

I18N_UCHAR_JOINING_GROUP 

Enumerated property Joining_Group.
Returns i18n_uchar_u_joining_group_e values.

I18N_UCHAR_JOINING_TYPE 

Enumerated property Joining_Type.
Returns i18n_uchar_u_joining_type_e values.

I18N_UCHAR_LINE_BREAK 

Enumerated property Line_Break.
Returns i18n_uchar_u_line_break_e values.

I18N_UCHAR_NUMERIC_TYPE 

Enumerated property Numeric_Type.
Returns i18n_uchar_u_numeric_type_e values.

I18N_UCHAR_SCRIPT 

Enumerated property Script.
Returns i18n_uscript_code_e values.

I18N_UCHAR_HANGUL_SYLLABLE_TYPE 

Enumerated property Hangul_Syllable_Type, new in Unicode 4.
Returns i18n_uchar_u_hangul_syllable_type_e values.

I18N_UCHAR_NFD_QUICK_CHECK 

Enumerated property NFD_Quick_Check.
Returns i18n_unormalization_check_result_e values.

I18N_UCHAR_NFKD_QUICK_CHECK 

Enumerated property NFKD_Quick_Check.
Returns i18n_unormalization_check_result_e values.

I18N_UCHAR_NFC_QUICK_CHECK 

Enumerated property NFC_Quick_Check.
Returns i18n_unormalization_check_result_e values.

I18N_UCHAR_NFKC_QUICK_CHECK 

Enumerated property NFKC_Quick_Check.
Returns i18n_unormalization_check_result_e values.

I18N_UCHAR_LEAD_CANONICAL_COMBINING_CLASS 

Enumerated property Lead_Canonical_Combining_Class.
Returns 8-bit numeric values.

I18N_UCHAR_TRAIL_CANONICAL_COMBINING_CLASS 

Enumerated property Trail_Canonical_Combining_Class.
Returns 8-bit numeric values.

I18N_UCHAR_GRAPHEME_CLUSTER_BREAK 

Enumerated property Grapheme_Cluster_Break (new in Unicode 4.1).
Returns i18n_uchar_u_grapheme_cluster_break_e values.

I18N_UCHAR_SENTENCE_BREAK 

Enumerated property Sentence_Break (new in Unicode 4.1).
Returns i18n_uchar_u_sentence_break_e values.

I18N_UCHAR_WORD_BREAK 

Enumerated property Word_Break (new in Unicode 4.1).
Returns i18n_uchar_u_word_break_values_e values.

I18N_UCHAR_BIDI_PAIRED_BRACKET_TYPE 

Enumerated property Bidi_Paired_Bracket_Type.
Returns i18n_uchar_u_bidi_paired_bracket_type_e values.

I18N_UCHAR_INT_LIMIT 

One more than the last constant for enumerated/integer Unicode properties.

I18N_UCHAR_GENERAL_CATEGORY_MASK 

Bitmask property General_Category_Mask.
Mask values should be cast to uint32_t.

I18N_UCHAR_MASK_START 

First constant for bit-mask Unicode properties.

I18N_UCHAR_MASK_LIMIT 

One more than the last constant for bit-mask Unicode properties.

I18N_UCHAR_NUMERIC_VALUE 

Double property Numeric_Value.

I18N_UCHAR_DOUBLE_START 

First constant for double Unicode properties.

I18N_UCHAR_DOUBLE_LIMIT 

One more than the last constant for double Unicode properties.

I18N_UCHAR_AGE 

String property Age.

I18N_UCHAR_STRING_START 

First constant for string Unicode properties.

I18N_UCHAR_BIDI_MIRRORING_GLYPH 

String property Bidi_Mirroring_Glyph.

I18N_UCHAR_CASE_FOLDING 

String property Case_Folding.

I18N_UCHAR_LOWERCASE_MAPPING 

String property Lowercase_Mapping.

I18N_UCHAR_NAME 

String property Name.

I18N_UCHAR_SIMPLE_CASE_FOLDING 

String property Simple_Case_Folding.

I18N_UCHAR_SIMPLE_LOWERCASE_MAPPING 

String property Simple_Lowercase_Mapping.

I18N_UCHAR_SIMPLE_TITLECASE_MAPPING 

String property Simple_Titlecase_Mapping.

I18N_UCHAR_SIMPLE_UPPERCASE_MAPPING 

String property Simple_Uppercase_Mapping.

I18N_UCHAR_TITLECASE_MAPPING 

String property Titlecase_Mapping.

I18N_UCHAR_UPPERCASE_MAPPING 

String property Uppercase_Mapping.

I18N_UCHAR_BIDI_PAIRED_BRACKET 

String property Bidi_Paired_Bracket.

I18N_UCHAR_STRING_LIMIT 

One more than the last constant for string Unicode properties.

I18N_UCHAR_SCRIPT_EXTENSIONS 

Provisional property Script_Extensions (new in Unicode 6.0).

I18N_UCHAR_OTHER_PROPERTY_START 

First constant for Unicode properties with unusual value types.

I18N_UCHAR_OTHER_PROPERTY_LIMIT 

One more than the last constant for Unicode properties with unusual value types.

I18N_UCHAR_INVALID_CODE 

Represents a nonexistent or invalid property or property value.

Constants for ISO 15924 script codes.

Since :
2.4
Enumerator:
I18N_USCRIPT_COMMON 

Zyyy

I18N_USCRIPT_INHERITED 

Zinh, "Code for inherited script", for non-spacing combining marks; also Qaai

I18N_USCRIPT_ARABIC 

Arab

I18N_USCRIPT_ARMENIAN 

Armn

I18N_USCRIPT_BENGALI 

Beng

I18N_USCRIPT_BOPOMOFO 

Bopo

I18N_USCRIPT_CHEROKEE 

Cher

I18N_USCRIPT_COPTIC 

Copt

I18N_USCRIPT_CYRILLIC 

Cyrl

I18N_USCRIPT_DESERET 

Dsrt

I18N_USCRIPT_DEVANAGARI 

Deva

I18N_USCRIPT_ETHIOPIC 

Ethi

I18N_USCRIPT_GEORGIAN 

Geor

I18N_USCRIPT_GOTHIC 

Goth

I18N_USCRIPT_GREEK 

Grek

I18N_USCRIPT_GUJARATI 

Gujr

I18N_USCRIPT_GURMUKHI 

Guru

I18N_USCRIPT_HAN 

Hani

I18N_USCRIPT_HANGUL 

Hang

I18N_USCRIPT_HEBREW 

Hebr

I18N_USCRIPT_HIRAGANA 

Hira

I18N_USCRIPT_KANNADA 

Knda

I18N_USCRIPT_KATAKANA 

Kana

I18N_USCRIPT_KHMER 

Khmr

I18N_USCRIPT_LAO 

Laoo

I18N_USCRIPT_LATIN 

Latn

I18N_USCRIPT_MALAYALAM 

Mlym

I18N_USCRIPT_MONGOLIAN 

Mong

I18N_USCRIPT_MYANMAR 

Mymr

I18N_USCRIPT_OGHAM 

Ogam

I18N_USCRIPT_OLD_ITALIC 

Ital

I18N_USCRIPT_ORIYA 

Orya

I18N_USCRIPT_RUNIC 

Runr

I18N_USCRIPT_SINHALA 

Sinh

I18N_USCRIPT_SYRIAC 

Syrc

I18N_USCRIPT_TAMIL 

Taml

I18N_USCRIPT_TELUGU 

Telu

I18N_USCRIPT_THAANA 

Thaa

I18N_USCRIPT_THAI 

Thai

I18N_USCRIPT_TIBETAN 

Tibt

I18N_USCRIPT_CANADIAN_ABORIGINAL 

Cans, Canadian_Aboriginal script.

I18N_USCRIPT_UCAS 

Canadian_Aboriginal script (alias).

I18N_USCRIPT_YI 

Yiii

I18N_USCRIPT_TAGALOG 

Tglg

I18N_USCRIPT_HANUNOO 

Hano

I18N_USCRIPT_BUHID 

Buhd

I18N_USCRIPT_TAGBANWA 

Tagb

I18N_USCRIPT_BRAILLE 

Brai

I18N_USCRIPT_CYPRIOT 

Cprt

I18N_USCRIPT_LIMBU 

Limb

I18N_USCRIPT_LINEAR_B 

Linb

I18N_USCRIPT_OSMANYA 

Osma

I18N_USCRIPT_SHAVIAN 

Shaw

I18N_USCRIPT_TAI_LE 

Tale

I18N_USCRIPT_UGARITIC 

Ugar

I18N_USCRIPT_KATAKANA_OR_HIRAGANA 

Hrkt

I18N_USCRIPT_BUGINESE 

Bugi

I18N_USCRIPT_GLAGOLITIC 

Glag

I18N_USCRIPT_KHAROSHTHI 

Khar

I18N_USCRIPT_SYLOTI_NAGRI 

Sylo

I18N_USCRIPT_NEW_TAI_LUE 

Talu

I18N_USCRIPT_TIFINAGH 

Tfng

I18N_USCRIPT_OLD_PERSIAN 

Xpeo

I18N_USCRIPT_BALINESE 

Bali

I18N_USCRIPT_BATAK 

Batk

I18N_USCRIPT_BLISSYMBOLS 

Blis

I18N_USCRIPT_BRAHMI 

Brah

I18N_USCRIPT_CHAM 

Cham

I18N_USCRIPT_CIRTH 

Cirt

I18N_USCRIPT_OLD_CHURCH_SLAVONIC_CYRILLIC 

Cyrs

I18N_USCRIPT_DEMOTIC_EGYPTIAN 

Egyd

I18N_USCRIPT_HIERATIC_EGYPTIAN 

Egyh

I18N_USCRIPT_EGYPTIAN_HIEROGLYPHS 

Egyp

I18N_USCRIPT_KHUTSURI 

Geok

I18N_USCRIPT_SIMPLIFIED_HAN 

Hans

I18N_USCRIPT_TRADITIONAL_HAN 

Hant

I18N_USCRIPT_PAHAWH_HMONG 

Hmng

I18N_USCRIPT_OLD_HUNGARIAN 

Hung

I18N_USCRIPT_HARAPPAN_INDUS 

Inds

I18N_USCRIPT_JAVANESE 

Java

I18N_USCRIPT_KAYAH_LI 

Kali

I18N_USCRIPT_LATIN_FRAKTUR 

Latf

I18N_USCRIPT_LATIN_GAELIC 

Latg

I18N_USCRIPT_LEPCHA 

Lepc

I18N_USCRIPT_LINEAR_A 

Lina

I18N_USCRIPT_MANDAIC 

Mand

I18N_USCRIPT_MAYAN_HIEROGLYPHS 

Maya

I18N_USCRIPT_MEROITIC_HIEROGLYPHS 

Mero

I18N_USCRIPT_NKO 

Nkoo

I18N_USCRIPT_ORKHON 

Orkh

I18N_USCRIPT_OLD_PERMIC 

Perm

I18N_USCRIPT_PHAGS_PA 

Phag

I18N_USCRIPT_PHOENICIAN 

Phnx

I18N_USCRIPT_PHONETIC_POLLARD 

Plrd

I18N_USCRIPT_RONGORONGO 

Roro

I18N_USCRIPT_SARATI 

Sara

I18N_USCRIPT_ESTRANGELO_SYRIAC 

Syre

I18N_USCRIPT_WESTERN_SYRIAC 

Syrj

I18N_USCRIPT_EASTERN_SYRIAC 

Syrn

I18N_USCRIPT_TENGWAR 

Teng

I18N_USCRIPT_VAI 

Vaii

I18N_USCRIPT_VISIBLE_SPEECH 

Visp

I18N_USCRIPT_CUNEIFORM 

Xsux

I18N_USCRIPT_UNWRITTEN_LANGUAGES 

Zxxx

I18N_USCRIPT_UNKNOWN 

Zzzz, Unknown="Code for uncoded script", for unassigned code points

I18N_USCRIPT_CARIAN 

Cari

I18N_USCRIPT_JAPANESE 

Jpan

I18N_USCRIPT_LANNA 

Lana

I18N_USCRIPT_LYCIAN 

Lyci

I18N_USCRIPT_LYDIAN 

Lydi

I18N_USCRIPT_OL_CHIKI 

Olck

I18N_USCRIPT_REJANG 

Rjng

I18N_USCRIPT_SAURASHTRA 

Saur

I18N_USCRIPT_SIGN_WRITING 

Sgnw

I18N_USCRIPT_SUNDANESE 

Sund

I18N_USCRIPT_MOON 

Moon

I18N_USCRIPT_MEITEI_MAYEK 

Mtei

I18N_USCRIPT_IMPERIAL_ARAMAIC 

Armi

I18N_USCRIPT_AVESTAN 

Avst

I18N_USCRIPT_CHAKMA 

Cakm

I18N_USCRIPT_KOREAN 

Kore

I18N_USCRIPT_KAITHI 

Kthi

I18N_USCRIPT_MANICHAEAN 

Mani

I18N_USCRIPT_INSCRIPTIONAL_PAHLAVI 

Phli

I18N_USCRIPT_PSALTER_PAHLAVI 

Phlp

I18N_USCRIPT_BOOK_PAHLAVI 

Phlv

I18N_USCRIPT_INSCRIPTIONAL_PARTHIAN 

Prti

I18N_USCRIPT_SAMARITAN 

Samr

I18N_USCRIPT_TAI_VIET 

Tavt

I18N_USCRIPT_MATHEMATICAL_NOTATION 

Zmth

I18N_USCRIPT_SYMBOLS 

Zsym

I18N_USCRIPT_BAMUM 

Bamu

I18N_USCRIPT_LISU 

Lisu

I18N_USCRIPT_NAKHI_GEBA 

Nkgb

I18N_USCRIPT_OLD_SOUTH_ARABIAN 

Sarb

I18N_USCRIPT_BASSA_VAH 

Bass

I18N_USCRIPT_DUPLOYAN_SHORTAND 

Dupl

I18N_USCRIPT_ELBASAN 

Elba

I18N_USCRIPT_GRANTHA 

Gran

I18N_USCRIPT_KPELLE 

Kpel

I18N_USCRIPT_LOMA 

Loma

I18N_USCRIPT_MENDE 

Mend

I18N_USCRIPT_MEROITIC_CURSIVE 

Merc

I18N_USCRIPT_OLD_NORTH_ARABIAN 

Narb

I18N_USCRIPT_NABATAEAN 

Nbat

I18N_USCRIPT_PALMYRENE 

Palm

I18N_USCRIPT_SINDHI 

Sind

I18N_USCRIPT_WARANG_CITI 

Wara

I18N_USCRIPT_AFAKA 

Afak

I18N_USCRIPT_JURCHEN 

Jurc

I18N_USCRIPT_MRO 

Mroo

I18N_USCRIPT_NUSHU 

Nshu

I18N_USCRIPT_SHARADA 

Shrd

I18N_USCRIPT_SORA_SOMPENG 

Sora

I18N_USCRIPT_TAKRI 

Takr

I18N_USCRIPT_TANGUT 

Tang

I18N_USCRIPT_WOLEAI 

Wole

I18N_USCRIPT_ANATOLIAN_HIEROGLYPHS 

Hluw

I18N_USCRIPT_KHOJKI 

Khoj

I18N_USCRIPT_TIRHUTA 

Tirh

I18N_USCRIPT_CODE_LIMIT 

Count of i18n_uscript_code_e enumerators


Function Documentation

int i18n_uchar_get_int_property_value ( i18n_uchar32  c,
i18n_uchar_uproperty_e  which,
int32_t *  property_val 
)

Gets the property value for an enumerated or integer Unicode property for a code point. Also returns binary and mask property values.

int property_value;
i18n_uchar_u_east_asian_width_e east_asian_width;
i18n_uchar_get_int_property_value (c, I18N_UCHAR_EAST_ASIAN_WIDTH, &property_value);
east_asian_width = (i18n_uchar_u_east_asian_width_e)property_value;

int property_value;
bool is_ideographic;
i18n_uchar_get_int_property_value(c, I18N_UCHAR_IDEOGRAPHIC, &property_value);
is_ideographic = (bool)property_value;

Since :
2.3.1
Parameters:
[in] c: The code point to test.
[in] which: The i18n_uchar_uproperty_e selector constant that identifies which property to check.
Must satisfy I18N_UCHAR_BINARY_START <= which < I18N_UCHAR_BINARY_LIMIT, or I18N_UCHAR_INT_START <= which < I18N_UCHAR_INT_LIMIT, or I18N_UCHAR_MASK_START <= which < I18N_UCHAR_MASK_LIMIT.
[out] property_val: The numeric value that is directly the property value or, for enumerated properties, corresponds to the numeric value of the enumerated constant of the respective property value enumeration type (cast to enum type if necessary).
Returns 0 or 1 (for false/true) for binary Unicode properties.
Returns a bit-mask for mask properties.
Returns 0 if 'which' is out of bounds, or if the Unicode version does not have data for the property at all or for this code point.
Return values:
I18N_ERROR_NONE: Successful
I18N_ERROR_INVALID_PARAMETER: Invalid function parameter

int i18n_uchar_get_ublock_code ( i18n_uchar32  c,
i18n_uchar_ublock_code_e *  block_val 
)

Gets the Unicode allocation block that contains the character.

Since :
2.3.1
Parameters:
[in] c: The code point to test
[out] block_val: The block value for the code point
Return values:
I18N_ERROR_NONE: Successful
I18N_ERROR_INVALID_PARAMETER: Invalid function parameter