|
Data Structures |
| struct | utf32_nfkd |
| | The upper 8 bit of c are reserved for flags. More...
|
| struct | utf32_comb_class |
| struct | utf32_general_category |
Defines |
| #define | UTF32_NFKD_REPLACE_MAXLEN 18 |
| #define | UTF32_F_MASK 0xff000000U |
| #define | UTF32_F_NFKD 0x80000000U /**< Set for compatibility compositions */ |
| | Set for compatibility compositions.
|
| #define | UTF32_NFD(x) (x) |
| #define | UTF32_NFKD(x) (UTF32_F_NFKD | (x)) |
| #define | UNI_GC_LU UNI_GC_LETTER_UPPERCASE |
| #define | UNI_GC_LL UNI_GC_LETTER_LOWERCASE |
| #define | UNI_GC_LT UNI_GC_LETTER_TITLECASE |
| #define | UNI_GC_LM UNI_GC_LETTER_MODIFIER |
| #define | UNI_GC_LO UNI_GC_LETTER_OTHER |
| #define | UNI_GC_MN UNI_GC_MARK_NONSPACING |
| #define | UNI_GC_MC UNI_GC_MARK_SPACING_COMBINE |
| #define | UNI_GC_ME UNI_GC_MARK_ENCLOSING |
| #define | UNI_GC_ND UNI_GC_NUMBER_DECIMAL |
| #define | UNI_GC_NL UNI_GC_NUMBER_LETTER |
| #define | UNI_GC_NO UNI_GC_NUMBER_OTHER |
| #define | UNI_GC_PC UNI_GC_PUNCT_CONNECTOR |
| #define | UNI_GC_PD UNI_GC_PUNCT_DASH |
| #define | UNI_GC_PS UNI_GC_PUNCT_OPEN |
| #define | UNI_GC_PE UNI_GC_PUNCT_CLOSE |
| #define | UNI_GC_PI UNI_GC_PUNCT_INIT_QUOTE |
| #define | UNI_GC_PF UNI_GC_PUNCT_FINAL_QUOTE |
| #define | UNI_GC_PO UNI_GC_PUNCT_OTHER |
| #define | UNI_GC_SM UNI_GC_SYMBOL_MATH |
| #define | UNI_GC_SC UNI_GC_SYMBOL_CURRENCY |
| #define | UNI_GC_SK UNI_GC_SYMBOL_MODIFIER |
| #define | UNI_GC_SO UNI_GC_SYMBOL_OTHER |
| #define | UNI_GC_ZS UNI_GC_SEPARATOR_SPACE |
| #define | UNI_GC_ZL UNI_GC_SEPARATOR_LINE |
| #define | UNI_GC_ZP UNI_GC_SEPARATOR_PARAGRAPH |
| #define | UNI_GC_CC UNI_GC_OTHER_CONTROL |
| #define | UNI_GC_CF UNI_GC_OTHER_FORMAT |
| #define | UNI_GC_CS UNI_GC_OTHER_SURROGATE |
| #define | UNI_GC_CO UNI_GC_OTHER_PRIVATE_USE |
| #define | UNI_GC_CN UNI_GC_OTHER_NOT_ASSIGNED |
Enumerations |
| enum | uni_gc_t {
UNI_GC_LETTER_UPPERCASE = 0,
UNI_GC_LETTER_LOWERCASE,
UNI_GC_LETTER_TITLECASE,
UNI_GC_LETTER_MODIFIER,
UNI_GC_LETTER_OTHER,
UNI_GC_MARK_NONSPACING,
UNI_GC_MARK_SPACING_COMBINE,
UNI_GC_MARK_ENCLOSING,
UNI_GC_NUMBER_DECIMAL,
UNI_GC_NUMBER_LETTER,
UNI_GC_NUMBER_OTHER,
UNI_GC_PUNCT_CONNECTOR,
UNI_GC_PUNCT_DASH,
UNI_GC_PUNCT_OPEN,
UNI_GC_PUNCT_CLOSE,
UNI_GC_PUNCT_INIT_QUOTE,
UNI_GC_PUNCT_FINAL_QUOTE,
UNI_GC_PUNCT_OTHER,
UNI_GC_SYMBOL_MATH,
UNI_GC_SYMBOL_CURRENCY,
UNI_GC_SYMBOL_MODIFIER,
UNI_GC_SYMBOL_OTHER,
UNI_GC_SEPARATOR_SPACE,
UNI_GC_SEPARATOR_LINE,
UNI_GC_SEPARATOR_PARAGRAPH,
UNI_GC_OTHER_CONTROL,
UNI_GC_OTHER_FORMAT,
UNI_GC_OTHER_SURROGATE,
UNI_GC_OTHER_PRIVATE_USE,
UNI_GC_OTHER_NOT_ASSIGNED
} |
Variables |
| struct { |
| const guchar start |
| const guchar end |
| } | utf8_2nd_byte_tab [64] |
| const struct utf32_nfkd | utf32_nfkd_lut [] |
| | The upper 8 bit of c are reserved for flags.
|
| struct { |
| guint16 lower |
| guint16 upper |
| } | utf32_uppercase_lut [] |
| struct { |
| guint16 upper |
| guint16 lower |
| } | utf32_lowercase_lut [] |
| const struct utf32_comb_class | utf32_comb_class_lut [] |
| const guint32 | utf32_composition_exclusions [] |
| | These are special exlusions which cannot be derived from UnicodeData.txt but are listed in CompositionExclusions.txt.
|
| const struct utf32_general_category | utf32_general_category_lut [] |
| struct { |
| guint32 start |
| guint32 end |
| } | utf32_block_id_lut [] |
| struct { |
| guint32 uc |
| guint16 len |
| } | utf32_normalization_specials [] |
| | This table is huge! It can be generated with the following AWK script:.
|
| struct { |
| guint16 uc |
| const char s [4] |
| } | jap_tab [] |