#include <sys/types.h>

Include dependency graph for ut_charset.h:

This graph shows which files directly or indirectly include this file:

Go to the source code of this file.
Classes | |
| struct | UtCharType |
| Description of a character. More... | |
| struct | UtCharset |
| Contains information about a charset. More... | |
Defines | |
| #define | UT_CTG_PONCT_IF_N UT_CTG_PONCT_INIT_OTHER-UT_CTG_PONCT_INIT_0+1 |
Typedefs | |
| typedef enum UtCateg | UtCateg |
| Categories to classify characters. | |
| typedef u_char | UtScript |
| typedef UtCharType | UtCharType |
| Description of a character. | |
| typedef enum UtCharsetType | UtCharsetType |
| typedef UtCharset | UtCharset |
| Contains information about a charset. | |
Enumerations | |
| enum | UtCateg { UT_CTG_UNSET = 0, UT_CTG_UPPERCASE, UT_CTG_LOWERCASE, UT_CTG_OTHER_LETTER, UT_CTG_NUMBER, UT_CTG_PONCTUATION, UT_CTG_PONCT_INIT_0, UT_CTG_PONCT_INIT_1, UT_CTG_PONCT_INIT_2, UT_CTG_PONCT_INIT_3, UT_CTG_PONCT_INIT_OTHER, UT_CTG_PONCT_FINAL_0, UT_CTG_PONCT_FINAL_1, UT_CTG_PONCT_FINAL_2, UT_CTG_PONCT_FINAL_3, UT_CTG_PONCT_FINAL_OTHER, UT_CTG_CURRENCY, UT_CTG_SYMBOL, UT_CTG_CONTROL, UT_CTG_DELIMITER, UT_CTG_MARK, UT_CTG_OTHER } |
| Categories to classify characters. More... | |
| enum | UtCharsetType { UT_CST_UNSET = -1, UT_CST_ASCII = 0, UT_CST_UTF_8, UT_CST_UTF_16BE, UT_CST_UTF_16LE, UT_CST_UTF_32BE, UT_CST_UTF_32LE, UT_CST_ASCII_EXTENSION } |
Variables | |
| const char * | UT_CHARSET_NAME [] |
| Charset Name. | |
Definition in file ut_charset.h.
|
|
Categories to classify characters. They are inspired by ftp://ftp.unicode.org/Public/UNIDATA/UCD.html#General_Category_Values
Referenced by ut_xascii_pass(). |
|
|
Contains information about a charset. This structure is used to describe a charset. It is stored as an array in UtSession::charset. This array is created from the file charsets.dat by ut_load_charsets() (called in ut_init()); it is destroyed in ut_finish(). |
|
|
Charset type. ASCII extension means single-byte charsets whose first 128 characters are the same as ASCII's. Referenced by parse_charmap_line(). |
|
|
Type of alphabet (Latin, Cyrillic, Arabic, Greek, Hebrew, Thai...). The index is the same as for the array SCRIPT_NAME in ut_charset.c. Definition at line 76 of file ut_charset.h. Referenced by ut_xascii_pass(). |
|
|
Categories to classify characters. They are inspired by ftp://ftp.unicode.org/Public/UNIDATA/UCD.html#General_Category_Values
Definition at line 45 of file ut_charset.h. |
|
|
Charset type. ASCII extension means single-byte charsets whose first 128 characters are the same as ASCII's.
Definition at line 110 of file ut_charset.h. |
1.3.9