#include <sys/types.h>
Include dependency graph for ut_charset.h:
This graph shows which files directly or indirectly include this file:
Go to the source code of this file.
Classes | |
struct | UtCharType |
Description of a character. More... | |
struct | UtCharset |
Contains information about a charset. More... | |
Defines | |
#define | UT_CTG_PONCT_IF_N UT_CTG_PONCT_INIT_OTHER-UT_CTG_PONCT_INIT_0+1 |
Typedefs | |
typedef enum UtCateg | UtCateg |
Categories to classify characters. | |
typedef u_char | UtScript |
typedef UtCharType | UtCharType |
Description of a character. | |
typedef enum UtCharsetType | UtCharsetType |
typedef UtCharset | UtCharset |
Contains information about a charset. | |
Enumerations | |
enum | UtCateg { UT_CTG_UNSET = 0, UT_CTG_UPPERCASE, UT_CTG_LOWERCASE, UT_CTG_OTHER_LETTER, UT_CTG_NUMBER, UT_CTG_PONCTUATION, UT_CTG_PONCT_INIT_0, UT_CTG_PONCT_INIT_1, UT_CTG_PONCT_INIT_2, UT_CTG_PONCT_INIT_3, UT_CTG_PONCT_INIT_OTHER, UT_CTG_PONCT_FINAL_0, UT_CTG_PONCT_FINAL_1, UT_CTG_PONCT_FINAL_2, UT_CTG_PONCT_FINAL_3, UT_CTG_PONCT_FINAL_OTHER, UT_CTG_CURRENCY, UT_CTG_SYMBOL, UT_CTG_CONTROL, UT_CTG_DELIMITER, UT_CTG_MARK, UT_CTG_OTHER } |
Categories to classify characters. More... | |
enum | UtCharsetType { UT_CST_UNSET = -1, UT_CST_ASCII = 0, UT_CST_UTF_8, UT_CST_UTF_16BE, UT_CST_UTF_16LE, UT_CST_UTF_32BE, UT_CST_UTF_32LE, UT_CST_ASCII_EXTENSION } |
Variables | |
const char * | UT_CHARSET_NAME [] |
Charset Name. |
Definition in file ut_charset.h.
|
Categories to classify characters. They are inspired by ftp://ftp.unicode.org/Public/UNIDATA/UCD.html#General_Category_Values
Referenced by ut_xascii_pass(). |
|
Contains information about a charset. This structure is used to describe a charset. It is stored as an array in UtSession::charset. This array is created from the file charsets.dat by ut_load_charsets() (called in ut_init()); it is destroyed in ut_finish(). |
|
Charset type. ASCII extension means single-byte charsets whose first 128 characters are the same as ASCII's. Referenced by parse_charmap_line(). |
|
Type of alphabet (Latin, Cyrillic, Arabic, Greek, Hebrew, Thai...). The index is the same as for the array SCRIPT_NAME in ut_charset.c. Definition at line 76 of file ut_charset.h. Referenced by ut_xascii_pass(). |
|
Categories to classify characters. They are inspired by ftp://ftp.unicode.org/Public/UNIDATA/UCD.html#General_Category_Values
Definition at line 45 of file ut_charset.h. |
|
Charset type. ASCII extension means single-byte charsets whose first 128 characters are the same as ASCII's.
Definition at line 110 of file ut_charset.h. |