1
0
mirror of https://github.com/rkd77/elinks.git synced 2024-09-16 01:08:31 -04:00
elinks/src/intl/charsets.h

82 lines
3.0 KiB
C
Raw Normal View History

#ifndef EL__INTL_CHARSETS_H
#define EL__INTL_CHARSETS_H
typedef uint32_t unicode_val_T;
/* UCS/Unicode replacement character. */
#define UCS_NO_CHAR ((unicode_val_T) 0xFFFFFFFD)
/*   replacement character. See u2cp(). */
#define NBSP_CHAR ((unsigned char) 1)
#define NBSP_CHAR_STRING "\001"
struct conv_table {
int t;
union {
unsigned char *str;
struct conv_table *tbl;
} u;
};
enum convert_string_mode {
CSM_DEFAULT, /* Convert any char. */
CSM_QUERY, /* Special handling of '&' and '=' chars. */
CSM_FORM, /* Special handling of '&' and '=' chars in forms. */
CSM_NONE, /* Convert nothing. */
};
struct conv_table *get_translation_table(int, int);
unsigned char *get_entity_string(const unsigned char *str, const int strlen, int encoding);
/* The convert_string() name is also used by Samba (version 3.0.3), which
* provides libnss_wins.so.2, which is called somewhere inside
* _nss_wins_gethostbyname_r(). This name clash causes the elinks hostname
* lookup thread to crash so we need to rename the symbol. */
/* Reported by Derek Poon and filed as bug 453 */
#undef convert_string
#define convert_string convert_string_elinks
/* This routine converts a string from one charset to another according to the
* passed @convert_table, potentially also decoding SGML (HTML) entities along
* the way (according to @mode). It either returns dynamically allocated
* converted string of length @length, or if the @callback is non-NULL it calls
* it each few bytes instead and always returns NULL (@length is undefined).
* Note that it's ok not to care and pass NULL as @length. */
unsigned char *convert_string(struct conv_table *convert_table,
unsigned char *chars, int charslen, int cp,
enum convert_string_mode mode, int *length,
void (*callback)(void *data, unsigned char *buf, int buflen),
void *callback_data);
int get_cp_index(unsigned char *);
unsigned char *get_cp_name(int);
unsigned char *get_cp_mime_name(int);
2006-07-18 11:51:03 -04:00
int is_cp_utf8(int);
void free_conv_table(void);
#ifdef CONFIG_UTF_8
2006-01-14 16:44:00 -05:00
inline unsigned char *encode_utf_8(unicode_val_T);
inline unsigned char *utf8_prevchar(unsigned char *, int, unsigned char *);
inline int utf8charlen(const unsigned char *);
int utf8_char2cells(unsigned char *, unsigned char *);
int utf8_ptr2cells(unsigned char *, unsigned char *);
int utf8_ptr2chars(unsigned char *, unsigned char *);
int utf8_cells2bytes(unsigned char *, int, unsigned char *);
inline int unicode_to_cell(unicode_val_T);
unicode_val_T unicode_fold_label_case(unicode_val_T);
2006-01-14 16:44:00 -05:00
inline int strlen_utf8(unsigned char **);
inline unicode_val_T utf_8_to_unicode(unsigned char **, unsigned char *);
2006-08-13 16:35:50 -04:00
unicode_val_T cp_to_unicode(int, unsigned char **, unsigned char *);
#endif /* CONFIG_UTF_8 */
2006-01-14 16:44:00 -05:00
unicode_val_T cp2u(int, unsigned char);
unsigned char *cp2utf_8(int, int);
unsigned char *u2cp_(unicode_val_T, int, int no_nbsp_hack);
#define u2cp(u, to) u2cp_(u, to, 0)
#define u2cp_no_nbsp(u, to) u2cp_(u, to, 1)
void init_charsets_lookup(void);
void free_charsets_lookup(void);
#endif