mirror of
https://github.com/rkd77/elinks.git
synced 2025-01-03 14:57:44 -05:00
68 lines
2.3 KiB
C
68 lines
2.3 KiB
C
|
/* $Id: charsets.h,v 1.26 2005/07/15 20:17:25 miciah Exp $ */
|
||
|
|
||
|
#ifndef EL__INTL_CHARSETS_H
|
||
|
#define EL__INTL_CHARSETS_H
|
||
|
|
||
|
typedef uint32_t unicode_val_T;
|
||
|
|
||
|
/* UCS/Unicode replacement character. */
|
||
|
#define UCS_NO_CHAR ((unicode_val_T) 0xFFFD)
|
||
|
|
||
|
/* replacement character. See u2cp(). */
|
||
|
#define NBSP_CHAR ((unsigned char) 1)
|
||
|
#define NBSP_CHAR_STRING "\001"
|
||
|
|
||
|
struct conv_table {
|
||
|
int t;
|
||
|
union {
|
||
|
unsigned char *str;
|
||
|
struct conv_table *tbl;
|
||
|
} u;
|
||
|
};
|
||
|
|
||
|
enum convert_string_mode {
|
||
|
CSM_DEFAULT, /* Convert any char. */
|
||
|
CSM_QUERY, /* Special handling of '&' and '=' chars. */
|
||
|
CSM_FORM, /* Special handling of '&' and '=' chars in forms. */
|
||
|
CSM_NONE, /* Convert nothing. */
|
||
|
};
|
||
|
|
||
|
struct conv_table *get_translation_table(int, int);
|
||
|
unsigned char *get_entity_string(const unsigned char *str, const int strlen, int encoding);
|
||
|
|
||
|
/* The convert_string() name is also used by Samba (version 3.0.3), which
|
||
|
* provides libnss_wins.so.2, which is called somewhere inside
|
||
|
* _nss_wins_gethostbyname_r(). This name clash causes the elinks hostname
|
||
|
* lookup thread to crash so we need to rename the symbol. */
|
||
|
/* Reported by Derek Poon and filed as bug 453 */
|
||
|
#undef convert_string
|
||
|
#define convert_string convert_string_elinks
|
||
|
|
||
|
/* This routine converts a string from one charset to another according to the
|
||
|
* passed @convert_table, potentially also decoding SGML (HTML) entities along
|
||
|
* the way (according to @mode). It either returns dynamically allocated
|
||
|
* converted string of length @length, or if the @callback is non-NULL it calls
|
||
|
* it each few bytes instead and always returns NULL (@length is undefined).
|
||
|
* Note that it's ok not to care and pass NULL as @length. */
|
||
|
unsigned char *convert_string(struct conv_table *convert_table,
|
||
|
unsigned char *chars, int charslen, int cp,
|
||
|
enum convert_string_mode mode, int *length,
|
||
|
void (*callback)(void *data, unsigned char *buf, int buflen),
|
||
|
void *callback_data);
|
||
|
|
||
|
int get_cp_index(unsigned char *);
|
||
|
unsigned char *get_cp_name(int);
|
||
|
unsigned char *get_cp_mime_name(int);
|
||
|
int is_cp_special(int);
|
||
|
void free_conv_table(void);
|
||
|
unsigned char *cp2utf_8(int, int);
|
||
|
|
||
|
unsigned char *u2cp_(unicode_val_T, int, int no_nbsp_hack);
|
||
|
#define u2cp(u, to) u2cp_(u, to, 0)
|
||
|
#define u2cp_no_nbsp(u, to) u2cp_(u, to, 1)
|
||
|
|
||
|
void init_charsets_lookup(void);
|
||
|
void free_charsets_lookup(void);
|
||
|
|
||
|
#endif
|