#ifndef EL__DOCUMENT_HTML_PARSER_H #define EL__DOCUMENT_HTML_PARSER_H #include "document/format.h" #include "intl/charsets.h" /* unicode_val_T */ #include "util/align.h" #include "util/color.h" #include "util/lists.h" struct document_options; struct form_control; struct frameset_desc; struct html_context; struct memory_list; struct menu_item; struct part; struct string; struct uri; /* XXX: This is just terible - this interface is from 75% only for other HTML * files - there's lack of any well defined interface and it's all randomly * mixed up :/. */ struct text_attrib { struct text_style style; int fontsize; unsigned char *link; unsigned char *target; unsigned char *image; unsigned char *title; struct form_control *form; color_T clink; color_T vlink; #ifdef CONFIG_BOOKMARKS color_T bookmark_link; #endif color_T image_link; #ifdef CONFIG_CSS /* Bug 766: CSS speedup. 56% of CPU time was going to * get_attr_value(). Of those calls, 97% were asking for "id" * or "class". So cache the results. start_element() sets up * these pointers if html_context->options->css_enable; * otherwise they remain NULL. */ unsigned char *id; unsigned char *class; #endif unsigned char *select; int select_disabled; unsigned int tabindex; unicode_val_T accesskey; unsigned char *onclick; unsigned char *ondblclick; unsigned char *onmouseover; unsigned char *onhover; unsigned char *onfocus; unsigned char *onmouseout; unsigned char *onblur; }; /* This enum is pretty ugly, yes ;). */ enum format_list_flag { P_NONE = 0, P_NUMBER = 1, P_alpha = 2, P_ALPHA = 3, P_roman = 4, P_ROMAN = 5, P_STAR = 1, P_O = 2, P_PLUS = 3, P_LISTMASK = 7, P_COMPACT = 8, }; struct par_attrib { enum format_align align; int leftmargin; int rightmargin; int width; int list_level; unsigned list_number; int dd_margin; enum format_list_flag flags; color_T bgcolor; }; /* HTML parser stack mortality info */ enum html_element_mortality_type { /* Elements of this type can not be removed from the stack. This type * is created by the renderer when formatting a HTML part. */ ELEMENT_IMMORTAL, /* Elements of this type can only be removed by elements of the start * type. This type is created whenever a HTML state is created using * init_html_parser_state(). */ /* The element has been created by*/ ELEMENT_DONT_KILL, /* These elements can safely be removed from the stack by both */ ELEMENT_KILLABLE, /* These elements not only cannot bear any other elements inside but * any attempt to do so will cause them to terminate. This is so deadly * that it affects even invisible elements. Ie. foo<body>. */ ELEMENT_WEAK, }; struct html_element { LIST_HEAD(struct html_element); enum html_element_mortality_type type; struct text_attrib attr; struct par_attrib parattr; int invisible; unsigned char *name; int namelen; unsigned char *options; /* See document/html/parser/parse.c's element_info.linebreak * description. */ int linebreak; struct frameset_desc *frameset; /* For the needs of CSS engine. A wannabe bitmask. */ enum html_element_pseudo_class { ELEMENT_LINK = 1, ELEMENT_VISITED = 2, } pseudo_class; }; #define is_inline_element(e) (e->linebreak == 0) #define is_block_element(e) (e->linebreak > 0) enum html_special_type { SP_TAG, SP_FORM, SP_CONTROL, SP_TABLE, SP_USED, SP_FRAMESET, SP_FRAME, SP_NOWRAP, SP_CACHE_CONTROL, SP_CACHE_EXPIRES, SP_REFRESH, SP_STYLESHEET, SP_COLOR_LINK_LINES, SP_SCRIPT, }; /* Interface for the renderer */ struct html_context * init_html_parser(struct uri *uri, struct document_options *options, unsigned char *start, unsigned char *end, struct string *head, struct string *title, void (*put_chars)(struct html_context *, unsigned char *, int), void (*line_break)(struct html_context *), void *(*special)(struct html_context *, enum html_special_type, ...)); void done_html_parser(struct html_context *html_context); struct html_element *init_html_parser_state(struct html_context *html_context, enum html_element_mortality_type type, int align, int margin, int width); void done_html_parser_state(struct html_context *html_context, struct html_element *element); /* Interface for the table handling */ int get_bgcolor(struct html_context *html_context, unsigned char *a, color_T *rgb); void set_fragment_identifier(struct html_context *html_context, unsigned char *attr_name, unsigned char *attr); void add_fragment_identifier(struct html_context *html_context, struct part *, unsigned char *attr); /* Interface for the viewer */ int get_image_map(unsigned char *head, unsigned char *pos, unsigned char *eof, struct menu_item **menu, struct memory_list **ml, struct uri *uri, struct document_options *options, unsigned char *target_base, int to, int def, int hdef); /* For html/parser/forms.c,general.c,link.c,parse.c,stack.c */ /* Ensure that there are at least n successive line-breaks at the current * position, but don't add more than necessary to bring the current number * of successive line-breaks above n. * * For example, there should be two line-breaks after a <br>, but multiple * successive <br>'s warrant still only two line-breaks. ln_break will be * called with n = 2 for each of multiple successive <br>'s, but ln_break * will only add two line-breaks for the entire run of <br>'s. */ void ln_break(struct html_context *html_context, int n); int get_color(struct html_context *html_context, unsigned char *a, unsigned char *c, color_T *rgb); #endif