1
0
mirror of https://github.com/rkd77/elinks.git synced 2025-01-03 14:57:44 -05:00
elinks/src/document/html/renderer.c
Pavol Babincak f9d67aeb73 Added configure option --enable-utf-8
For enabling better UTF-8 support by Witek and Scrool.
2006-02-18 20:28:00 +01:00

2197 lines
54 KiB
C

/* HTML renderer */
#ifdef HAVE_CONFIG_H
#include "config.h"
#endif
#include <ctype.h>
#include <stdarg.h>
#include <string.h>
#include "elinks.h"
#include "cache/cache.h"
#include "config/options.h"
#include "document/docdata.h"
#include "document/document.h"
#include "document/html/frames.h"
#include "document/html/parser.h"
#include "document/html/parser/parse.h"
#include "document/html/renderer.h"
#include "document/html/tables.h"
#include "document/options.h"
#include "document/refresh.h"
#include "document/renderer.h"
#include "intl/charsets.h"
#include "osdep/types.h"
#include "protocol/uri.h"
#include "session/session.h"
#include "terminal/color.h"
#include "terminal/draw.h"
#include "util/color.h"
#include "util/conv.h"
#include "util/error.h"
#include "util/hash.h"
#include "util/lists.h"
#include "util/memory.h"
#include "util/string.h"
#include "util/time.h"
#include "viewer/text/form.h"
#include "viewer/text/view.h"
#include "viewer/text/vs.h"
/* Unsafe macros */
#include "document/html/internal.h"
/* Types and structs */
/* Tags are used for ``id''s or anchors in the document referenced by the
* fragment part of the URI. */
/* FIXME: This and find_tag() should be part of the general infrastructure
* in document/document.*. --pasky */
struct tag {
LIST_HEAD(struct tag);
int x, y;
unsigned char name[1]; /* must be last of struct. --Zas */
};
enum link_state {
LINK_STATE_NONE,
LINK_STATE_NEW,
LINK_STATE_SAME,
};
struct link_state_info {
unsigned char *link;
unsigned char *target;
unsigned char *image;
struct form_control *form;
};
struct table_cache_entry_key {
unsigned char *start;
unsigned char *end;
int align;
int margin;
int width;
int x;
int link_num;
};
struct table_cache_entry {
LIST_HEAD(struct table_cache_entry);
struct table_cache_entry_key key;
struct part part;
};
/* Max. entries in table cache used for nested tables. */
#define MAX_TABLE_CACHE_ENTRIES 16384
/* Global variables */
static int table_cache_entries;
static struct hash *table_cache;
struct renderer_context {
int last_link_to_move;
struct tag *last_tag_to_move;
/* All tags between document->tags and this tag (inclusive) should
* be aligned to the next line break, unless some real content follows
* the tag. Therefore, this virtual tags list accumulates new tags as
* they arrive and empties when some real content is written; if a line
* break is inserted in the meanwhile, the tags follow it (ie. imagine
* <a name="x"> <p>, then the "x" tag follows the line breaks inserted
* by the <p> tag). */
struct tag *last_tag_for_newline;
struct link_state_info link_state_info;
struct conv_table *convert_table;
/* Used for setting cache info from HTTP-EQUIV meta tags. */
struct cache_entry *cached;
int g_ctrl_num;
int subscript; /* Count stacked subscripts */
int supscript; /* Count stacked supscripts */
unsigned int empty_format:1;
unsigned int nobreak:1;
unsigned int nosearchable:1;
unsigned int nowrap:1; /* Activated/deactivated by SP_NOWRAP. */
};
static struct renderer_context renderer_context;
/* Prototypes */
void line_break(struct html_context *);
void put_chars(struct html_context *, unsigned char *, int);
#define X(x_) (part->box.x + (x_))
#define Y(y_) (part->box.y + (y_))
#define SPACES_GRANULARITY 0x7F
#define ALIGN_SPACES(x, o, n) mem_align_alloc(x, o, n, SPACES_GRANULARITY)
static inline void
set_screen_char_color(struct screen_char *schar,
color_T bgcolor, color_T fgcolor,
enum color_flags color_flags,
enum color_mode color_mode)
{
struct color_pair colors = INIT_COLOR_PAIR(bgcolor, fgcolor);
set_term_color(schar, &colors, color_flags, color_mode);
}
static int
realloc_line(struct html_context *html_context, struct document *document,
int y, int length)
{
struct screen_char *pos, *end;
struct line *line;
if (!realloc_lines(document, y))
return -1;
line = &document->data[y];
if (length < line->length)
return 0;
if (!ALIGN_LINE(&line->chars, line->length, length + 1))
return -1;
/* We cannot rely on the aligned allocation to clear the members for us
* since for line splitting we simply trim the length. Question is if
* it is better to to clear the line after the splitting or here. */
end = &line->chars[length];
end->data = ' ';
end->attr = 0;
set_screen_char_color(end, par_format.bgcolor, 0x0,
0, document->options.color_mode);
for (pos = &line->chars[line->length]; pos < end; pos++) {
copy_screen_chars(pos, end, 1);
}
line->length = length + 1;
return 0;
}
void
expand_lines(struct html_context *html_context, struct part *part,
int x, int y, int lines, color_T bgcolor)
{
int line;
assert(part && part->document);
if_assert_failed return;
if (!use_document_bg_colors(&part->document->options))
return;
par_format.bgcolor = bgcolor;
for (line = 0; line < lines; line++)
realloc_line(html_context, part->document, Y(y + line), X(x));
}
static inline int
realloc_spaces(struct part *part, int length)
{
if (length < part->spaces_len)
return 0;
if (!ALIGN_SPACES(&part->spaces, part->spaces_len, length))
return -1;
part->spaces_len = length;
return 0;
}
#define LINE(y_) part->document->data[Y(y_)]
#define POS(x_, y_) LINE(y_).chars[X(x_)]
#define LEN(y_) int_max(LINE(y_).length - part->box.x, 0)
/* When we clear chars we want to preserve and use the background colors
* already in place else we could end up ``staining'' the background especial
* when drawing table cells. So make the cleared chars share the colors in
* place. */
static inline void
clear_hchars(struct html_context *html_context, int x, int y, int width)
{
struct part *part;
struct screen_char *pos, *end;
assert(html_context);
if_assert_failed return;
part = html_context->part;
assert(part && part->document && width > 0);
if_assert_failed return;
if (realloc_line(html_context, part->document, Y(y), X(x) + width - 1))
return;
assert(part->document->data);
if_assert_failed return;
pos = &POS(x, y);
end = pos + width - 1;
end->data = ' ';
end->attr = 0;
set_screen_char_color(end, par_format.bgcolor, 0x0,
0, part->document->options.color_mode);
while (pos < end)
copy_screen_chars(pos++, end, 1);
}
/* TODO: Merge parts with get_format_screen_char(). --jonas */
/* Allocates the required chars on the given line and returns the char at
* position (x, y) ready to be used as a template char. */
static inline struct screen_char *
get_frame_char(struct html_context *html_context, struct part *part,
int x, int y, unsigned char data,
color_T bgcolor, color_T fgcolor)
{
struct screen_char *template;
assert(html_context);
if_assert_failed return NULL;
assert(part && part->document && x >= 0 && y >= 0);
if_assert_failed return NULL;
if (realloc_line(html_context, part->document, Y(y), X(x)))
return NULL;
assert(part->document->data);
if_assert_failed return NULL;
template = &POS(x, y);
template->data = data;
template->attr = SCREEN_ATTR_FRAME;
set_screen_char_color(template, bgcolor, fgcolor,
part->document->options.color_flags,
part->document->options.color_mode);
return template;
}
void
draw_frame_hchars(struct part *part, int x, int y, int width,
unsigned char data, color_T bgcolor, color_T fgcolor,
struct html_context *html_context)
{
struct screen_char *template;
assert(width > 0);
if_assert_failed return;
template = get_frame_char(html_context, part, x + width - 1, y, data, bgcolor, fgcolor);
if (!template) return;
/* The template char is the last we need to draw so only decrease @width. */
for (width -= 1; width; width--, x++) {
copy_screen_chars(&POS(x, y), template, 1);
}
}
void
draw_frame_vchars(struct part *part, int x, int y, int height,
unsigned char data, color_T bgcolor, color_T fgcolor,
struct html_context *html_context)
{
struct screen_char *template = get_frame_char(html_context, part, x, y,
data, bgcolor, fgcolor);
if (!template) return;
/* The template char is the first vertical char to be drawn. So
* copy it to the rest. */
for (height -= 1, y += 1; height; height--, y++) {
if (realloc_line(html_context, part->document, Y(y), X(x)))
return;
copy_screen_chars(&POS(x, y), template, 1);
}
}
static inline struct screen_char *
get_format_screen_char(struct html_context *html_context,
enum link_state link_state)
{
static struct text_attrib_style ta_cache = { -1, 0x0, 0x0 };
static struct screen_char schar_cache;
if (memcmp(&ta_cache, &format.style, sizeof(ta_cache))) {
copy_struct(&ta_cache, &format.style);
schar_cache.attr = 0;
if (format.style.attr & ~(AT_UPDATE_SUB|AT_UPDATE_SUP)) {
if (format.style.attr & AT_UNDERLINE) {
schar_cache.attr |= SCREEN_ATTR_UNDERLINE;
}
if (format.style.attr & AT_BOLD) {
schar_cache.attr |= SCREEN_ATTR_BOLD;
}
if (format.style.attr & AT_ITALIC) {
schar_cache.attr |= SCREEN_ATTR_ITALIC;
}
if (format.style.attr & AT_GRAPHICS) {
schar_cache.attr |= SCREEN_ATTR_FRAME;
}
}
if (link_state != LINK_STATE_NONE
&& html_context->options->underline_links) {
schar_cache.attr |= SCREEN_ATTR_UNDERLINE;
}
set_screen_char_color(&schar_cache, format.style.bg, format.style.fg,
html_context->options->color_flags,
html_context->options->color_mode);
if (html_context->options->display_subs) {
if (format.style.attr & AT_SUBSCRIPT) {
if (format.style.attr & AT_UPDATE_SUB) {
renderer_context.subscript++;
format.style.attr &= ~AT_UPDATE_SUB;
put_chars(html_context, "[", 1);
}
} else {
while (renderer_context.subscript) {
renderer_context.subscript--;
put_chars(html_context, "]", 1);
}
}
}
if (html_context->options->display_sups) {
if (format.style.attr & AT_SUPERSCRIPT) {
if (format.style.attr & AT_UPDATE_SUP) {
renderer_context.supscript++;
format.style.attr &= ~AT_UPDATE_SUP;
put_chars(html_context, "^", 1);
}
} else {
while (renderer_context.supscript)
renderer_context.supscript--;
}
}
}
if (!!(schar_cache.attr & SCREEN_ATTR_UNSEARCHABLE)
^ !!renderer_context.nosearchable) {
schar_cache.attr ^= SCREEN_ATTR_UNSEARCHABLE;
}
return &schar_cache;
}
#ifdef CONFIG_UTF_8
/* First possibly do the format change and then find out what coordinates
* to use since sub- or superscript might change them */
static inline int
set_hline(struct html_context *html_context, unsigned char *chars, int charslen,
enum link_state link_state)
{
struct part *part = html_context->part;
struct screen_char *schar = get_format_screen_char(html_context,
link_state);
int x = part->cx;
int y = part->cy;
int x2 = x;
int len = charslen;
int utf8 = html_context->options->utf8;
assert(part);
if_assert_failed return len;
assert(charslen >= 0);
if (realloc_spaces(part, x + charslen))
return len;
if (part->document) {
if (realloc_line(html_context, part->document,
Y(y), X(x) + charslen - 1))
return len;
if (utf8) {
unsigned char *end;
for (end = chars + charslen; chars < end; x++) {
if (*chars == NBSP_CHAR) {
schar->data = ' ';
part->spaces[x] = html_context->options->wrap_nbsp;
chars++;
} else {
unicode_val_T data;
part->spaces[x] = (*chars == ' ');
data = utf_8_to_unicode(&chars, end);
if (data == UCS_NO_CHAR) {
/* HR */
unsigned char attr = schar->attr;
schar->data = *chars++;
schar->attr = SCREEN_ATTR_FRAME;
copy_screen_chars(&POS(x, y), schar, 1);
schar->attr = attr;
continue;
} else {
schar->data = (uint16_t)data;
}
}
copy_screen_chars(&POS(x, y), schar, 1);
}
} else {
for (; charslen > 0; charslen--, x++, chars++) {
if (*chars == NBSP_CHAR) {
schar->data = ' ';
part->spaces[x] = html_context->options->wrap_nbsp;
} else {
part->spaces[x] = (*chars == ' ');
schar->data = *chars;
}
copy_screen_chars(&POS(x, y), schar, 1);
}
}
len = x - x2;
} else {
if (utf8) {
unsigned char *end;
for (end = chars + charslen; chars < end; x++) {
unicode_val_T data;
part->spaces[x] = (*chars == ' ');
data = utf_8_to_unicode(&chars, end);
if (data == UCS_NO_CHAR) chars++;
}
len = x - x2;
} else {
for (; charslen > 0; charslen--, x++, chars++) {
part->spaces[x] = (*chars == ' ');
}
}
}
return len;
}
#else
/* First possibly do the format change and then find out what coordinates
* to use since sub- or superscript might change them */
static inline void
set_hline(struct html_context *html_context, unsigned char *chars, int charslen,
enum link_state link_state)
{
struct part *part = html_context->part;
struct screen_char *schar = get_format_screen_char(html_context,
link_state);
int x = part->cx;
int y = part->cy;
assert(part);
if_assert_failed return;
if (realloc_spaces(part, x + charslen))
return;
if (part->document) {
if (realloc_line(html_context, part->document,
Y(y), X(x) + charslen - 1))
return;
for (; charslen > 0; charslen--, x++, chars++) {
if (*chars == NBSP_CHAR) {
schar->data = ' ';
part->spaces[x] = html_context->options->wrap_nbsp;
} else {
part->spaces[x] = (*chars == ' ');
schar->data = *chars;
}
copy_screen_chars(&POS(x, y), schar, 1);
}
} else {
for (; charslen > 0; charslen--, x++, chars++) {
part->spaces[x] = (*chars == ' ');
}
}
}
#endif /* CONFIG_UTF_8 */
static void
move_links(struct html_context *html_context, int xf, int yf, int xt, int yt)
{
struct part *part;
struct tag *tag;
int nlink = renderer_context.last_link_to_move;
int matched = 0;
assert(html_context);
if_assert_failed return;
part = html_context->part;
assert(part && part->document);
if_assert_failed return;
if (!realloc_lines(part->document, Y(yt)))
return;
for (; nlink < part->document->nlinks; nlink++) {
struct link *link = &part->document->links[nlink];
int i;
for (i = 0; i < link->npoints; i++) {
/* Fix for bug 479 (part one) */
/* The scenario that triggered it:
*
* Imagine a centered element containing a really long
* word (over half of the screen width long) followed
* by a few links with no spaces between them where all
* the link text combined with the really long word
* will force the line to be wrapped. When rendering
* the line first words (including link text words) are
* put on one line. Then wrapping is performed moving
* all links from current line to the one below. Then
* the current line (now only containing the really
* long word) is centered. This will trigger a call to
* move_links() which will increment.
*
* Without the fix below the centering of the current
* line will increment last_link_to_move to that of the
* last link which means centering of the next line
* with all the links will only move the last link
* leaving all the other links' points dangling and
* causing buggy link highlighting.
*
* Even links like textareas will be correctly handled
* because @last_link_to_move is a way to optimize how
* many links move_links() will have to iterate and
* this little fix will only decrease the effect of the
* optimization by always ensuring it is never
* incremented too far. */
if (!matched && link->points[i].y > Y(yf)) {
matched = 1;
continue;
}
if (link->points[i].y != Y(yf))
continue;
matched = 1;
if (link->points[i].x < X(xf))
continue;
if (yt >= 0) {
link->points[i].y = Y(yt);
link->points[i].x += -xf + xt;
} else {
int to_move = link->npoints - (i + 1);
assert(to_move >= 0);
if (to_move > 0) {
memmove(&link->points[i],
&link->points[i + 1],
to_move *
sizeof(*link->points));
i--;
}
link->npoints--;
}
}
if (!matched) {
renderer_context.last_link_to_move = nlink;
}
}
/* Don't move tags when removing links. */
if (yt < 0) return;
matched = 0;
tag = renderer_context.last_tag_to_move;
while (list_has_next(part->document->tags, tag)) {
tag = tag->next;
if (tag->y == Y(yf)) {
matched = 1;
if (tag->x >= X(xf)) {
tag->y = Y(yt);
tag->x += -xf + xt;
}
} else if (!matched && tag->y > Y(yf)) {
/* Fix for bug 479 (part two) */
matched = 1;
}
if (!matched) renderer_context.last_tag_to_move = tag;
}
}
static inline void
copy_chars(struct html_context *html_context, int x, int y, int width, struct screen_char *d)
{
struct part *part;
assert(html_context);
if_assert_failed return;
part = html_context->part;
assert(width > 0 && part && part->document && part->document->data);
if_assert_failed return;
if (realloc_line(html_context, part->document, Y(y), X(x) + width - 1))
return;
copy_screen_chars(&POS(x, y), d, width);
}
static inline void
move_chars(struct html_context *html_context, int x, int y, int nx, int ny)
{
struct part *part;
assert(html_context);
if_assert_failed return;
part = html_context->part;
assert(part && part->document && part->document->data);
if_assert_failed return;
if (LEN(y) - x <= 0) return;
copy_chars(html_context, nx, ny, LEN(y) - x, &POS(x, y));
LINE(y).length = X(x);
move_links(html_context, x, y, nx, ny);
}
static inline void
shift_chars(struct html_context *html_context, int y, int shift)
{
struct part *part;
struct screen_char *a;
int len;
assert(html_context);
if_assert_failed return;
part = html_context->part;
assert(part && part->document && part->document->data);
if_assert_failed return;
len = LEN(y);
a = fmem_alloc(len * sizeof(*a));
if (!a) return;
copy_screen_chars(a, &POS(0, y), len);
clear_hchars(html_context, 0, y, shift);
copy_chars(html_context, shift, y, len, a);
fmem_free(a);
move_links(html_context, 0, y, shift, y);
}
static inline void
del_chars(struct html_context *html_context, int x, int y)
{
struct part *part;
assert(html_context);
if_assert_failed return;
part = html_context->part;
assert(part && part->document && part->document->data);
if_assert_failed return;
LINE(y).length = X(x);
move_links(html_context, x, y, -1, -1);
}
#if TABLE_LINE_PADDING < 0
# define overlap_width(x) (x).width
#else
# define overlap_width(x) int_min((x).width, \
html_context->options->box.width - TABLE_LINE_PADDING)
#endif
#define overlap(x) int_max(overlap_width(x) - (x).rightmargin, 0)
static int inline
split_line_at(struct html_context *html_context, int width)
{
struct part *part;
int tmp;
int new_width = width + par_format.rightmargin;
assert(html_context);
if_assert_failed return 0;
part = html_context->part;
assert(part);
if_assert_failed return 0;
/* Make sure that we count the right margin to the total
* actual box width. */
int_lower_bound(&part->box.width, new_width);
if (part->document) {
assert(part->document->data);
if_assert_failed return 0;
assertm(POS(width, part->cy).data == ' ',
"bad split: %c", POS(width, part->cy).data);
move_chars(html_context, width + 1, part->cy, par_format.leftmargin, part->cy + 1);
del_chars(html_context, width, part->cy);
}
width++; /* Since we were using (x + 1) only later... */
tmp = part->spaces_len - width;
if (tmp > 0) {
/* 0 is possible and I'm paranoid ... --Zas */
memmove(part->spaces, part->spaces + width, tmp);
}
assert(tmp >= 0);
if_assert_failed tmp = 0;
memset(part->spaces + tmp, 0, width);
if (par_format.leftmargin > 0) {
tmp = part->spaces_len - par_format.leftmargin;
assertm(tmp > 0, "part->spaces_len - par_format.leftmargin == %d", tmp);
/* So tmp is zero, memmove() should survive that. Don't recover. */
memmove(part->spaces + par_format.leftmargin, part->spaces, tmp);
}
part->cy++;
if (part->cx == width) {
part->cx = -1;
int_lower_bound(&part->box.height, part->cy);
return 2;
} else {
part->cx -= width - par_format.leftmargin;
int_lower_bound(&part->box.height, part->cy + 1);
return 1;
}
}
/* Here, we scan the line for a possible place where we could split it into two
* (breaking it, because it is too long), if it is overlapping from the maximal
* box width. */
/* Returns 0 if there was found no spot suitable for breaking the line.
* 1 if the line was split into two.
* 2 if the (second) splitted line is blank (that is useful to determine
* ie. if the next line_break() should really break the line; we don't
* want to see any blank lines to pop up, do we?). */
static int
split_line(struct html_context *html_context)
{
struct part *part;
int x;
assert(html_context);
if_assert_failed return 0;
part = html_context->part;
assert(part);
if_assert_failed return 0;
for (x = overlap(par_format); x >= par_format.leftmargin; x--)
if (x < part->spaces_len && part->spaces[x])
return split_line_at(html_context, x);
for (x = par_format.leftmargin; x < part->cx ; x++)
if (x < part->spaces_len && part->spaces[x])
return split_line_at(html_context, x);
/* Make sure that we count the right margin to the total
* actual box width. */
int_lower_bound(&part->box.width, part->cx + par_format.rightmargin);
return 0;
}
/* Insert @new_spaces spaces before the coordinates @x and @y,
* adding those spaces to whatever link is at those coordinates. */
/* TODO: Integrate with move_links. */
static void
insert_spaces_in_link(struct part *part, int x, int y, int new_spaces)
{
int i = part->document->nlinks;
x = X(x);
y = Y(y);
while (i--) {
struct link *link = &part->document->links[i];
int j = link->npoints;
while (j-- > 1) {
struct point *point = &link->points[j];
if (point->x != x || point->y != y)
continue;
if (!realloc_points(link, link->npoints + new_spaces))
return;
link->npoints += new_spaces;
point = &link->points[link->npoints - 1];
while (new_spaces--) {
point->x = --x;
point->y = y;
point--;
}
return;
}
}
}
/* This function is very rare exemplary of clean and beautyful code here.
* Please handle with care. --pasky */
static void
justify_line(struct html_context *html_context, int y)
{
struct part *part;
struct screen_char *line; /* we save original line here */
int len;
int pos;
int *space_list;
int spaces;
int diff;
assert(html_context);
if_assert_failed return;
part = html_context->part;
assert(part && part->document && part->document->data);
if_assert_failed return;
len = LEN(y);
assert(len > 0);
if_assert_failed return;
line = fmem_alloc(len * sizeof(*line));
if (!line) return;
/* It may sometimes happen that the line is only one char long and that
* char is space - then we're going to write to both [0] and [1], but
* we allocated only one field. Thus, we've to do (len + 1). --pasky */
space_list = fmem_alloc((len + 1) * sizeof(*space_list));
if (!space_list) {
fmem_free(line);
return;
}
copy_screen_chars(line, &POS(0, y), len);
/* Skip leading spaces */
spaces = 0;
pos = 0;
while (line[pos].data == ' ')
pos++;
/* Yes, this can be negative, we know. But we add one to it always
* anyway, so it's ok. */
space_list[spaces++] = pos - 1;
/* Count spaces */
for (; pos < len; pos++)
if (line[pos].data == ' ')
space_list[spaces++] = pos;
space_list[spaces] = len;
/* Realign line */
/* Diff is the difference between the width of the paragraph
* and the current length of the line. */
diff = overlap(par_format) - len;
/* We check diff > 0 because diff can be negative (i.e., we have
* an unbroken line of length > overlap(par_format))
* even when spaces > 1 if the line has only non-breaking spaces. */
if (spaces > 1 && diff > 0) {
int prev_end = 0;
int word;
clear_hchars(html_context, 0, y, overlap(par_format));
for (word = 0; word < spaces; word++) {
/* We have to increase line length by 'diff' num. of
* characters, so we move 'word'th word 'word_shift'
* characters right. */
int word_start = space_list[word] + 1;
int word_len = space_list[word + 1] - word_start;
int word_shift;
int new_start;
int new_spaces;
assert(word_len >= 0);
if_assert_failed continue;
if (!word_len) continue;
word_shift = (word * diff) / (spaces - 1);
new_start = word_start + word_shift;
copy_chars(html_context, new_start, y, word_len,
&line[word_start]);
new_spaces = new_start - prev_end - 1;
if (word && new_spaces) {
move_links(html_context, prev_end + 1, y, new_start, y);
insert_spaces_in_link(part,
new_start, y, new_spaces);
}
prev_end = new_start + word_len;
}
}
fmem_free(space_list);
fmem_free(line);
}
static void
align_line(struct html_context *html_context, int y, int last)
{
struct part *part;
int shift;
int len;
assert(html_context);
if_assert_failed return;
part = html_context->part;
assert(part && part->document && part->document->data);
if_assert_failed return;
len = LEN(y);
if (!len || par_format.align == ALIGN_LEFT)
return;
if (par_format.align == ALIGN_JUSTIFY) {
if (!last)
justify_line(html_context, y);
return;
}
shift = overlap(par_format) - len;
if (par_format.align == ALIGN_CENTER)
shift /= 2;
if (shift > 0)
shift_chars(html_context, y, shift);
}
static inline void
init_link_event_hooks(struct html_context *html_context, struct link *link)
{
link->event_hooks = mem_calloc(1, sizeof(*link->event_hooks));
if (!link->event_hooks) return;
#define add_evhook(list_, type_, src_) \
do { \
struct script_event_hook *evhook; \
\
if (!src_) break; \
\
evhook = mem_calloc(1, sizeof(*evhook)); \
if (!evhook) break; \
\
evhook->type = type_; \
evhook->src = stracpy(src_); \
add_to_list(*(list_), evhook); \
} while (0)
init_list(*link->event_hooks);
add_evhook(link->event_hooks, SEVHOOK_ONCLICK, format.onclick);
add_evhook(link->event_hooks, SEVHOOK_ONDBLCLICK, format.ondblclick);
add_evhook(link->event_hooks, SEVHOOK_ONMOUSEOVER, format.onmouseover);
add_evhook(link->event_hooks, SEVHOOK_ONHOVER, format.onhover);
add_evhook(link->event_hooks, SEVHOOK_ONFOCUS, format.onfocus);
add_evhook(link->event_hooks, SEVHOOK_ONMOUSEOUT, format.onmouseout);
add_evhook(link->event_hooks, SEVHOOK_ONBLUR, format.onblur);
#undef add_evhook
}
static struct link *
new_link(struct html_context *html_context, unsigned char *name, int namelen)
{
struct document *document;
struct part *part;
int link_number;
struct link *link;
assert(html_context);
if_assert_failed return NULL;
part = html_context->part;
assert(part);
if_assert_failed return NULL;
document = part->document;
assert(document);
if_assert_failed return NULL;
link_number = part->link_num;
if (!ALIGN_LINK(&document->links, document->nlinks, document->nlinks + 1))
return NULL;
link = &document->links[document->nlinks++];
link->number = link_number - 1;
if (document->options.use_tabindex) link->number += format.tabindex;
link->accesskey = format.accesskey;
link->title = null_or_stracpy(format.title);
link->where_img = null_or_stracpy(format.image);
if (!format.form) {
link->target = null_or_stracpy(format.target);
link->data.name = memacpy(name, namelen);
/* if (strlen(url) > 4 && !strncasecmp(url, "MAP@", 4)) { */
if (format.link
&& ((format.link[0]|32) == 'm')
&& ((format.link[1]|32) == 'a')
&& ((format.link[2]|32) == 'p')
&& (format.link[3] == '@')
&& format.link[4]) {
link->type = LINK_MAP;
link->where = stracpy(format.link + 4);
} else {
link->type = LINK_HYPERTEXT;
link->where = null_or_stracpy(format.link);
}
} else {
struct form_control *fc = format.form;
struct form *form;
switch (fc->type) {
case FC_TEXT:
case FC_PASSWORD:
case FC_FILE:
link->type = LINK_FIELD;
break;
case FC_TEXTAREA:
link->type = LINK_AREA;
break;
case FC_CHECKBOX:
case FC_RADIO:
link->type = LINK_CHECKBOX;
break;
case FC_SELECT:
link->type = LINK_SELECT;
break;
case FC_SUBMIT:
case FC_IMAGE:
case FC_RESET:
case FC_BUTTON:
case FC_HIDDEN:
link->type = LINK_BUTTON;
}
link->data.form_control = fc;
/* At this point, format.form might already be set but
* the form_control not registered through SP_CONTROL
* yet, therefore without fc->form set. It is always
* after the "good" last form was already processed,
* though, so we can safely just take that. */
form = fc->form;
if (!form && !list_empty(document->forms))
form = document->forms.next;
link->target = null_or_stracpy(form ? form->target : NULL);
}
link->color.background = format.style.bg;
link->color.foreground = link_is_textinput(link)
? format.style.fg : format.clink;
init_link_event_hooks(html_context, link);
document->links_sorted = 0;
return link;
}
static void
html_special_tag(struct document *document, unsigned char *t, int x, int y)
{
struct tag *tag;
int tag_len;
assert(document);
if_assert_failed return;
tag_len = strlen(t);
/* One byte is reserved for name in struct tag. */
tag = mem_alloc(sizeof(*tag) + tag_len);
if (!tag) return;
tag->x = x;
tag->y = y;
memcpy(tag->name, t, tag_len + 1);
add_to_list(document->tags, tag);
if (renderer_context.last_tag_for_newline == (struct tag *) &document->tags)
renderer_context.last_tag_for_newline = tag;
}
static void
put_chars_conv(struct html_context *html_context,
unsigned char *chars, int charslen)
{
struct part *part;
assert(html_context);
if_assert_failed return;
part = html_context->part;
assert(part && chars && charslen);
if_assert_failed return;
if (format.style.attr & AT_GRAPHICS) {
put_chars(html_context, chars, charslen);
return;
}
convert_string(renderer_context.convert_table, chars, charslen,
html_context->options->cp,
CSM_DEFAULT, NULL, (void (*)(void *, unsigned char *, int)) put_chars, html_context);
}
static inline void
put_link_number(struct html_context *html_context)
{
struct part *part = html_context->part;
unsigned char s[64];
unsigned char *fl = format.link;
unsigned char *ft = format.target;
unsigned char *fi = format.image;
struct form_control *ff = format.form;
int slen = 0;
format.link = format.target = format.image = NULL;
format.form = NULL;
s[slen++] = '[';
ulongcat(s, &slen, part->link_num, sizeof(s) - 3, 0);
s[slen++] = ']';
s[slen] = '\0';
renderer_context.nosearchable = 1;
put_chars(html_context, s, slen);
renderer_context.nosearchable = 0;
if (ff && ff->type == FC_TEXTAREA) line_break(html_context);
/* We might have ended up on a new line after the line breaking
* or putting the link number chars. */
if (part->cx == -1) part->cx = par_format.leftmargin;
format.link = fl;
format.target = ft;
format.image = fi;
format.form = ff;
}
#define assert_link_variable(old, new) \
assertm(!(old), "Old link value [%s]. New value [%s]", old, new);
static inline void
init_link_state_info(unsigned char *link, unsigned char *target,
unsigned char *image, struct form_control *form)
{
assert_link_variable(renderer_context.link_state_info.image, image);
assert_link_variable(renderer_context.link_state_info.target, target);
assert_link_variable(renderer_context.link_state_info.link, link);
renderer_context.link_state_info.link = null_or_stracpy(link);
renderer_context.link_state_info.target = null_or_stracpy(target);
renderer_context.link_state_info.image = null_or_stracpy(image);
renderer_context.link_state_info.form = form;
}
static inline void
done_link_state_info(void)
{
mem_free_if(renderer_context.link_state_info.link);
mem_free_if(renderer_context.link_state_info.target);
mem_free_if(renderer_context.link_state_info.image);
memset(&renderer_context.link_state_info, 0,
sizeof(renderer_context.link_state_info));
}
#ifdef CONFIG_UTF_8
static inline void
process_link(struct html_context *html_context, enum link_state link_state,
unsigned char *chars, int charslen, int utf8_len)
#else
static inline void
process_link(struct html_context *html_context, enum link_state link_state,
unsigned char *chars, int charslen)
#endif /* CONFIG_UTF_8 */
{
struct part *part = html_context->part;
struct link *link;
int x_offset = 0;
switch (link_state) {
case LINK_STATE_SAME: {
unsigned char *name;
if (!part->document) return;
assertm(part->document->nlinks > 0, "no link");
if_assert_failed return;
link = &part->document->links[part->document->nlinks - 1];
name = get_link_name(link);
if (name) {
unsigned char *new_name;
new_name = straconcat(name, chars, NULL);
if (new_name) {
mem_free(name);
link->data.name = new_name;
}
}
/* FIXME: Concatenating two adjectent <a> elements to a single
* link is broken since we lose the event handlers for the
* second one. OTOH simply appending them here won't fly since
* we may get here multiple times for even a single link. We
* will probably need some SP_ for creating a new link or so.
* --pasky */
break;
}
case LINK_STATE_NEW:
part->link_num++;
init_link_state_info(format.link, format.target,
format.image, format.form);
if (!part->document) return;
/* Trim leading space from the link text */
while (x_offset < charslen && chars[x_offset] <= ' ')
x_offset++;
if (x_offset) {
charslen -= x_offset;
chars += x_offset;
#ifdef CONFIG_UTF_8
utf8_len -= x_offset;
#endif /* CONFIG_UTF_8 */
}
link = new_link(html_context, chars, charslen);
if (!link) return;
break;
case LINK_STATE_NONE:
default:
INTERNAL("bad link_state %i", (int) link_state);
return;
}
/* Add new canvas positions to the link. */
#ifdef CONFIG_UTF_8
if (realloc_points(link, link->npoints + utf8_len))
#else
if (realloc_points(link, link->npoints + charslen))
#endif /* CONFIG_UTF_8 */
{
struct point *point = &link->points[link->npoints];
int x = X(part->cx) + x_offset;
int y = Y(part->cy);
#ifdef CONFIG_UTF_8
link->npoints += utf8_len;
for (; utf8_len > 0; utf8_len--, point++, x++)
#else
for (; charslen > 0; charslen--, point++, x++)
#endif /* CONFIG_UTF_8 */
{
point->x = x;
point->y = y;
}
}
}
static inline enum link_state
get_link_state(struct html_context *html_context)
{
enum link_state state;
if (!(format.link || format.image || format.form)) {
state = LINK_STATE_NONE;
} else if ((renderer_context.link_state_info.link
|| renderer_context.link_state_info.image
|| renderer_context.link_state_info.form)
&& !xstrcmp(format.link, renderer_context.link_state_info.link)
&& !xstrcmp(format.target, renderer_context.link_state_info.target)
&& !xstrcmp(format.image, renderer_context.link_state_info.image)
&& format.form == renderer_context.link_state_info.form) {
return LINK_STATE_SAME;
} else {
state = LINK_STATE_NEW;
}
done_link_state_info();
return state;
}
static inline int
html_has_non_space_chars(unsigned char *chars, int charslen)
{
int pos = 0;
while (pos < charslen)
if (!isspace(chars[pos++]))
return 1;
return 0;
}
void
put_chars(struct html_context *html_context, unsigned char *chars, int charslen)
{
enum link_state link_state;
int update_after_subscript = renderer_context.subscript;
struct part *part;
#ifdef CONFIG_UTF_8
int utf8_len;
#endif /* CONFIG_UTF_8 */
assert(html_context);
if_assert_failed return;
part = html_context->part;
assert(part);
if_assert_failed return;
assert(chars && charslen);
if_assert_failed return;
/* If we are not handling verbatim aligning and we are at the begining
* of a line trim whitespace. */
if (part->cx == -1) {
/* If we are not handling verbatim aligning trim leading
* whitespaces. */
if (!html_is_preformatted()) {
while (charslen && *chars == ' ') {
chars++;
charslen--;
}
if (charslen < 1) return;
}
part->cx = par_format.leftmargin;
}
/* For preformatted html always update 'the last tag' so we never end
* up moving tags to the wrong line (Fixes bug 324). For all other html
* it is moved only when the line being rendered carry some real
* non-whitespace content. */
if (html_is_preformatted()
|| html_has_non_space_chars(chars, charslen)) {
renderer_context.last_tag_for_newline = (struct tag *) &part->document->tags;
}
int_lower_bound(&part->box.height, part->cy + 1);
link_state = get_link_state(html_context);
if (link_state == LINK_STATE_NEW) {
int x_offset = 0;
/* Don't add inaccessible links. It seems to be caused
* by the parser putting a space char after stuff like
* <img>-tags or comments wrapped in <a>-tags. See bug
* 30 for test case. */
while (x_offset < charslen && chars[x_offset] <= ' ')
x_offset++;
/* For pure spaces reset the link state */
if (x_offset == charslen)
link_state = LINK_STATE_NONE;
else if (html_context->options->links_numbering)
put_link_number(html_context);
}
#ifdef CONFIG_UTF_8
utf8_len =
#endif /* CONFIG_UTF_8 */
set_hline(html_context, chars, charslen, link_state);
if (link_state != LINK_STATE_NONE) {
#define is_drawing_subs_or_sups() \
((format.style.attr & AT_SUBSCRIPT \
&& html_context->options->display_subs) \
|| (format.style.attr & AT_SUPERSCRIPT \
&& html_context->options->display_sups))
/* We need to update the current @link_state because <sub> and
* <sup> tags will output to the canvas using an inner
* put_chars() call which results in their process_link() call
* will ``update'' the @link_state. */
if (link_state == LINK_STATE_NEW
&& (is_drawing_subs_or_sups()
|| update_after_subscript != renderer_context.subscript)) {
link_state = get_link_state(html_context);
}
#undef is_drawing_subs_or_sups
#ifdef CONFIG_UTF_8
process_link(html_context, link_state, chars, charslen,
utf8_len);
#else
process_link(html_context, link_state, chars, charslen);
#endif /* CONFIG_UTF_8 */
}
#ifdef CONFIG_UTF_8
if (renderer_context.nowrap
&& part->cx + utf8_len > overlap(par_format))
return;
part->cx += utf8_len;
#else
if (renderer_context.nowrap
&& part->cx + charslen > overlap(par_format))
return;
part->cx += charslen;
#endif /* CONFIG_UTF_8 */
renderer_context.nobreak = 0;
if (!(html_context->options->wrap || html_is_preformatted())) {
while (part->cx > overlap(par_format)
&& part->cx > par_format.leftmargin) {
int x = split_line(html_context);
if (!x) break;
if (part->document)
align_line(html_context, part->cy - 1, 0);
renderer_context.nobreak = !!(x - 1);
}
}
assert(charslen > 0);
#ifdef CONFIG_UTF_8
part->xa += utf8_len;
#else
part->xa += charslen;
#endif /* CONFIG_UTF_8 */
int_lower_bound(&part->max_width, part->xa
+ par_format.leftmargin + par_format.rightmargin
- (chars[charslen - 1] == ' '
&& !html_is_preformatted()));
return;
}
#undef overlap
void
line_break(struct html_context *html_context)
{
struct part *part;
struct tag *tag;
assert(html_context);
if_assert_failed return;
part = html_context->part;
assert(part);
if_assert_failed return;
int_lower_bound(&part->box.width, part->cx + par_format.rightmargin);
if (renderer_context.nobreak) {
renderer_context.nobreak = 0;
part->cx = -1;
part->xa = 0;
return;
}
if (!part->document || !part->document->data) goto end;
if (!realloc_lines(part->document, part->box.height + part->cy + 1))
return;
if (part->cx > par_format.leftmargin && LEN(part->cy) > part->cx - 1
&& POS(part->cx - 1, part->cy).data == ' ') {
del_chars(html_context, part->cx - 1, part->cy);
part->cx--;
}
if (part->cx > 0) align_line(html_context, part->cy, 1);
for (tag = renderer_context.last_tag_for_newline;
tag && tag != (struct tag *) &part->document->tags;
tag = tag->prev) {
tag->x = X(0);
tag->y = Y(part->cy + 1);
}
end:
part->cy++;
part->cx = -1;
part->xa = 0;
memset(part->spaces, 0, part->spaces_len);
}
static void
html_special_form(struct part *part, struct form *form)
{
assert(part && form);
if_assert_failed return;
if (!part->document) {
done_form(form);
return;
}
if (!list_empty(part->document->forms)) {
struct form *nform;
/* Make sure the new form ``claims'' its slice of the form range
* maintained in the form_num and form_end variables. */
foreach (nform, part->document->forms) {
if (form->form_num < nform->form_num
|| nform->form_end < form->form_num)
continue;
/* First check if the form has identical form numbers.
* That should only be the case when the form being
* added is in fact the same form in which case it
* should be dropped. The fact that this can happen
* suggests that the table renderering can be confused.
* See bug 647 for a test case. */
if (nform->form_num == form->form_num
&& nform->form_end == form->form_end) {
done_form(form);
return;
}
/* The form start is inside an already added form, so
* partition the space of the existing form and get
* |old|new|. */
nform->form_end = form->form_num - 1;
assertm(nform->form_num <= nform->form_end,
"[%d:%d] [%d:%d]", nform->form_num, nform->form_end,
form->form_num, form->form_end);
break;
}
} else {
/* If it is the first form make sure it eats the whole form
* range. */
#if 0
/* Disabled because in tables the parse order may lead to a
* later form being parsed before a preceeding one causing the
* wrong order if we set it to zero. Let's hope it doesn't break
* anything else. */
form->form_num = 0;
#endif
}
add_to_list(part->document->forms, form);
}
static void
html_special_form_control(struct part *part, struct form_control *fc)
{
struct form *form;
assert(part && fc);
if_assert_failed return;
if (!part->document) {
done_form_control(fc);
mem_free(fc);
return;
}
fc->g_ctrl_num = renderer_context.g_ctrl_num++;
/* We don't want to recode hidden fields. */
if (fc->type == FC_TEXT || fc->type == FC_PASSWORD ||
fc->type == FC_TEXTAREA) {
unsigned char *dv = convert_string(renderer_context.convert_table,
fc->default_value,
strlen(fc->default_value),
part->document->options.cp,
CSM_QUERY, NULL, NULL, NULL);
if (dv) mem_free_set(&fc->default_value, dv);
}
if (list_empty(part->document->forms)) {
/* No forms encountered yet, that means a homeless form
* control. Generate a dummy form for those Flying
* Dutchmans. */
form = init_form();
form->form_num = 0;
add_to_list(part->document->forms, form);
}
/* Attach this form control to the last form encountered. */
form = part->document->forms.next;
fc->form = form;
add_to_list(form->items, fc);
}
/* Reparents form items based on position in the source. */
void
check_html_form_hierarchy(struct part *part)
{
struct document *document = part->document;
INIT_LIST_HEAD(form_controls);
struct form *form;
struct form_control *fc, *next;
if (list_empty(document->forms))
return;
/* Take out all badly placed form items. */
foreach (form, document->forms) {
assertm(form->form_num <= form->form_end,
"%p [%d : %d]", form, form->form_num, form->form_end);
foreachsafe (fc, next, form->items) {
if (form->form_num <= fc->position
&& fc->position <= form->form_end)
continue;
move_to_top_of_list(form_controls, fc);
}
}
/* Re-insert the form items the correct places. */
foreachsafe (fc, next, form_controls) {
foreach (form, document->forms) {
if (fc->position < form->form_num
|| form->form_end < fc->position)
continue;
fc->form = form;
move_to_top_of_list(form->items, fc);
break;
}
}
assert(list_empty(form_controls));
}
static inline void
color_link_lines(struct html_context *html_context)
{
struct document *document = html_context->part->document;
struct color_pair colors = INIT_COLOR_PAIR(par_format.bgcolor, 0x0);
enum color_mode color_mode = document->options.color_mode;
enum color_flags color_flags = document->options.color_flags;
int y;
for (y = 0; y < document->height; y++) {
int x;
for (x = 0; x < document->data[y].length; x++) {
struct screen_char *schar = &document->data[y].chars[x];
set_term_color(schar, &colors, color_flags, color_mode);
/* XXX: Entering hack zone! Change to clink color after
* link text has been recolored. */
if (schar->data == ':' && colors.foreground == 0x0)
colors.foreground = format.clink;
}
colors.foreground = 0x0;
}
}
static void *
html_special(struct html_context *html_context, enum html_special_type c, ...)
{
va_list l;
struct part *part;
struct document *document;
void *ret_val = NULL;
assert(html_context);
if_assert_failed return NULL;
part = html_context->part;
assert(part);
if_assert_failed return NULL;
document = part->document;
va_start(l, c);
switch (c) {
case SP_TAG:
if (document) {
unsigned char *t = va_arg(l, unsigned char *);
html_special_tag(document, t, X(part->cx), Y(part->cy));
}
break;
case SP_FORM:
{
struct form *form = va_arg(l, struct form *);
html_special_form(part, form);
break;
}
case SP_CONTROL:
{
struct form_control *fc = va_arg(l, struct form_control *);
html_special_form_control(part, fc);
break;
}
case SP_TABLE:
ret_val = renderer_context.convert_table;
break;
case SP_USED:
ret_val = (void *) (long) !!document;
break;
case SP_CACHE_CONTROL:
{
struct cache_entry *cached = renderer_context.cached;
cached->cache_mode = CACHE_MODE_NEVER;
cached->expire = 0;
break;
}
case SP_CACHE_EXPIRES:
{
time_t expires = va_arg(l, time_t);
struct cache_entry *cached = renderer_context.cached;
if (!expires || cached->cache_mode == CACHE_MODE_NEVER)
break;
timeval_from_seconds(&cached->max_age, expires);
cached->expire = 1;
break;
}
case SP_FRAMESET:
{
struct frameset_param *fsp = va_arg(l, struct frameset_param *);
struct frameset_desc *frameset_desc;
if (!fsp->parent && document->frame_desc)
break;
frameset_desc = create_frameset(fsp);
if (!fsp->parent && !document->frame_desc)
document->frame_desc = frameset_desc;
ret_val = frameset_desc;
break;
}
case SP_FRAME:
{
struct frameset_desc *parent = va_arg(l, struct frameset_desc *);
unsigned char *name = va_arg(l, unsigned char *);
unsigned char *url = va_arg(l, unsigned char *);
add_frameset_entry(parent, NULL, name, url);
break;
}
case SP_NOWRAP:
renderer_context.nowrap = !!va_arg(l, int);
break;
case SP_REFRESH:
{
unsigned long seconds = va_arg(l, unsigned long);
unsigned char *t = va_arg(l, unsigned char *);
document->refresh = init_document_refresh(t, seconds);
break;
}
case SP_COLOR_LINK_LINES:
if (document && use_document_bg_colors(&document->options))
color_link_lines(html_context);
break;
case SP_STYLESHEET:
#ifdef CONFIG_CSS
if (document) {
struct uri *uri = va_arg(l, struct uri *);
add_to_uri_list(&document->css_imports, uri);
}
#endif
break;
case SP_SCRIPT:
#ifdef CONFIG_ECMASCRIPT
if (document) {
struct uri *uri = va_arg(l, struct uri *);
add_to_uri_list(&document->ecmascript_imports, uri);
}
#endif
break;
}
va_end(l);
return ret_val;
}
void
free_table_cache(void)
{
if (table_cache) {
struct hash_item *item;
int i;
/* We do not free key here. */
foreach_hash_item (item, *table_cache, i) {
mem_free_if(item->value);
}
free_hash(table_cache);
}
table_cache = NULL;
table_cache_entries = 0;
}
struct part *
format_html_part(struct html_context *html_context,
unsigned char *start, unsigned char *end,
int align, int margin, int width, struct document *document,
int x, int y, unsigned char *head,
int link_num)
{
struct part *part;
struct html_element *html_state;
int llm = renderer_context.last_link_to_move;
struct tag *ltm = renderer_context.last_tag_to_move;
int ef = renderer_context.empty_format;
int lm = html_context->margin;
/* Hash creation if needed. */
if (!table_cache) {
table_cache = init_hash(8, &strhash);
} else if (!document) {
/* Search for cached entry. */
struct table_cache_entry_key key;
struct hash_item *item;
/* Clear key to prevent potential alignment problem
* when keys are compared. */
memset(&key, 0, sizeof(key));
key.start = start;
key.end = end;
key.align = align;
key.margin = margin;
key.width = width;
key.x = x;
key.link_num = link_num;
item = get_hash_item(table_cache,
(unsigned char *) &key,
sizeof(key));
if (item) { /* We found it in cache, so just copy and return. */
part = mem_alloc(sizeof(*part));
if (part) {
copy_struct(part, &((struct table_cache_entry *)
item->value)->part);
return part;
}
}
}
assertm(y >= 0, "format_html_part: y == %d", y);
if_assert_failed return NULL;
if (document) {
struct node *node = mem_alloc(sizeof(*node));
if (node) {
int node_width = !html_context->table_level ? INT_MAX : width;
set_box(&node->box, x, y, node_width, 1);
add_to_list(document->nodes, node);
}
renderer_context.last_link_to_move = document->nlinks;
renderer_context.last_tag_to_move = (struct tag *) &document->tags;
renderer_context.last_tag_for_newline = (struct tag *) &document->tags;
} else {
renderer_context.last_link_to_move = 0;
renderer_context.last_tag_to_move = (struct tag *) NULL;
renderer_context.last_tag_for_newline = (struct tag *) NULL;
}
html_context->margin = margin;
renderer_context.empty_format = !document;
done_link_state_info();
renderer_context.nobreak = 1;
part = mem_calloc(1, sizeof(*part));
if (!part) goto ret;
part->document = document;
part->box.x = x;
part->box.y = y;
part->cx = -1;
part->cy = 0;
part->link_num = link_num;
html_state = init_html_parser_state(html_context, ELEMENT_IMMORTAL, align, margin, width);
parse_html(start, end, part, head, html_context);
done_html_parser_state(html_context, html_state);
int_lower_bound(&part->max_width, part->box.width);
renderer_context.nobreak = 0;
done_link_state_info();
mem_free_if(part->spaces);
if (document) {
struct node *node = document->nodes.next;
node->box.height = y - node->box.y + part->box.height;
}
ret:
renderer_context.last_link_to_move = llm;
renderer_context.last_tag_to_move = ltm;
renderer_context.empty_format = ef;
html_context->margin = lm;
if (html_context->table_level > 1 && !document
&& table_cache
&& table_cache_entries < MAX_TABLE_CACHE_ENTRIES) {
/* Create a new entry. */
/* Clear memory to prevent bad key comparaison due to alignment
* of key fields. */
struct table_cache_entry *tce = mem_calloc(1, sizeof(*tce));
/* A goto is used here to prevent a test or code
* redundancy. */
if (!tce) goto end;
tce->key.start = start;
tce->key.end = end;
tce->key.align = align;
tce->key.margin = margin;
tce->key.width = width;
tce->key.x = x;
tce->key.link_num = link_num;
copy_struct(&tce->part, part);
if (!add_hash_item(table_cache,
(unsigned char *) &tce->key,
sizeof(tce->key), tce)) {
mem_free(tce);
} else {
table_cache_entries++;
}
}
end:
return part;
}
void
render_html_document(struct cache_entry *cached, struct document *document,
struct string *buffer)
{
struct html_context *html_context;
struct part *part;
unsigned char *start;
unsigned char *end;
struct string title;
struct string head;
int i;
assert(cached && document);
if_assert_failed return;
if (!init_string(&head)) return;
if (cached->head) add_to_string(&head, cached->head);
start = buffer->source;
end = buffer->source + buffer->length;
html_context = init_html_parser(cached->uri, &document->options,
start, end, &head, &title,
put_chars_conv, line_break,
html_special);
if (!html_context) return;
renderer_context.g_ctrl_num = 0;
renderer_context.cached = cached;
renderer_context.convert_table = get_convert_table(head.source,
document->options.cp,
document->options.assume_cp,
&document->cp,
&document->cp_status,
document->options.hard_assume);
#ifdef CONFIG_UTF_8
html_context->options->utf8 = is_cp_special(document->options.cp);
#endif /* CONFIG_UTF_8 */
if (title.length) {
document->title = convert_string(renderer_context.convert_table,
title.source, title.length,
document->options.cp,
CSM_DEFAULT, NULL, NULL, NULL);
}
done_string(&title);
part = format_html_part(html_context, start, end, par_format.align,
par_format.leftmargin,
document->options.box.width, document,
0, 0, head.source, 1);
/* Drop empty allocated lines at end of document if any
* and adjust document height. */
for (i = document->height - 1; i >= 0 ; i--) {
if (!document->data[i].length) {
mem_free_if(document->data[i].chars);
document->height--;
} else break;
}
/* Calculate document width. */
document->width = 0;
for (i = 0; i < document->height; i++)
int_lower_bound(&document->width, document->data[i].length);
#if 1
document->options.needs_width = 1;
#else
/* FIXME: This needs more tuning since if we are centering stuff it
* does not work. */
document->options.needs_width =
(document->width + (document->options.margin
>= document->options.width));
#endif
document->bgcolor = par_format.bgcolor;
done_html_parser(html_context);
/* Drop forms which has been serving as a placeholder for form items
* added in the wrong order due to the ordering of table rendering. */
{
struct form *form;
foreach (form, document->forms) {
if (form->form_num)
continue;
if (list_empty(form->items))
done_form(form);
break;
}
}
/* @part was residing in html_context so it has to stay alive until
* done_html_parser(). */
done_string(&head);
mem_free_if(part);
#if 0 /* debug purpose */
{
FILE *f = fopen("forms", "ab");
struct form_control *form;
unsigned char *qq;
fprintf(f,"FORM:\n");
foreach (form, document->forms) {
fprintf(f, "g=%d f=%d c=%d t:%d\n",
form->g_ctrl_num, form->form_num,
form->ctrl_num, form->type);
}
fprintf(f,"fragment: \n");
for (qq = start; qq < end; qq++) fprintf(f, "%c", *qq);
fprintf(f,"----------\n\n");
fclose(f);
}
#endif
}
int
find_tag(struct document *document, unsigned char *name, int namelen)
{
struct tag *tag;
foreach (tag, document->tags)
if (!strlcasecmp(tag->name, -1, name, namelen))
return tag->y;
return -1;
}