2005-09-15 09:58:31 -04:00
|
|
|
/* DOM document renderer */
|
|
|
|
|
|
|
|
#ifdef HAVE_CONFIG_H
|
|
|
|
#include "config.h"
|
|
|
|
#endif
|
|
|
|
|
2005-12-25 09:16:21 -05:00
|
|
|
#include <sys/types.h> /* FreeBSD needs this before regex.h */
|
|
|
|
#ifdef HAVE_REGEX_H
|
|
|
|
#include <regex.h>
|
|
|
|
#endif
|
2005-09-15 09:58:31 -04:00
|
|
|
#include <string.h>
|
|
|
|
|
|
|
|
#include "elinks.h"
|
|
|
|
|
|
|
|
#include "bookmarks/bookmarks.h" /* get_bookmark() */
|
|
|
|
#include "cache/cache.h"
|
|
|
|
#include "document/css/css.h"
|
|
|
|
#include "document/css/parser.h"
|
|
|
|
#include "document/css/property.h"
|
|
|
|
#include "document/css/stylesheet.h"
|
|
|
|
#include "document/docdata.h"
|
|
|
|
#include "document/document.h"
|
|
|
|
#include "document/dom/renderer.h"
|
|
|
|
#include "document/renderer.h"
|
2006-01-15 23:12:34 -05:00
|
|
|
#include "dom/configuration.h"
|
2005-12-28 08:05:14 -05:00
|
|
|
#include "dom/scanner.h"
|
|
|
|
#include "dom/sgml/parser.h"
|
2006-01-25 17:16:30 -05:00
|
|
|
#include "dom/sgml/html/html.h"
|
2006-01-07 21:44:23 -05:00
|
|
|
#include "dom/sgml/rss/rss.h"
|
2005-12-28 08:05:14 -05:00
|
|
|
#include "dom/node.h"
|
|
|
|
#include "dom/stack.h"
|
2005-09-15 09:58:31 -04:00
|
|
|
#include "intl/charsets.h"
|
|
|
|
#include "globhist/globhist.h" /* get_global_history_item() */
|
|
|
|
#include "protocol/uri.h"
|
|
|
|
#include "terminal/draw.h"
|
|
|
|
#include "util/box.h"
|
|
|
|
#include "util/error.h"
|
|
|
|
#include "util/memory.h"
|
|
|
|
#include "util/snprintf.h"
|
|
|
|
#include "util/string.h"
|
|
|
|
|
|
|
|
|
|
|
|
struct dom_renderer {
|
2006-01-25 17:16:30 -05:00
|
|
|
enum sgml_document_type doctype;
|
2005-09-15 09:58:31 -04:00
|
|
|
struct document *document;
|
|
|
|
|
|
|
|
struct conv_table *convert_table;
|
|
|
|
enum convert_string_mode convert_mode;
|
|
|
|
|
2006-01-25 17:16:30 -05:00
|
|
|
struct uri *base_uri;
|
|
|
|
|
2005-09-15 09:58:31 -04:00
|
|
|
unsigned char *source;
|
|
|
|
unsigned char *end;
|
|
|
|
|
|
|
|
unsigned char *position;
|
|
|
|
int canvas_x, canvas_y;
|
|
|
|
|
2005-12-25 09:16:21 -05:00
|
|
|
#ifdef HAVE_REGEX_H
|
|
|
|
regex_t url_regex;
|
|
|
|
unsigned int find_url:1;
|
|
|
|
#endif
|
2005-09-15 09:58:31 -04:00
|
|
|
struct screen_char styles[DOM_NODES];
|
2006-01-07 21:44:23 -05:00
|
|
|
|
|
|
|
/* RSS renderer variables */
|
|
|
|
struct dom_node *channel;
|
|
|
|
struct dom_node_list *items;
|
|
|
|
struct dom_node *item;
|
|
|
|
struct dom_node *node;
|
|
|
|
struct dom_string text;
|
2005-09-15 09:58:31 -04:00
|
|
|
};
|
|
|
|
|
2005-12-25 10:22:20 -05:00
|
|
|
/* Extended regular expression used to spot URLs in plain text. The pieces
 * are, in order: the file:// alternative, scheme plus host name, top level
 * domain with optional port, and the optional path. */
#define URL_REGEX \
	"(file://" \
	"|((f|ht|nt)tp(s)?|smb)://[[:alnum:]]+([-@:.]?[[:alnum:]])*" \
	"\\.[[:alpha:]]{2,4}(:[[:digit:]]+)?)" \
	"(/(%[[:xdigit:]]{2}|[-_~&=;?.a-z0-9])*)*"

/* Flags passed to regcomp() together with URL_REGEX. */
#define URL_REGFLAGS (REG_ICASE | REG_EXTENDED)
|
2005-09-15 09:58:31 -04:00
|
|
|
|
|
|
|
static void
|
|
|
|
init_template(struct screen_char *template, struct document_options *options,
|
2006-01-04 12:08:48 -05:00
|
|
|
color_T background, color_T foreground, enum screen_char_attr attr)
|
2005-09-15 09:58:31 -04:00
|
|
|
{
|
|
|
|
struct color_pair colors = INIT_COLOR_PAIR(background, foreground);
|
|
|
|
|
2006-01-03 18:50:40 -05:00
|
|
|
template->attr = attr;
|
2005-09-15 09:58:31 -04:00
|
|
|
template->data = ' ';
|
|
|
|
set_term_color(template, &colors,
|
|
|
|
options->color_flags, options->color_mode);
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline struct css_property *
|
|
|
|
get_css_property(struct list_head *list, enum css_property_type type)
|
|
|
|
{
|
|
|
|
struct css_property *property;
|
|
|
|
|
|
|
|
foreach (property, *list)
|
|
|
|
if (property->type == type)
|
|
|
|
return property;
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/* Checks the user CSS for properties for each DOM node type name */
|
|
|
|
static inline void
|
|
|
|
init_dom_renderer(struct dom_renderer *renderer, struct document *document,
|
2005-11-15 06:11:48 -05:00
|
|
|
struct string *buffer, struct conv_table *convert_table)
|
2005-09-15 09:58:31 -04:00
|
|
|
{
|
|
|
|
enum dom_node_type type;
|
|
|
|
struct css_stylesheet *css = &default_stylesheet;
|
|
|
|
|
|
|
|
memset(renderer, 0, sizeof(*renderer));
|
|
|
|
|
|
|
|
renderer->document = document;
|
|
|
|
renderer->convert_table = convert_table;
|
|
|
|
renderer->convert_mode = document->options.plain ? CSM_NONE : CSM_DEFAULT;
|
|
|
|
renderer->source = buffer->source;
|
|
|
|
renderer->end = buffer->source + buffer->length;
|
|
|
|
renderer->position = renderer->source;
|
2006-01-25 17:16:30 -05:00
|
|
|
renderer->base_uri = get_uri_reference(document->uri);
|
2005-09-15 09:58:31 -04:00
|
|
|
|
2005-12-25 09:16:21 -05:00
|
|
|
#ifdef HAVE_REGEX_H
|
|
|
|
if (renderer->document->options.plain_display_links) {
|
|
|
|
if (regcomp(&renderer->url_regex, URL_REGEX, URL_REGFLAGS)) {
|
|
|
|
regfree(&renderer->url_regex);
|
|
|
|
} else {
|
|
|
|
renderer->find_url = 1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
2005-09-15 09:58:31 -04:00
|
|
|
for (type = 0; type < DOM_NODES; type++) {
|
|
|
|
struct screen_char *template = &renderer->styles[type];
|
|
|
|
color_T background = document->options.default_bg;
|
|
|
|
color_T foreground = document->options.default_fg;
|
2006-01-03 18:50:40 -05:00
|
|
|
enum screen_char_attr attr = 0;
|
2005-09-15 09:58:31 -04:00
|
|
|
static int i_want_struct_module_for_dom;
|
|
|
|
|
2005-12-10 13:28:37 -05:00
|
|
|
struct dom_string *name = get_dom_node_type_name(type);
|
2005-09-15 09:58:31 -04:00
|
|
|
struct css_selector *selector = NULL;
|
|
|
|
|
|
|
|
if (!i_want_struct_module_for_dom) {
|
|
|
|
static const unsigned char default_colors[] =
|
|
|
|
"document { color: yellow } "
|
|
|
|
"element { color: lightgreen } "
|
|
|
|
"entity-reference { color: red } "
|
|
|
|
"proc-instruction { color: red } "
|
|
|
|
"attribute { color: magenta } "
|
2005-12-26 13:56:07 -05:00
|
|
|
"comment { color: aqua } "
|
|
|
|
"cdata-section { color: orange2 } ";
|
2005-09-15 09:58:31 -04:00
|
|
|
unsigned char *styles = (unsigned char *) default_colors;
|
|
|
|
|
|
|
|
i_want_struct_module_for_dom = 1;
|
|
|
|
/* When someone will get here earlier than at 4am,
|
|
|
|
* this will be done in some init function, perhaps
|
|
|
|
* not overriding the user's default stylesheet. */
|
|
|
|
css_parse_stylesheet(css, NULL, styles, styles + sizeof(default_colors) + 1);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (name)
|
2005-12-10 13:28:37 -05:00
|
|
|
if (is_dom_string_set(name))
|
2005-09-15 09:58:31 -04:00
|
|
|
selector = find_css_selector(&css->selectors,
|
|
|
|
CST_ELEMENT, CSR_ROOT,
|
2005-12-10 13:28:37 -05:00
|
|
|
name->string, name->length);
|
2005-09-15 09:58:31 -04:00
|
|
|
|
|
|
|
if (selector) {
|
|
|
|
struct list_head *properties = &selector->properties;
|
|
|
|
struct css_property *property;
|
|
|
|
|
|
|
|
property = get_css_property(properties, CSS_PT_BACKGROUND_COLOR);
|
|
|
|
if (!property)
|
|
|
|
property = get_css_property(properties, CSS_PT_BACKGROUND);
|
|
|
|
|
|
|
|
if (property && property->value_type == CSS_VT_COLOR)
|
|
|
|
background = property->value.color;
|
|
|
|
|
|
|
|
property = get_css_property(properties, CSS_PT_COLOR);
|
|
|
|
if (property) foreground = property->value.color;
|
2006-01-03 18:50:40 -05:00
|
|
|
|
|
|
|
property = get_css_property(properties, CSS_PT_FONT_WEIGHT);
|
|
|
|
if (property) {
|
|
|
|
if (property->value.font_attribute.add & AT_BOLD)
|
|
|
|
attr |= SCREEN_ATTR_BOLD;
|
|
|
|
}
|
|
|
|
|
|
|
|
property = get_css_property(properties, CSS_PT_FONT_STYLE);
|
|
|
|
if (property) {
|
|
|
|
if (property->value.font_attribute.add & AT_UNDERLINE)
|
|
|
|
attr |= SCREEN_ATTR_UNDERLINE;
|
|
|
|
|
|
|
|
if (property->value.font_attribute.add & AT_ITALIC)
|
|
|
|
attr |= SCREEN_ATTR_ITALIC;
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
property = get_css_property(properties, CSS_PT_TEXT_DECORATION);
|
|
|
|
if (property) {
|
|
|
|
if (property->value.font_attribute.add & AT_UNDERLINE)
|
|
|
|
attr |= SCREEN_ATTR_UNDERLINE;
|
|
|
|
}
|
2005-09-15 09:58:31 -04:00
|
|
|
}
|
|
|
|
|
2006-01-03 18:50:40 -05:00
|
|
|
init_template(template, &document->options, background, foreground, attr);
|
2005-09-15 09:58:31 -04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/* Document maintenance */
|
|
|
|
|
|
|
|
static struct screen_char *
|
|
|
|
realloc_line(struct document *document, int x, int y)
|
|
|
|
{
|
|
|
|
struct line *line = realloc_lines(document, y);
|
|
|
|
|
|
|
|
if (!line) return NULL;
|
|
|
|
|
|
|
|
if (x > line->length) {
|
|
|
|
if (!ALIGN_LINE(&line->chars, line->length, x))
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
for (; line->length < x; line->length++) {
|
|
|
|
line->chars[line->length].data = ' ';
|
|
|
|
}
|
|
|
|
|
|
|
|
if (x > document->width) document->width = x;
|
|
|
|
}
|
|
|
|
|
|
|
|
return line->chars;
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct node *
|
|
|
|
add_search_node(struct dom_renderer *renderer, int width)
|
|
|
|
{
|
|
|
|
struct node *node = mem_alloc(sizeof(*node));
|
|
|
|
|
|
|
|
if (node) {
|
|
|
|
set_box(&node->box, renderer->canvas_x, renderer->canvas_y,
|
|
|
|
width, 1);
|
|
|
|
add_to_list(renderer->document->nodes, node);
|
|
|
|
}
|
|
|
|
|
|
|
|
return node;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Shorthands for the renderer's canvas position. X() and Y() expand to
 * lvalues; POS() is the address of the screen character at the current
 * position and WIDTH() is the current column plus @add. */
#define X(renderer)		((renderer)->canvas_x)
#define Y(renderer)		((renderer)->canvas_y)
#define POS(renderer)		(&(renderer)->document->data[Y(renderer)].chars[X(renderer)])
#define WIDTH(renderer, add)	(X(renderer) + (add))
|
|
|
|
|
|
|
|
static void
|
|
|
|
render_dom_line(struct dom_renderer *renderer, struct screen_char *template,
|
|
|
|
unsigned char *string, int length)
|
|
|
|
{
|
|
|
|
struct document *document = renderer->document;
|
|
|
|
struct conv_table *convert = renderer->convert_table;
|
|
|
|
enum convert_string_mode mode = renderer->convert_mode;
|
|
|
|
int x;
|
|
|
|
|
|
|
|
assert(renderer && template && string && length);
|
|
|
|
|
|
|
|
string = convert_string(convert, string, length, document->options.cp,
|
|
|
|
mode, &length, NULL, NULL);
|
|
|
|
if (!string) return;
|
|
|
|
|
|
|
|
if (!realloc_line(document, WIDTH(renderer, length), Y(renderer))) {
|
|
|
|
mem_free(string);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
add_search_node(renderer, length);
|
|
|
|
|
|
|
|
for (x = 0; x < length; x++, renderer->canvas_x++) {
|
|
|
|
unsigned char data = string[x];
|
|
|
|
|
|
|
|
/* This is mostly to be able to break out so the indentation
|
|
|
|
* level won't get to high. */
|
|
|
|
switch (data) {
|
|
|
|
case ASCII_TAB:
|
|
|
|
{
|
|
|
|
int tab_width = 7 - (X(renderer) & 7);
|
|
|
|
int width = WIDTH(renderer, length - x + tab_width);
|
|
|
|
|
|
|
|
template->data = ' ';
|
|
|
|
|
|
|
|
if (!realloc_line(document, width, Y(renderer)))
|
|
|
|
break;
|
|
|
|
|
|
|
|
/* Only loop over the expanded tab chars and let the
|
|
|
|
* ``main loop'' add the actual tab char. */
|
|
|
|
for (; tab_width-- > 0; renderer->canvas_x++)
|
|
|
|
copy_screen_chars(POS(renderer), template, 1);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default:
|
|
|
|
template->data = isscreensafe(data) ? data : '.';
|
|
|
|
}
|
|
|
|
|
|
|
|
copy_screen_chars(POS(renderer), template, 1);
|
|
|
|
}
|
|
|
|
|
|
|
|
mem_free(string);
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline unsigned char *
|
|
|
|
split_dom_line(unsigned char *line, int length, int *linelen)
|
|
|
|
{
|
|
|
|
unsigned char *end = line + length;
|
|
|
|
unsigned char *pos;
|
|
|
|
|
|
|
|
/* End of line detection.
|
|
|
|
* We handle \r, \r\n and \n types here. */
|
|
|
|
for (pos = line; pos < end; pos++) {
|
|
|
|
int step = 0;
|
|
|
|
|
|
|
|
if (pos[step] == ASCII_CR)
|
|
|
|
step++;
|
|
|
|
|
|
|
|
if (pos[step] == ASCII_LF)
|
|
|
|
step++;
|
|
|
|
|
|
|
|
if (step) {
|
|
|
|
*linelen = pos - line;
|
|
|
|
return pos + step;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
*linelen = length;
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
render_dom_text(struct dom_renderer *renderer, struct screen_char *template,
|
|
|
|
unsigned char *string, int length)
|
|
|
|
{
|
|
|
|
int linelen;
|
|
|
|
|
|
|
|
for (; length > 0; string += linelen, length -= linelen) {
|
|
|
|
unsigned char *newline = split_dom_line(string, length, &linelen);
|
|
|
|
|
|
|
|
if (linelen)
|
|
|
|
render_dom_line(renderer, template, string, linelen);
|
|
|
|
|
|
|
|
if (newline) {
|
|
|
|
renderer->canvas_y++;
|
|
|
|
renderer->canvas_x = 0;
|
|
|
|
linelen = newline - string;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Grows the link array of @doc, which currently holds (doc)->nlinks links,
 * so that it has room for @size links. */
#define realloc_document_links(doc, size) \
	ALIGN_LINK(&(doc)->links, (doc)->nlinks, size)
|
|
|
|
|
|
|
|
static inline struct link *
|
2006-01-07 21:44:23 -05:00
|
|
|
add_dom_link(struct dom_renderer *renderer, unsigned char *string, int length,
|
|
|
|
unsigned char *uristring, int urilength)
|
2005-09-15 09:58:31 -04:00
|
|
|
{
|
|
|
|
struct document *document = renderer->document;
|
|
|
|
int x = renderer->canvas_x;
|
|
|
|
int y = renderer->canvas_y;
|
|
|
|
unsigned char *where;
|
|
|
|
struct link *link;
|
|
|
|
struct point *point;
|
|
|
|
struct screen_char template;
|
|
|
|
color_T fgcolor;
|
|
|
|
|
|
|
|
if (!realloc_document_links(document, document->nlinks + 1))
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
link = &document->links[document->nlinks];
|
|
|
|
|
|
|
|
if (!realloc_points(link, length))
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
uristring = convert_string(renderer->convert_table,
|
2006-01-07 21:44:23 -05:00
|
|
|
uristring, urilength, document->options.cp,
|
2005-09-15 09:58:31 -04:00
|
|
|
CSM_DEFAULT, NULL, NULL, NULL);
|
|
|
|
if (!uristring) return NULL;
|
|
|
|
|
2006-01-25 17:16:30 -05:00
|
|
|
where = join_urls(renderer->base_uri, uristring);
|
2005-09-15 09:58:31 -04:00
|
|
|
|
|
|
|
mem_free(uristring);
|
|
|
|
|
|
|
|
if (!where)
|
|
|
|
return NULL;
|
|
|
|
#ifdef CONFIG_GLOBHIST
|
|
|
|
else if (get_global_history_item(where))
|
|
|
|
fgcolor = document->options.default_vlink;
|
|
|
|
#endif
|
|
|
|
#ifdef CONFIG_BOOKMARKS
|
|
|
|
else if (get_bookmark(where))
|
|
|
|
fgcolor = document->options.default_bookmark_link;
|
|
|
|
#endif
|
|
|
|
else
|
|
|
|
fgcolor = document->options.default_link;
|
|
|
|
|
|
|
|
link->npoints = length;
|
|
|
|
link->type = LINK_HYPERTEXT;
|
|
|
|
link->where = where;
|
|
|
|
link->color.background = document->options.default_bg;
|
|
|
|
link->color.foreground = fgcolor;
|
|
|
|
link->number = document->nlinks;
|
|
|
|
|
|
|
|
init_template(&template, &document->options,
|
2006-01-03 18:50:40 -05:00
|
|
|
link->color.background, link->color.foreground, 0);
|
2005-09-15 09:58:31 -04:00
|
|
|
|
|
|
|
render_dom_text(renderer, &template, string, length);
|
|
|
|
|
|
|
|
for (point = link->points; length > 0; length--, point++, x++) {
|
|
|
|
point->x = x;
|
|
|
|
point->y = y;
|
|
|
|
}
|
|
|
|
|
|
|
|
document->nlinks++;
|
2006-01-28 08:13:41 -05:00
|
|
|
document->links_sorted = 0;
|
2005-09-15 09:58:31 -04:00
|
|
|
|
|
|
|
return link;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/* DOM Source Renderer */
|
|
|
|
|
|
|
|
/* True when the @len bytes starting at @str lie completely inside the
 * renderer's source buffer. */
#define check_dom_node_source(renderer, str, len) \
	((str) >= (renderer)->source && (renderer)->end >= (str) + (len))

/* Asserts the above and reports both ranges if it does not hold. */
#define assert_source(renderer, str, len) \
	assertm(check_dom_node_source(renderer, str, len), \
		"renderer[%p : %p] str[%p : %p]", \
		(renderer)->source, (renderer)->end, (str), (str) + (len))
|
|
|
|
|
|
|
|
static inline void
|
|
|
|
render_dom_flush(struct dom_renderer *renderer, unsigned char *string)
|
|
|
|
{
|
|
|
|
struct screen_char *template = &renderer->styles[DOM_NODE_TEXT];
|
|
|
|
int length = string - renderer->position;
|
|
|
|
|
|
|
|
assert_source(renderer, renderer->position, 0);
|
|
|
|
assert_source(renderer, string, 0);
|
|
|
|
|
|
|
|
if (length <= 0) return;
|
|
|
|
render_dom_text(renderer, template, renderer->position, length);
|
|
|
|
renderer->position = string;
|
|
|
|
|
|
|
|
assert_source(renderer, renderer->position, 0);
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void
|
|
|
|
render_dom_node_text(struct dom_renderer *renderer, struct screen_char *template,
|
|
|
|
struct dom_node *node)
|
|
|
|
{
|
2005-12-10 12:37:47 -05:00
|
|
|
unsigned char *string = node->string.string;
|
|
|
|
int length = node->string.length;
|
2005-09-15 09:58:31 -04:00
|
|
|
|
|
|
|
if (node->type == DOM_NODE_ENTITY_REFERENCE) {
|
|
|
|
string -= 1;
|
|
|
|
length += 2;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (check_dom_node_source(renderer, string, length)) {
|
|
|
|
render_dom_flush(renderer, string);
|
|
|
|
renderer->position = string + length;
|
|
|
|
assert_source(renderer, renderer->position, 0);
|
|
|
|
}
|
|
|
|
|
|
|
|
render_dom_text(renderer, template, string, length);
|
|
|
|
}
|
|
|
|
|
2005-12-25 09:16:21 -05:00
|
|
|
#ifdef HAVE_REGEX_H
/* Renders the string of @node like render_dom_node_text() does, but turns
 * every part of it that matches the renderer's URL regex into a link.
 *
 * regexec() works on NUL terminated strings while the node string is given
 * by pointer and length, so the matching is done on a copy made with
 * memacpy(). If that copy can not be allocated the text is rendered
 * without links rather than running the regex over the unterminated
 * string. */
static inline void
render_dom_node_enhanced_text(struct dom_renderer *renderer, struct dom_node *node)
{
	regex_t *regex = &renderer->url_regex;
	regmatch_t regmatch;
	unsigned char *string = node->string.string;
	int length = node->string.length;
	struct screen_char *template = &renderer->styles[node->type];
	unsigned char *alloc_string;

	if (check_dom_node_source(renderer, string, length)) {
		render_dom_flush(renderer, string);
		renderer->position = string + length;
		assert_source(renderer, renderer->position, 0);
	}

	alloc_string = memacpy(string, length);
	if (!alloc_string) {
		if (length > 0)
			render_dom_text(renderer, template, string, length);
		return;
	}

	string = alloc_string;

	while (length > 0 && !regexec(regex, string, 1, &regmatch, 0)) {
		int matchlen = regmatch.rm_eo - regmatch.rm_so;
		int offset = regmatch.rm_so;

		/* Stop on empty matches, which would never advance, and on
		 * matches reaching outside of what is left of the text. */
		if (!matchlen || offset < 0 || regmatch.rm_eo > length)
			break;

		/* The text in front of the URL is rendered as is. */
		if (offset > 0)
			render_dom_text(renderer, template, string, offset);

		string += offset;
		length -= offset;

		/* The matched text is both the link text and its target. */
		add_dom_link(renderer, string, matchlen, string, matchlen);

		length -= matchlen;
		string += matchlen;
	}

	/* Whatever follows the last URL. */
	if (length > 0)
		render_dom_text(renderer, template, string, length);

	mem_free(alloc_string);
}
#endif
|
|
|
|
|
2006-01-29 06:11:35 -05:00
|
|
|
static enum dom_stack_code
|
2005-11-15 04:43:52 -05:00
|
|
|
render_dom_node_source(struct dom_stack *stack, struct dom_node *node, void *data)
|
2005-09-15 09:58:31 -04:00
|
|
|
{
|
2005-12-20 19:36:47 -05:00
|
|
|
struct dom_renderer *renderer = stack->current->data;
|
2005-09-15 09:58:31 -04:00
|
|
|
|
|
|
|
assert(node && renderer && renderer->document);
|
|
|
|
|
2005-12-25 09:16:21 -05:00
|
|
|
#ifdef HAVE_REGEX_H
|
|
|
|
if (renderer->find_url
|
|
|
|
&& (node->type == DOM_NODE_TEXT
|
|
|
|
|| node->type == DOM_NODE_CDATA_SECTION
|
|
|
|
|| node->type == DOM_NODE_COMMENT)) {
|
|
|
|
render_dom_node_enhanced_text(renderer, node);
|
2006-01-15 18:55:58 -05:00
|
|
|
} else
|
2005-12-25 09:16:21 -05:00
|
|
|
#endif
|
2006-01-15 18:55:58 -05:00
|
|
|
render_dom_node_text(renderer, &renderer->styles[node->type], node);
|
2005-12-25 09:16:21 -05:00
|
|
|
|
2006-01-15 18:55:58 -05:00
|
|
|
return DOM_STACK_CODE_OK;
|
2005-09-15 09:58:31 -04:00
|
|
|
}
|
|
|
|
|
2005-12-19 21:25:51 -05:00
|
|
|
/* This callback is also used for rendering processing instruction nodes. */
|
2006-01-15 18:55:58 -05:00
|
|
|
static enum dom_stack_code
|
2005-11-15 04:43:52 -05:00
|
|
|
render_dom_element_source(struct dom_stack *stack, struct dom_node *node, void *data)
|
2005-09-15 09:58:31 -04:00
|
|
|
{
|
2005-12-20 19:36:47 -05:00
|
|
|
struct dom_renderer *renderer = stack->current->data;
|
2005-09-15 09:58:31 -04:00
|
|
|
|
|
|
|
assert(node && renderer && renderer->document);
|
|
|
|
|
|
|
|
render_dom_node_text(renderer, &renderer->styles[node->type], node);
|
2006-01-15 18:55:58 -05:00
|
|
|
|
|
|
|
return DOM_STACK_CODE_OK;
|
2005-09-15 09:58:31 -04:00
|
|
|
}
|
|
|
|
|
2006-01-15 18:55:58 -05:00
|
|
|
enum dom_stack_code
|
2005-12-05 13:33:15 -05:00
|
|
|
render_dom_element_end_source(struct dom_stack *stack, struct dom_node *node, void *data)
|
|
|
|
{
|
2005-12-20 19:36:47 -05:00
|
|
|
struct dom_renderer *renderer = stack->current->data;
|
2005-12-20 22:38:04 -05:00
|
|
|
struct dom_stack_state *state = get_dom_stack_top(stack);
|
2005-12-26 23:59:12 -05:00
|
|
|
struct sgml_parser_state *pstate = get_dom_stack_state_data(stack->contexts[0], state);
|
2005-12-28 08:05:14 -05:00
|
|
|
struct dom_scanner_token *token = &pstate->end_token;
|
2005-12-28 10:23:36 -05:00
|
|
|
unsigned char *string = token->string.string;
|
|
|
|
int length = token->string.length;
|
2005-12-05 13:33:15 -05:00
|
|
|
|
|
|
|
assert(node && renderer && renderer->document);
|
|
|
|
|
|
|
|
if (!string || !length)
|
2006-01-15 18:55:58 -05:00
|
|
|
return DOM_STACK_CODE_OK;
|
2005-12-05 13:33:15 -05:00
|
|
|
|
|
|
|
if (check_dom_node_source(renderer, string, length)) {
|
|
|
|
render_dom_flush(renderer, string);
|
|
|
|
renderer->position = string + length;
|
|
|
|
assert_source(renderer, renderer->position, 0);
|
|
|
|
}
|
|
|
|
|
|
|
|
render_dom_text(renderer, &renderer->styles[node->type], string, length);
|
2006-01-15 18:55:58 -05:00
|
|
|
|
|
|
|
return DOM_STACK_CODE_OK;
|
2005-12-05 13:33:15 -05:00
|
|
|
}
|
|
|
|
|
2006-01-25 17:16:30 -05:00
|
|
|
static void
|
|
|
|
set_base_uri(struct dom_renderer *renderer, unsigned char *value, size_t valuelen)
|
|
|
|
{
|
|
|
|
unsigned char *href = memacpy(value, valuelen);
|
|
|
|
unsigned char *uristring;
|
|
|
|
struct uri *uri;
|
|
|
|
|
|
|
|
if (!href) return;
|
|
|
|
uristring = join_urls(renderer->base_uri, href);
|
|
|
|
mem_free(href);
|
|
|
|
|
|
|
|
if (!uristring) return;
|
|
|
|
uri = get_uri(uristring, 0);
|
|
|
|
mem_free(uristring);
|
|
|
|
|
|
|
|
if (!uri) return;
|
|
|
|
|
|
|
|
done_uri(renderer->base_uri);
|
|
|
|
renderer->base_uri = uri;
|
|
|
|
}
|
|
|
|
|
2006-01-15 18:55:58 -05:00
|
|
|
enum dom_stack_code
|
2005-11-15 04:43:52 -05:00
|
|
|
render_dom_attribute_source(struct dom_stack *stack, struct dom_node *node, void *data)
|
2005-09-15 09:58:31 -04:00
|
|
|
{
|
2005-12-20 19:36:47 -05:00
|
|
|
struct dom_renderer *renderer = stack->current->data;
|
2005-09-15 09:58:31 -04:00
|
|
|
struct screen_char *template = &renderer->styles[node->type];
|
|
|
|
|
|
|
|
assert(node && renderer->document);
|
|
|
|
|
|
|
|
render_dom_node_text(renderer, template, node);
|
|
|
|
|
2005-12-10 12:42:54 -05:00
|
|
|
if (is_dom_string_set(&node->data.attribute.value)) {
|
2005-09-15 09:58:31 -04:00
|
|
|
int quoted = node->data.attribute.quoted == 1;
|
2005-12-10 12:42:54 -05:00
|
|
|
unsigned char *value = node->data.attribute.value.string - quoted;
|
|
|
|
int valuelen = node->data.attribute.value.length + quoted * 2;
|
2005-09-15 09:58:31 -04:00
|
|
|
|
|
|
|
if (check_dom_node_source(renderer, value, 0)) {
|
|
|
|
render_dom_flush(renderer, value);
|
|
|
|
renderer->position = value + valuelen;
|
|
|
|
assert_source(renderer, renderer->position, 0);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (node->data.attribute.reference
|
|
|
|
&& valuelen - quoted * 2 > 0) {
|
|
|
|
int skips;
|
|
|
|
|
|
|
|
/* Need to flush the first quoting delimiter and any
|
|
|
|
* leading whitespace so that the renderers x position
|
|
|
|
* is at the start of the value string. */
|
|
|
|
for (skips = 0; skips < valuelen; skips++) {
|
|
|
|
if ((quoted && skips == 0)
|
|
|
|
|| isspace(value[skips])
|
|
|
|
|| value[skips] < ' ')
|
|
|
|
continue;
|
|
|
|
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (skips > 0) {
|
|
|
|
render_dom_text(renderer, template, value, skips);
|
|
|
|
value += skips;
|
|
|
|
valuelen -= skips;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Figure out what should be skipped after the actual
|
|
|
|
* link text. */
|
|
|
|
for (skips = 0; skips < valuelen; skips++) {
|
|
|
|
if ((quoted && skips == 0)
|
|
|
|
|| isspace(value[valuelen - skips - 1])
|
|
|
|
|| value[valuelen - skips - 1] < ' ')
|
|
|
|
continue;
|
|
|
|
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
2006-01-25 17:16:30 -05:00
|
|
|
if (renderer->doctype == SGML_DOCTYPE_HTML
|
|
|
|
&& node->data.attribute.type == HTML_ATTRIBUTE_HREF
|
|
|
|
&& node->parent->data.element.type == HTML_ELEMENT_BASE) {
|
|
|
|
set_base_uri(renderer, value, valuelen - skips);
|
|
|
|
}
|
|
|
|
|
2006-01-07 21:44:23 -05:00
|
|
|
add_dom_link(renderer, value, valuelen - skips,
|
|
|
|
value, valuelen - skips);
|
2005-09-15 09:58:31 -04:00
|
|
|
|
|
|
|
if (skips > 0) {
|
|
|
|
value += valuelen - skips;
|
|
|
|
render_dom_text(renderer, template, value, skips);
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
render_dom_text(renderer, template, value, valuelen);
|
|
|
|
}
|
|
|
|
}
|
2006-01-15 18:55:58 -05:00
|
|
|
|
|
|
|
return DOM_STACK_CODE_OK;
|
2005-09-15 09:58:31 -04:00
|
|
|
}
|
|
|
|
|
2006-01-15 18:55:58 -05:00
|
|
|
enum dom_stack_code
|
2005-12-26 14:51:01 -05:00
|
|
|
render_dom_cdata_source(struct dom_stack *stack, struct dom_node *node, void *data)
|
|
|
|
{
|
|
|
|
struct dom_renderer *renderer = stack->current->data;
|
|
|
|
unsigned char *string = node->string.string;
|
|
|
|
|
|
|
|
assert(node && renderer && renderer->document);
|
|
|
|
|
|
|
|
/* Highlight the 'CDATA' part of <![CDATA[ if it is there. */
|
|
|
|
if (check_dom_node_source(renderer, string - 6, 6)) {
|
|
|
|
render_dom_flush(renderer, string - 6);
|
|
|
|
render_dom_text(renderer, &renderer->styles[DOM_NODE_ATTRIBUTE], string - 6, 5);
|
|
|
|
renderer->position = string - 1;
|
|
|
|
assert_source(renderer, renderer->position, 0);
|
|
|
|
}
|
|
|
|
|
|
|
|
render_dom_node_text(renderer, &renderer->styles[node->type], node);
|
2006-01-15 18:55:58 -05:00
|
|
|
|
|
|
|
return DOM_STACK_CODE_OK;
|
2005-12-26 14:51:01 -05:00
|
|
|
}
|
|
|
|
|
2006-01-15 18:55:58 -05:00
|
|
|
enum dom_stack_code
|
2005-12-22 06:33:27 -05:00
|
|
|
render_dom_document_end(struct dom_stack *stack, struct dom_node *node, void *data)
|
|
|
|
{
|
|
|
|
struct dom_renderer *renderer = stack->current->data;
|
|
|
|
|
|
|
|
/* If there are no non-element nodes after the last element node make
|
|
|
|
* sure that we flush to the end of the cache entry source including
|
|
|
|
* the '>' of the last element tag if it has one. (bug 519) */
|
|
|
|
if (check_dom_node_source(renderer, renderer->position, 0)) {
|
|
|
|
render_dom_flush(renderer, renderer->end);
|
|
|
|
}
|
2006-01-15 18:55:58 -05:00
|
|
|
|
|
|
|
return DOM_STACK_CODE_OK;
|
2005-12-22 06:33:27 -05:00
|
|
|
}
|
|
|
|
|
2005-12-20 18:58:22 -05:00
|
|
|
static struct dom_stack_context_info dom_source_renderer_context_info = {
|
2005-12-20 22:38:04 -05:00
|
|
|
/* Object size: */ 0,
|
2005-12-20 13:20:04 -05:00
|
|
|
/* Push: */
|
|
|
|
{
|
|
|
|
/* */ NULL,
|
|
|
|
/* DOM_NODE_ELEMENT */ render_dom_element_source,
|
|
|
|
/* DOM_NODE_ATTRIBUTE */ render_dom_attribute_source,
|
|
|
|
/* DOM_NODE_TEXT */ render_dom_node_source,
|
2005-12-26 14:51:01 -05:00
|
|
|
/* DOM_NODE_CDATA_SECTION */ render_dom_cdata_source,
|
2005-12-20 13:20:04 -05:00
|
|
|
/* DOM_NODE_ENTITY_REFERENCE */ render_dom_node_source,
|
|
|
|
/* DOM_NODE_ENTITY */ render_dom_node_source,
|
|
|
|
/* DOM_NODE_PROC_INSTRUCTION */ render_dom_element_source,
|
|
|
|
/* DOM_NODE_COMMENT */ render_dom_node_source,
|
|
|
|
/* DOM_NODE_DOCUMENT */ NULL,
|
|
|
|
/* DOM_NODE_DOCUMENT_TYPE */ render_dom_node_source,
|
|
|
|
/* DOM_NODE_DOCUMENT_FRAGMENT */ render_dom_node_source,
|
|
|
|
/* DOM_NODE_NOTATION */ render_dom_node_source,
|
|
|
|
},
|
|
|
|
/* Pop: */
|
|
|
|
{
|
|
|
|
/* */ NULL,
|
|
|
|
/* DOM_NODE_ELEMENT */ render_dom_element_end_source,
|
|
|
|
/* DOM_NODE_ATTRIBUTE */ NULL,
|
|
|
|
/* DOM_NODE_TEXT */ NULL,
|
|
|
|
/* DOM_NODE_CDATA_SECTION */ NULL,
|
|
|
|
/* DOM_NODE_ENTITY_REFERENCE */ NULL,
|
|
|
|
/* DOM_NODE_ENTITY */ NULL,
|
|
|
|
/* DOM_NODE_PROC_INSTRUCTION */ NULL,
|
|
|
|
/* DOM_NODE_COMMENT */ NULL,
|
2005-12-22 06:33:27 -05:00
|
|
|
/* DOM_NODE_DOCUMENT */ render_dom_document_end,
|
2005-12-20 13:20:04 -05:00
|
|
|
/* DOM_NODE_DOCUMENT_TYPE */ NULL,
|
|
|
|
/* DOM_NODE_DOCUMENT_FRAGMENT */ NULL,
|
|
|
|
/* DOM_NODE_NOTATION */ NULL,
|
|
|
|
}
|
2005-12-05 13:31:42 -05:00
|
|
|
};
|
|
|
|
|
2005-09-15 09:58:31 -04:00
|
|
|
|
2006-01-07 21:44:23 -05:00
|
|
|
/* DOM RSS Renderer */
|
|
|
|
|
2006-01-15 23:12:34 -05:00
|
|
|
/* DOM configuration flags for RSS documents: both whitespace and character
 * normalization are requested. */
#define RSS_CONFIG_FLAGS \
	(DOM_CONFIG_NORMALIZE_CHARACTERS | DOM_CONFIG_NORMALIZE_WHITESPACE)
|
|
|
|
|
2006-01-15 18:55:58 -05:00
|
|
|
enum dom_stack_code
|
2006-01-07 21:44:23 -05:00
|
|
|
dom_rss_push_element(struct dom_stack *stack, struct dom_node *node, void *data)
|
|
|
|
{
|
|
|
|
struct dom_renderer *renderer = stack->current->data;
|
|
|
|
|
|
|
|
assert(node && renderer && renderer->document);
|
|
|
|
|
|
|
|
switch (node->data.element.type) {
|
|
|
|
case RSS_ELEMENT_CHANNEL:
|
|
|
|
/* The stack should have: #document * channel */
|
|
|
|
if (stack->depth != 3)
|
|
|
|
break;
|
|
|
|
|
|
|
|
if (!renderer->channel) {
|
|
|
|
renderer->channel = node;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
|
|
|
case RSS_ELEMENT_ITEM:
|
|
|
|
/* The stack should have: #document * channel item */
|
|
|
|
#if 0
|
|
|
|
/* Don't be so strict ... */
|
|
|
|
if (stack->depth != 4)
|
|
|
|
break;
|
|
|
|
#endif
|
|
|
|
/* ... but be exclusive. */
|
|
|
|
if (renderer->item)
|
|
|
|
break;
|
|
|
|
add_to_dom_node_list(&renderer->items, node, -1);
|
|
|
|
renderer->item = node;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case RSS_ELEMENT_LINK:
|
|
|
|
case RSS_ELEMENT_DESCRIPTION:
|
|
|
|
case RSS_ELEMENT_TITLE:
|
|
|
|
case RSS_ELEMENT_AUTHOR:
|
|
|
|
case RSS_ELEMENT_PUBDATE:
|
|
|
|
if (!node->parent || renderer->node != node->parent)
|
|
|
|
break;
|
|
|
|
|
|
|
|
renderer->node = node;
|
|
|
|
}
|
2006-01-15 18:55:58 -05:00
|
|
|
|
|
|
|
return DOM_STACK_CODE_OK;
|
2006-01-07 21:44:23 -05:00
|
|
|
}
|
|
|
|
|
2006-01-15 18:55:58 -05:00
|
|
|
enum dom_stack_code
|
2006-01-07 21:44:23 -05:00
|
|
|
dom_rss_pop_element(struct dom_stack *stack, struct dom_node *node, void *data)
|
|
|
|
{
|
|
|
|
struct dom_renderer *renderer = stack->current->data;
|
|
|
|
struct dom_node_list **list;
|
|
|
|
|
|
|
|
assert(node && renderer && renderer->document);
|
|
|
|
|
|
|
|
switch (node->data.element.type) {
|
|
|
|
case RSS_ELEMENT_ITEM:
|
|
|
|
if (is_dom_string_set(&renderer->text))
|
|
|
|
done_dom_string(&renderer->text);
|
|
|
|
renderer->item = NULL;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case RSS_ELEMENT_LINK:
|
|
|
|
case RSS_ELEMENT_DESCRIPTION:
|
|
|
|
case RSS_ELEMENT_TITLE:
|
|
|
|
case RSS_ELEMENT_AUTHOR:
|
|
|
|
case RSS_ELEMENT_PUBDATE:
|
|
|
|
if (!is_dom_string_set(&renderer->text)
|
|
|
|
|| !node->parent
|
|
|
|
|| renderer->item != node->parent
|
|
|
|
|| renderer->node != node)
|
|
|
|
break;
|
|
|
|
|
|
|
|
/* Replace any child nodes with the normalized text node. */
|
|
|
|
list = get_dom_node_list(node->parent, node);
|
|
|
|
done_dom_node_list(*list);
|
|
|
|
if (is_dom_string_set(&renderer->text)) {
|
|
|
|
if (!add_dom_node(node, DOM_NODE_TEXT, &renderer->text))
|
|
|
|
done_dom_string(&renderer->text);
|
|
|
|
}
|
|
|
|
renderer->node = NULL;
|
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
|
|
|
break;
|
|
|
|
}
|
2006-01-15 18:55:58 -05:00
|
|
|
|
|
|
|
return DOM_STACK_CODE_OK;
|
2006-01-07 21:44:23 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static struct dom_string *
|
|
|
|
get_rss_text(struct dom_node *node, enum rss_element_type type)
|
|
|
|
{
|
2006-01-16 01:11:02 -05:00
|
|
|
node = get_dom_node_child(node, DOM_NODE_ELEMENT, type);
|
|
|
|
|
|
|
|
if (!node) return NULL;
|
|
|
|
|
|
|
|
node = get_dom_node_child(node, DOM_NODE_TEXT, 0);
|
2006-01-07 21:44:23 -05:00
|
|
|
|
2006-01-16 01:11:02 -05:00
|
|
|
return node ? &node->string: NULL;
|
2006-01-07 21:44:23 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
render_rss_item(struct dom_renderer *renderer, struct dom_node *item)
|
|
|
|
{
|
|
|
|
struct dom_string *title = get_rss_text(item, RSS_ELEMENT_TITLE);
|
|
|
|
struct dom_string *link = get_rss_text(item, RSS_ELEMENT_LINK);
|
|
|
|
struct dom_string *author = get_rss_text(item, RSS_ELEMENT_AUTHOR);
|
|
|
|
struct dom_string *date = get_rss_text(item, RSS_ELEMENT_PUBDATE);
|
|
|
|
|
|
|
|
if (title && is_dom_string_set(title)) {
|
2006-01-09 13:14:28 -05:00
|
|
|
if (item == renderer->channel) {
|
|
|
|
unsigned char *str;
|
|
|
|
|
|
|
|
str = convert_string(renderer->convert_table,
|
|
|
|
title->string, title->length,
|
|
|
|
renderer->document->options.cp,
|
|
|
|
CSM_DEFAULT, NULL, NULL, NULL);
|
|
|
|
if (str)
|
|
|
|
renderer->document->title = str;
|
|
|
|
}
|
2006-01-07 21:44:23 -05:00
|
|
|
render_dom_text(renderer, &renderer->styles[DOM_NODE_ELEMENT],
|
|
|
|
title->string, title->length);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (link && is_dom_string_set(link)) {
|
|
|
|
X(renderer)++;
|
|
|
|
add_dom_link(renderer, "[link]", 6, link->string, link->length);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* New line, and indent */
|
|
|
|
Y(renderer)++;
|
|
|
|
X(renderer) = 0;
|
|
|
|
|
|
|
|
if (author && is_dom_string_set(author)) {
|
|
|
|
render_dom_text(renderer, &renderer->styles[DOM_NODE_COMMENT],
|
|
|
|
author->string, author->length);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (date && is_dom_string_set(date)) {
|
|
|
|
if (author && is_dom_string_set(author)) {
|
|
|
|
render_dom_text(renderer, &renderer->styles[DOM_NODE_COMMENT],
|
|
|
|
" - ", 3);
|
|
|
|
}
|
|
|
|
|
|
|
|
render_dom_text(renderer, &renderer->styles[DOM_NODE_COMMENT],
|
|
|
|
date->string, date->length);
|
|
|
|
}
|
|
|
|
|
|
|
|
if ((author && is_dom_string_set(author))
|
|
|
|
|| (date && is_dom_string_set(date))) {
|
|
|
|
/* New line, and indent */
|
|
|
|
Y(renderer)++;
|
|
|
|
X(renderer) = 0;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2006-01-15 18:55:58 -05:00
|
|
|
enum dom_stack_code
|
2006-01-07 21:44:23 -05:00
|
|
|
dom_rss_pop_document(struct dom_stack *stack, struct dom_node *root, void *data)
|
|
|
|
{
|
|
|
|
struct dom_renderer *renderer = stack->current->data;
|
|
|
|
|
|
|
|
if (!renderer->channel)
|
2006-01-15 18:55:58 -05:00
|
|
|
return DOM_STACK_CODE_OK;
|
2006-01-07 21:44:23 -05:00
|
|
|
|
|
|
|
render_rss_item(renderer, renderer->channel);
|
|
|
|
|
|
|
|
if (renderer->items) {
|
|
|
|
struct dom_node *node;
|
|
|
|
int index;
|
|
|
|
|
|
|
|
foreach_dom_node (renderer->items, node, index) {
|
|
|
|
Y(renderer)++;
|
|
|
|
X(renderer) = 0;
|
|
|
|
render_rss_item(renderer, node);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (is_dom_string_set(&renderer->text))
|
|
|
|
done_dom_string(&renderer->text);
|
|
|
|
mem_free_if(renderer->items);
|
|
|
|
|
|
|
|
done_dom_node(root);
|
2006-01-15 18:55:58 -05:00
|
|
|
|
|
|
|
return DOM_STACK_CODE_OK;
|
2006-01-07 21:44:23 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static struct dom_stack_context_info dom_rss_renderer_context_info = {
|
|
|
|
/* Object size: */ 0,
|
|
|
|
/* Push: */
|
|
|
|
{
|
|
|
|
/* */ NULL,
|
|
|
|
/* DOM_NODE_ELEMENT */ dom_rss_push_element,
|
|
|
|
/* DOM_NODE_ATTRIBUTE */ NULL,
|
2006-01-15 23:12:34 -05:00
|
|
|
/* DOM_NODE_TEXT */ NULL,
|
|
|
|
/* DOM_NODE_CDATA_SECTION */ NULL,
|
|
|
|
/* DOM_NODE_ENTITY_REFERENCE */ NULL,
|
2006-01-07 21:44:23 -05:00
|
|
|
/* DOM_NODE_ENTITY */ NULL,
|
|
|
|
/* DOM_NODE_PROC_INSTRUCTION */ NULL,
|
|
|
|
/* DOM_NODE_COMMENT */ NULL,
|
|
|
|
/* DOM_NODE_DOCUMENT */ NULL,
|
|
|
|
/* DOM_NODE_DOCUMENT_TYPE */ NULL,
|
|
|
|
/* DOM_NODE_DOCUMENT_FRAGMENT */ NULL,
|
|
|
|
/* DOM_NODE_NOTATION */ NULL,
|
|
|
|
},
|
|
|
|
/* Pop: */
|
|
|
|
{
|
|
|
|
/* */ NULL,
|
|
|
|
/* DOM_NODE_ELEMENT */ dom_rss_pop_element,
|
|
|
|
/* DOM_NODE_ATTRIBUTE */ NULL,
|
|
|
|
/* DOM_NODE_TEXT */ NULL,
|
|
|
|
/* DOM_NODE_CDATA_SECTION */ NULL,
|
|
|
|
/* DOM_NODE_ENTITY_REFERENCE */ NULL,
|
|
|
|
/* DOM_NODE_ENTITY */ NULL,
|
|
|
|
/* DOM_NODE_PROC_INSTRUCTION */ NULL,
|
|
|
|
/* DOM_NODE_COMMENT */ NULL,
|
|
|
|
/* DOM_NODE_DOCUMENT */ dom_rss_pop_document,
|
|
|
|
/* DOM_NODE_DOCUMENT_TYPE */ NULL,
|
|
|
|
/* DOM_NODE_DOCUMENT_FRAGMENT */ NULL,
|
|
|
|
/* DOM_NODE_NOTATION */ NULL,
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
|
2005-09-15 09:58:31 -04:00
|
|
|
/* Shared multiplexor between renderers */
|
|
|
|
void
|
|
|
|
render_dom_document(struct cache_entry *cached, struct document *document,
|
|
|
|
struct string *buffer)
|
|
|
|
{
|
|
|
|
unsigned char *head = empty_string_or_(cached->head);
|
|
|
|
struct dom_renderer renderer;
|
|
|
|
struct conv_table *convert_table;
|
2005-11-27 03:18:40 -05:00
|
|
|
struct sgml_parser *parser;
|
2006-01-07 21:44:23 -05:00
|
|
|
enum sgml_parser_type parser_type;
|
2005-12-28 09:19:10 -05:00
|
|
|
unsigned char *string = struri(cached->uri);
|
|
|
|
size_t length = strlen(string);
|
|
|
|
struct dom_string uri = INIT_DOM_STRING(string, length);
|
2006-01-02 11:40:42 -05:00
|
|
|
enum sgml_parser_code code;
|
2005-09-15 09:58:31 -04:00
|
|
|
|
|
|
|
convert_table = get_convert_table(head, document->options.cp,
|
|
|
|
document->options.assume_cp,
|
|
|
|
&document->cp,
|
|
|
|
&document->cp_status,
|
|
|
|
document->options.hard_assume);
|
|
|
|
|
2005-11-15 06:11:48 -05:00
|
|
|
init_dom_renderer(&renderer, document, buffer, convert_table);
|
2005-09-15 09:58:31 -04:00
|
|
|
|
|
|
|
document->bgcolor = document->options.default_bg;
|
|
|
|
|
2006-01-07 21:44:23 -05:00
|
|
|
if (document->options.plain)
|
|
|
|
parser_type = SGML_PARSER_STREAM;
|
|
|
|
else
|
|
|
|
parser_type = SGML_PARSER_TREE;
|
|
|
|
|
2006-01-01 17:22:10 -05:00
|
|
|
/* FIXME: Refactor the doctype lookup. */
|
2006-01-01 17:14:16 -05:00
|
|
|
if (!strcasecmp("application/rss+xml", cached->content_type)) {
|
2006-01-25 17:16:30 -05:00
|
|
|
renderer.doctype = SGML_DOCTYPE_RSS;
|
2006-01-01 17:14:16 -05:00
|
|
|
|
2006-01-01 17:22:10 -05:00
|
|
|
} else if (!strcasecmp("application/docbook+xml", cached->content_type)) {
|
2006-01-25 17:16:30 -05:00
|
|
|
renderer.doctype = SGML_DOCTYPE_DOCBOOK;
|
2006-01-01 17:22:10 -05:00
|
|
|
|
2006-01-01 17:14:16 -05:00
|
|
|
} else if (!strcasecmp("application/xbel+xml", cached->content_type)
|
|
|
|
|| !strcasecmp("application/x-xbel", cached->content_type)
|
|
|
|
|| !strcasecmp("application/xbel", cached->content_type)) {
|
2006-01-25 17:16:30 -05:00
|
|
|
renderer.doctype = SGML_DOCTYPE_XBEL;
|
2006-01-01 17:14:16 -05:00
|
|
|
|
|
|
|
} else {
|
|
|
|
assertm(!strcasecmp("text/html", cached->content_type)
|
|
|
|
|| !strcasecmp("application/xhtml+xml", cached->content_type),
|
|
|
|
"Couldn't resolve doctype '%s'", cached->content_type);
|
|
|
|
|
2006-01-25 17:16:30 -05:00
|
|
|
renderer.doctype = SGML_DOCTYPE_HTML;
|
2006-01-01 17:14:16 -05:00
|
|
|
}
|
2005-12-19 21:08:13 -05:00
|
|
|
|
2006-01-25 17:16:30 -05:00
|
|
|
parser = init_sgml_parser(parser_type, renderer.doctype, &uri, 0);
|
2006-01-07 21:44:23 -05:00
|
|
|
if (!parser) return;
|
2006-01-12 18:11:39 -05:00
|
|
|
|
2006-01-07 21:44:23 -05:00
|
|
|
if (document->options.plain) {
|
|
|
|
add_dom_stack_context(&parser->stack, &renderer,
|
|
|
|
&dom_source_renderer_context_info);
|
2005-12-05 13:20:48 -05:00
|
|
|
|
2006-01-25 17:16:30 -05:00
|
|
|
} else if (renderer.doctype == SGML_DOCTYPE_RSS) {
|
2006-01-07 21:44:23 -05:00
|
|
|
add_dom_stack_context(&parser->stack, &renderer,
|
|
|
|
&dom_rss_renderer_context_info);
|
2006-01-27 19:59:22 -05:00
|
|
|
add_dom_config_normalizer(&parser->stack, RSS_CONFIG_FLAGS);
|
2006-01-07 21:44:23 -05:00
|
|
|
}
|
2005-12-21 08:41:28 -05:00
|
|
|
|
2006-01-02 11:40:42 -05:00
|
|
|
/* FIXME: When rendering this way we don't really care about the code.
|
|
|
|
* However, it will be useful when we will be able to also
|
|
|
|
* incrementally parse new data. This will require the parser to live
|
|
|
|
* during the fetching of data. */
|
2006-01-14 05:32:11 -05:00
|
|
|
code = parse_sgml(parser, buffer->source, buffer->length, 1);
|
2006-01-02 11:40:42 -05:00
|
|
|
if (parser->root) {
|
2005-12-22 06:33:27 -05:00
|
|
|
assert(parser->stack.depth == 1);
|
2005-12-05 13:20:48 -05:00
|
|
|
|
2005-12-22 06:33:27 -05:00
|
|
|
get_dom_stack_top(&parser->stack)->immutable = 0;
|
|
|
|
/* For SGML_PARSER_STREAM this will free the DOM
|
|
|
|
* root node. */
|
|
|
|
pop_dom_node(&parser->stack);
|
2005-09-15 09:58:31 -04:00
|
|
|
}
|
|
|
|
|
2005-12-25 09:16:21 -05:00
|
|
|
#ifdef HAVE_REGEX_H
|
|
|
|
if (renderer.find_url)
|
|
|
|
regfree(&renderer.url_regex);
|
|
|
|
#endif
|
2006-01-25 17:16:30 -05:00
|
|
|
done_uri(renderer.base_uri);
|
2005-12-22 06:33:27 -05:00
|
|
|
done_sgml_parser(parser);
|
2005-09-15 09:58:31 -04:00
|
|
|
}
|