2005-09-15 09:58:31 -04:00
|
|
|
|
2005-12-28 08:05:14 -05:00
|
|
|
#ifndef EL_DOM_SGML_SGML_H
|
|
|
|
#define EL_DOM_SGML_SGML_H
|
2005-09-15 09:58:31 -04:00
|
|
|
|
|
|
|
#include <stdlib.h>
|
|
|
|
|
2006-01-18 22:50:10 -05:00
|
|
|
#include "dom/node.h"
|
2005-12-28 08:05:14 -05:00
|
|
|
#include "dom/string.h"
|
2005-09-15 09:58:31 -04:00
|
|
|
|
|
|
|
/* The flags stored in the attribute sgml node info data */
/* TODO: Other potential flags (there can be only 16)
 *
 * - interaction info for forms (disabled, readonly, maxlength) maybe tabindex,
 * - table layout,
 * - generic layout style attributes maybe giving color values an additional flag,
 * - meta information (rel, rev, title, alt, summary, caption, standby, lang),
 * - scripting hooks (onblur, ...)
 * - information about the referenced content (hreflang, codetype, media, type)
 *
 * Anyway the flags should of course optimally have a purpose to speed things up
 * by quickly making it possible to identify certain attribute groups. --jonas */
enum sgml_attribute_flags {
	/* The value uniquely identifies the owner */
	SGML_ATTRIBUTE_IDENTIFIER = 1,
	/* The value contains an URI of some sort */
	SGML_ATTRIBUTE_REFERENCE = 2,
};
|
|
|
|
|
|
|
|
/* TODO: We also need an element flag to signal to the parser that all the
 * content should be skipped; possible with some ugly hacks to not use the
 * scanner since it could get confused. The purpose of this flag is to group
 * all element content in one text node. Kind of like a ``verbatim'' thing
 * where no parsing should be done. For HTML the <script> and <style> tags
 * should use it. */
enum sgml_element_flags {
	/* The start and end tags are optional */
	SGML_ELEMENT_OPTIONAL = 1,

	/* The element is empty and end tags are forbidden */
	SGML_ELEMENT_EMPTY = 2,

	/* The end tag is optional */
	SGML_ELEMENT_END_OPTIONAL = 4,
};
|
|
|
|
|
|
|
|
struct sgml_node_info {
|
2005-12-10 15:58:59 -05:00
|
|
|
struct dom_string string;
|
2005-09-15 09:58:31 -04:00
|
|
|
uint16_t type;
|
|
|
|
uint16_t flags;
|
|
|
|
};
|
|
|
|
|
2005-12-10 15:58:59 -05:00
|
|
|
/* The header node is special. It is used for storing the number of nodes and
 * for returning the default 'unknown' node.
 *
 * Expands to a brace initializer whose string has a NULL text and a length of
 * <doctype>_<nodetype>S - 1, and whose type is <doctype>_<nodetype>_UNKNOWN.
 * Both identifiers must be defined by the user of the macro. */
#define SGML_NODE_HEAD(doctype, nodetype) \
	{ INIT_DOM_STRING(NULL, doctype##_##nodetype##S - 1), doctype##_##nodetype##_UNKNOWN }
|
2005-09-15 09:58:31 -04:00
|
|
|
|
|
|
|
/* Expands to a brace initializer for a node info entry whose string is the
 * stringified @name (length excluding the terminating NUL), whose type is the
 * identifier <doctype>_<nodetype>_<name>, and whose flags are @data. */
#define SGML_NODE_INFO(doctype, nodetype, name, data) \
	{ INIT_DOM_STRING(#name, sizeof(#name) - 1), doctype##_##nodetype##_##name, data }
|
2005-09-15 09:58:31 -04:00
|
|
|
|
|
|
|
/* Like SGML_NODE_INFO() but takes the string separately as @ident, for names
 * that cannot be spelled as a C identifier suffix. sizeof is applied to
 * @ident, so it has to be a string literal (or char array), not a pointer. */
#define SGML_NODE_INF2(doctype, nodetype, name, ident, data) \
	{ INIT_DOM_STRING(ident, sizeof(ident) - 1), doctype##_##nodetype##_##name, data }
|
2005-09-15 09:58:31 -04:00
|
|
|
|
|
|
|
/* Pastes the three arguments together, separated by underscores, into the
 * single identifier <doctype>_<nodetype>_<name>. */
#define SGML_NODE_INFO_TYPE(doctype, nodetype, name) \
	doctype##_##nodetype##_##name
|
|
|
|
|
|
|
|
/* Comparison callback with the signature bsearch() expects.
 * get_sgml_node_info() hands it a struct dom_node pointer as @key and an
 * element of a struct sgml_node_info array as @node. Defined elsewhere. */
int sgml_info_strcmp(const void *key, const void *node);
|
|
|
|
|
|
|
|
static inline struct sgml_node_info *
|
|
|
|
get_sgml_node_info(struct sgml_node_info list[], struct dom_node *node)
|
|
|
|
{
|
|
|
|
struct sgml_node_info *map = &list[1];
|
2005-12-10 15:58:59 -05:00
|
|
|
size_t map_size = list->string.length;
|
2005-09-15 09:58:31 -04:00
|
|
|
size_t obj_size = sizeof(struct sgml_node_info);
|
|
|
|
void *match = bsearch(node, map, map_size, obj_size, sgml_info_strcmp);
|
|
|
|
|
|
|
|
return match ? match : list;
|
|
|
|
}
|
|
|
|
|
2005-12-19 19:04:33 -05:00
|
|
|
/* The document types that can be passed to get_sgml_info(). */
enum sgml_document_type {
	SGML_DOCTYPE_DOCBOOK,
	SGML_DOCTYPE_HTML,
	SGML_DOCTYPE_RSS,
	SGML_DOCTYPE_XBEL,

	/* Number of document types above; keep this enumerator last. */
	SGML_DOCTYPES,
};
|
|
|
|
|
2005-09-15 09:58:31 -04:00
|
|
|
struct sgml_info {
|
2005-12-19 19:04:33 -05:00
|
|
|
enum sgml_document_type doctype;
|
2005-09-15 09:58:31 -04:00
|
|
|
struct sgml_node_info *attributes;
|
|
|
|
struct sgml_node_info *elements;
|
|
|
|
};
|
|
|
|
|
2005-12-19 19:04:33 -05:00
|
|
|
/* Returns a pointer to the struct sgml_info for @doctype. Defined elsewhere;
 * how values outside enum sgml_document_type are handled is not visible
 * from this header. */
struct sgml_info *get_sgml_info(enum sgml_document_type doctype);
|
|
|
|
|
2005-09-15 09:58:31 -04:00
|
|
|
#endif
|