blob: ed97915333b9fc02064783be9e821627521c54f5 [file] [log] [blame]
William M. Brack2ad1dff2003-11-15 10:35:20 +00001<html><head><meta http-equiv="Content-Type" content="text/html; charset=ISO-8859-1"><title>HTMLparser</title><meta name="generator" content="DocBook XSL Stylesheets V1.48"><meta name="generator" content="GTK-Doc V1.1 (XML mode)"><style type="text/css">
Daniel Veillardd4330462003-04-29 12:40:16 +00002 .synopsis, .classsynopsis {
3 background: #eeeeee;
4 border: solid 1px #aaaaaa;
5 padding: 0.5em;
6 }
7 .programlisting {
8 background: #eeeeff;
9 border: solid 1px #aaaaff;
10 padding: 0.5em;
11 }
12 .variablelist {
13 padding: 4px;
14 margin-left: 3em;
15 }
16 .navigation {
17 background: #ffeeee;
18 border: solid 1px #ffaaaa;
19 margin-top: 0.5em;
20 margin-bottom: 0.5em;
21 }
22 .navigation a {
23 color: #770000;
24 }
25 .navigation a:visited {
26 color: #550000;
27 }
28 .navigation .title {
29 font-size: 200%;
30 }
William M. Brack2ad1dff2003-11-15 10:35:20 +000031 </style><link rel="home" href="index.html" title="Gnome XML Library Reference Manual "><link rel="up" href="ch01.html" title="Libxml Programming Notes"><link rel="previous" href="libxml-entities.html" title="entities"><link rel="next" href="libxml-valid.html" title="valid"></head><body text="black" link="#0000FF" vlink="#840084" alink="#0000FF"><table class="navigation" width="100%" summary="Navigation header" cellpadding="2" cellspacing="2"><tr valign="middle"><td><a accesskey="p" href="libxml-entities.html"><img src="left.png" width="24" height="24" border="0" alt="Prev"></a></td><td><a accesskey="u" href="ch01.html"><img src="up.png" width="24" height="24" border="0" alt="Up"></a></td><td><a accesskey="h" href="index.html"><img src="home.png" width="24" height="24" border="0" alt="Home"></a></td><th width="100%" align="center">Gnome XML Library Reference Manual </th><td><a accesskey="n" href="libxml-valid.html"><img src="right.png" width="24" height="24" border="0" alt="Next"></a></td></tr></table><div class="refentry"><a name="libxml-HTMLparser"></a><div class="titlepage"></div><div class="refnamediv"><h2>HTMLparser</h2><p>HTMLparser &#8212; </p></div><div class="refsynopsisdiv"><h2 class="title"><a name="id2684037"></a>Synopsis</h2><pre class="synopsis">
Daniel Veillardd4330462003-04-29 12:40:16 +000032
33
34
35typedef <a href="libxml-HTMLparser.html#htmlParserCtxt">htmlParserCtxt</a>;
36typedef <a href="libxml-HTMLparser.html#htmlParserCtxtPtr">htmlParserCtxtPtr</a>;
37typedef <a href="libxml-HTMLparser.html#htmlParserNodeInfo">htmlParserNodeInfo</a>;
38typedef <a href="libxml-HTMLparser.html#htmlSAXHandler">htmlSAXHandler</a>;
39typedef <a href="libxml-HTMLparser.html#htmlSAXHandlerPtr">htmlSAXHandlerPtr</a>;
40typedef <a href="libxml-HTMLparser.html#htmlParserInput">htmlParserInput</a>;
41typedef <a href="libxml-HTMLparser.html#htmlParserInputPtr">htmlParserInputPtr</a>;
42typedef <a href="libxml-HTMLparser.html#htmlDocPtr">htmlDocPtr</a>;
43typedef <a href="libxml-HTMLparser.html#htmlNodePtr">htmlNodePtr</a>;
44struct <a href="libxml-HTMLparser.html#htmlElemDesc">htmlElemDesc</a>;
45typedef <a href="libxml-HTMLparser.html#htmlElemDescPtr">htmlElemDescPtr</a>;
46struct <a href="libxml-HTMLparser.html#htmlEntityDesc">htmlEntityDesc</a>;
47typedef <a href="libxml-HTMLparser.html#htmlEntityDescPtr">htmlEntityDescPtr</a>;
William M. Brack2ad1dff2003-11-15 10:35:20 +000048enum <a href="libxml-HTMLparser.html#htmlParserOption">htmlParserOption</a>;
49</pre></div><div class="refsect1"><h2>Description</h2><p>
Daniel Veillardd4330462003-04-29 12:40:16 +000050
William M. Brack2ad1dff2003-11-15 10:35:20 +000051</p></div><div class="refsect1"><h2>Details</h2><div class="refsect2"><h3><a name="htmlParserCtxt"></a>htmlParserCtxt</h3><pre class="programlisting">typedef xmlParserCtxt htmlParserCtxt;
Daniel Veillardd7cec922003-06-13 12:30:10 +000052</pre><p>
Daniel Veillardd4330462003-04-29 12:40:16 +000053
William M. Brack2ad1dff2003-11-15 10:35:20 +000054</p></div><hr><div class="refsect2"><h3><a name="htmlParserCtxtPtr"></a>htmlParserCtxtPtr</h3><pre class="programlisting">typedef xmlParserCtxtPtr htmlParserCtxtPtr;
Daniel Veillardd7cec922003-06-13 12:30:10 +000055</pre><p>
Daniel Veillardd4330462003-04-29 12:40:16 +000056
William M. Brack2ad1dff2003-11-15 10:35:20 +000057</p></div><hr><div class="refsect2"><h3><a name="htmlParserNodeInfo"></a>htmlParserNodeInfo</h3><pre class="programlisting">typedef xmlParserNodeInfo htmlParserNodeInfo;
Daniel Veillardd7cec922003-06-13 12:30:10 +000058</pre><p>
Daniel Veillardd4330462003-04-29 12:40:16 +000059
William M. Brack2ad1dff2003-11-15 10:35:20 +000060</p></div><hr><div class="refsect2"><h3><a name="htmlSAXHandler"></a>htmlSAXHandler</h3><pre class="programlisting">typedef xmlSAXHandler htmlSAXHandler;
Daniel Veillardd7cec922003-06-13 12:30:10 +000061</pre><p>
Daniel Veillardd4330462003-04-29 12:40:16 +000062
William M. Brack2ad1dff2003-11-15 10:35:20 +000063</p></div><hr><div class="refsect2"><h3><a name="htmlSAXHandlerPtr"></a>htmlSAXHandlerPtr</h3><pre class="programlisting">typedef xmlSAXHandlerPtr htmlSAXHandlerPtr;
Daniel Veillardd7cec922003-06-13 12:30:10 +000064</pre><p>
Daniel Veillardd4330462003-04-29 12:40:16 +000065
William M. Brack2ad1dff2003-11-15 10:35:20 +000066</p></div><hr><div class="refsect2"><h3><a name="htmlParserInput"></a>htmlParserInput</h3><pre class="programlisting">typedef xmlParserInput htmlParserInput;
Daniel Veillardd7cec922003-06-13 12:30:10 +000067</pre><p>
Daniel Veillardd4330462003-04-29 12:40:16 +000068
William M. Brack2ad1dff2003-11-15 10:35:20 +000069</p></div><hr><div class="refsect2"><h3><a name="htmlParserInputPtr"></a>htmlParserInputPtr</h3><pre class="programlisting">typedef xmlParserInputPtr htmlParserInputPtr;
Daniel Veillardd7cec922003-06-13 12:30:10 +000070</pre><p>
Daniel Veillardd4330462003-04-29 12:40:16 +000071
William M. Brack2ad1dff2003-11-15 10:35:20 +000072</p></div><hr><div class="refsect2"><h3><a name="htmlDocPtr"></a>htmlDocPtr</h3><pre class="programlisting">typedef xmlDocPtr htmlDocPtr;
Daniel Veillardd7cec922003-06-13 12:30:10 +000073</pre><p>
Daniel Veillardd4330462003-04-29 12:40:16 +000074
William M. Brack2ad1dff2003-11-15 10:35:20 +000075</p></div><hr><div class="refsect2"><h3><a name="htmlNodePtr"></a>htmlNodePtr</h3><pre class="programlisting">typedef xmlNodePtr htmlNodePtr;
Daniel Veillardd7cec922003-06-13 12:30:10 +000076</pre><p>
Daniel Veillardd4330462003-04-29 12:40:16 +000077
William M. Brack2ad1dff2003-11-15 10:35:20 +000078</p></div><hr><div class="refsect2"><h3><a name="htmlElemDesc"></a>struct htmlElemDesc</h3><pre class="programlisting">struct htmlElemDesc {
79
Daniel Veillardd4330462003-04-29 12:40:16 +000080 const char *name; /* The tag name */
81 char startTag; /* Whether the start tag can be implied */
82 char endTag; /* Whether the end tag can be implied */
83 char saveEndTag; /* Whether the end tag should be saved */
84 char empty; /* Is this an empty element ? */
85 char depr; /* Is this a deprecated element ? */
86 char dtd; /* 1: only in the Loose DTD, 2: only in the Frameset DTD */
87 char isinline; /* 0: block element, 1: inline element */
88 const char *desc; /* the description */
89
90/* NRK Jan.2003
91 * New fields encapsulating HTML structure
92 *
93 * Bugs:
94 * This is a very limited representation. It fails to tell us when
95 * an element *requires* subelements (we only have whether they're
96 * allowed or not), and it doesn't tell us where CDATA and PCDATA
97 * are allowed. Some element relationships are not fully represented:
98 * these are flagged with the word MODIFIER
99 */
100 const char** subelts; /* allowed sub-elements of this element */
101 const char* defaultsubelt; /* subelement for suggested auto-repair
102 if necessary or NULL */
103 const char** attrs_opt; /* Optional Attributes */
104 const char** attrs_depr; /* Additional deprecated attributes */
105 const char** attrs_req; /* Required attributes */
106};
107</pre><p>
108
William M. Brack2ad1dff2003-11-15 10:35:20 +0000109</p></div><hr><div class="refsect2"><h3><a name="htmlElemDescPtr"></a>htmlElemDescPtr</h3><pre class="programlisting">typedef htmlElemDesc *htmlElemDescPtr;
Daniel Veillardd7cec922003-06-13 12:30:10 +0000110</pre><p>
Daniel Veillardd4330462003-04-29 12:40:16 +0000111
William M. Brack2ad1dff2003-11-15 10:35:20 +0000112</p></div><hr><div class="refsect2"><h3><a name="htmlEntityDesc"></a>struct htmlEntityDesc</h3><pre class="programlisting">struct htmlEntityDesc {
113
Daniel Veillardd4330462003-04-29 12:40:16 +0000114 unsigned int value; /* the UNICODE value for the character */
115 const char *name; /* The entity name */
116 const char *desc; /* the description */
117};
118</pre><p>
119
William M. Brack2ad1dff2003-11-15 10:35:20 +0000120</p></div><hr><div class="refsect2"><h3><a name="htmlEntityDescPtr"></a>htmlEntityDescPtr</h3><pre class="programlisting">typedef htmlEntityDesc *htmlEntityDescPtr;
Daniel Veillardd7cec922003-06-13 12:30:10 +0000121</pre><p>
Daniel Veillardd4330462003-04-29 12:40:16 +0000122
William M. Brack2ad1dff2003-11-15 10:35:20 +0000123</p></div><hr><div class="refsect2"><h3><a name="htmlParserOption"></a>enum htmlParserOption</h3><pre class="programlisting">typedef enum {
124 HTML_PARSE_NOERROR = 1&lt;&lt;5, /* suppress error reports */
125 HTML_PARSE_NOWARNING= 1&lt;&lt;6, /* suppress warning reports */
126 HTML_PARSE_PEDANTIC = 1&lt;&lt;7, /* pedantic error reporting */
127 HTML_PARSE_NOBLANKS = 1&lt;&lt;8, /* remove blank nodes */
128 HTML_PARSE_NONET = 1&lt;&lt;11 /* Forbid network access */
129} htmlParserOption;
130</pre><p>
Daniel Veillardd4330462003-04-29 12:40:16 +0000131
William M. Brack2ad1dff2003-11-15 10:35:20 +0000132</p></div></div></div><table class="navigation" width="100%" summary="Navigation footer" cellpadding="2" cellspacing="0"><tr valign="middle"><td align="left"><a accesskey="p" href="libxml-entities.html"><b>&lt;&lt; entities</b></a></td><td align="right"><a accesskey="n" href="libxml-valid.html"><b>valid &gt;&gt;</b></a></td></tr></table></body></html>