blob: 0f68966ba8ccbc6f0c2e883dfc16995cb075df56 [file] [log] [blame]
Daniel Veillard1566d3a1999-07-15 14:24:29 +00001<HTML
2><HEAD
3><TITLE
4>HTMLparser</TITLE
5><META
6NAME="GENERATOR"
Daniel Veillard71b656e2000-01-05 14:46:17 +00007CONTENT="Modular DocBook HTML Stylesheet Version 1.44"><LINK
Daniel Veillard1566d3a1999-07-15 14:24:29 +00008REL="HOME"
9TITLE="Gnome XML Library Reference Manual"
10HREF="book1.html"><LINK
11REL="UP"
Daniel Veillard35008381999-10-25 13:15:52 +000012TITLE="Libxml Library Reference"
13HREF="libxml-lib.html"><LINK
Daniel Veillard1566d3a1999-07-15 14:24:29 +000014REL="PREVIOUS"
Daniel Veillard6bd26dc1999-09-03 14:28:40 +000015TITLE="xml-error"
16HREF="gnome-xml-xml-error.html"><LINK
Daniel Veillard1566d3a1999-07-15 14:24:29 +000017REL="NEXT"
18TITLE="HTMLtree"
19HREF="gnome-xml-htmltree.html"></HEAD
20><BODY
21BGCOLOR="#FFFFFF"
22TEXT="#000000"
Daniel Veillard71b656e2000-01-05 14:46:17 +000023LINK="#0000FF"
24VLINK="#840084"
25ALINK="#0000FF"
Daniel Veillard1566d3a1999-07-15 14:24:29 +000026><DIV
27CLASS="NAVHEADER"
28><TABLE
29WIDTH="100%"
30BORDER="0"
31BGCOLOR="#000000"
32CELLPADDING="1"
33CELLSPACING="0"
34><TR
35><TH
36COLSPAN="4"
37ALIGN="center"
38><FONT
39COLOR="#FFFFFF"
40SIZE="5"
41>Gnome XML Library Reference Manual</FONT
42></TH
43></TR
44><TR
45><TD
46WIDTH="25%"
47BGCOLOR="#C00000"
48ALIGN="left"
49><A
Daniel Veillard6bd26dc1999-09-03 14:28:40 +000050HREF="gnome-xml-xml-error.html"
Daniel Veillard1566d3a1999-07-15 14:24:29 +000051><FONT
52COLOR="#FFFFFF"
53SIZE="3"
54><B
55>&#60;&#60;&#60; Previous Page</B
56></FONT
57></A
58></TD
59><TD
60WIDTH="25%"
61BGCOLOR="#0000C0"
62ALIGN="center"
63><FONT
64COLOR="#FFFFFF"
65SIZE="3"
66><B
67><A
68HREF="book1.html"
69><FONT
70COLOR="#FFFFFF"
71SIZE="3"
72><B
73>Home</B
74></FONT
75></A
76></B
77></FONT
78></TD
79><TD
80WIDTH="25%"
81BGCOLOR="#00C000"
82ALIGN="center"
83><FONT
84COLOR="#FFFFFF"
85SIZE="3"
86><B
87><A
Daniel Veillard35008381999-10-25 13:15:52 +000088HREF="libxml-lib.html"
Daniel Veillard1566d3a1999-07-15 14:24:29 +000089><FONT
90COLOR="#FFFFFF"
91SIZE="3"
92><B
93>Up</B
94></FONT
95></A
96></B
97></FONT
98></TD
99><TD
100WIDTH="25%"
101BGCOLOR="#C00000"
102ALIGN="right"
103><A
104HREF="gnome-xml-htmltree.html"
105><FONT
106COLOR="#FFFFFF"
107SIZE="3"
108><B
109>Next Page &#62;&#62;&#62;</B
110></FONT
111></A
112></TD
113></TR
114></TABLE
115></DIV
116><H1
Daniel Veillard71b656e2000-01-05 14:46:17 +0000117><A
118NAME="GNOME-XML-HTMLPARSER"
119>HTMLparser</A
120></H1
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000121><DIV
122CLASS="REFNAMEDIV"
123><A
Daniel Veillard71b656e2000-01-05 14:46:17 +0000124NAME="AEN7186"
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000125></A
126><H2
127>Name</H2
Daniel Veillard71b656e2000-01-05 14:46:17 +0000128>HTMLparser&nbsp;--&nbsp;</DIV
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000129><DIV
130CLASS="REFSYNOPSISDIV"
131><A
Daniel Veillard71b656e2000-01-05 14:46:17 +0000132NAME="AEN7189"
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000133></A
134><H2
135>Synopsis</H2
136><TABLE
137BORDER="0"
138BGCOLOR="#D6E8FF"
139WIDTH="100%"
140CELLPADDING="6"
141><TR
142><TD
143><PRE
144CLASS="SYNOPSIS"
145>&#13;
146
147typedef <A
148HREF="gnome-xml-htmlparser.html#HTMLPARSERCTXT"
149>htmlParserCtxt</A
150>;
151typedef <A
152HREF="gnome-xml-htmlparser.html#HTMLPARSERCTXTPTR"
153>htmlParserCtxtPtr</A
154>;
155typedef <A
156HREF="gnome-xml-htmlparser.html#HTMLPARSERNODEINFO"
157>htmlParserNodeInfo</A
158>;
159typedef <A
160HREF="gnome-xml-htmlparser.html#HTMLSAXHANDLER"
161>htmlSAXHandler</A
162>;
163typedef <A
164HREF="gnome-xml-htmlparser.html#HTMLSAXHANDLERPTR"
165>htmlSAXHandlerPtr</A
166>;
167typedef <A
168HREF="gnome-xml-htmlparser.html#HTMLPARSERINPUT"
169>htmlParserInput</A
170>;
171typedef <A
172HREF="gnome-xml-htmlparser.html#HTMLPARSERINPUTPTR"
173>htmlParserInputPtr</A
174>;
175typedef <A
176HREF="gnome-xml-htmlparser.html#HTMLDOCPTR"
177>htmlDocPtr</A
178>;
179typedef <A
180HREF="gnome-xml-htmlparser.html#HTMLNODEPTR"
181>htmlNodePtr</A
182>;
183<GTKDOCLINK
184HREF="HTMLELEMDESCPTR"
185>htmlElemDescPtr</GTKDOCLINK
186> <A
187HREF="gnome-xml-htmlparser.html#HTMLTAGLOOKUP"
188>htmlTagLookup</A
189> (const <A
Daniel Veillarddd6b3671999-09-23 22:19:22 +0000190HREF="gnome-xml-tree.html#XMLCHAR"
191>xmlChar</A
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000192> *tag);
193<GTKDOCLINK
194HREF="HTMLENTITYDESCPTR"
195>htmlEntityDescPtr</GTKDOCLINK
196> <A
197HREF="gnome-xml-htmlparser.html#HTMLENTITYLOOKUP"
198>htmlEntityLookup</A
199> (const <A
Daniel Veillarddd6b3671999-09-23 22:19:22 +0000200HREF="gnome-xml-tree.html#XMLCHAR"
201>xmlChar</A
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000202> *name);
203<GTKDOCLINK
204HREF="HTMLENTITYDESCPTR"
205>htmlEntityDescPtr</GTKDOCLINK
206> <A
207HREF="gnome-xml-htmlparser.html#HTMLPARSEENTITYREF"
208>htmlParseEntityRef</A
209> (<A
210HREF="gnome-xml-htmlparser.html#HTMLPARSERCTXTPTR"
211>htmlParserCtxtPtr</A
212> ctxt,
213 <A
Daniel Veillarddd6b3671999-09-23 22:19:22 +0000214HREF="gnome-xml-tree.html#XMLCHAR"
215>xmlChar</A
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000216> **str);
217int <A
218HREF="gnome-xml-htmlparser.html#HTMLPARSECHARREF"
219>htmlParseCharRef</A
220> (<A
221HREF="gnome-xml-htmlparser.html#HTMLPARSERCTXTPTR"
222>htmlParserCtxtPtr</A
223> ctxt);
224void <A
225HREF="gnome-xml-htmlparser.html#HTMLPARSEELEMENT"
226>htmlParseElement</A
227> (<A
228HREF="gnome-xml-htmlparser.html#HTMLPARSERCTXTPTR"
229>htmlParserCtxtPtr</A
230> ctxt);
231<A
232HREF="gnome-xml-htmlparser.html#HTMLDOCPTR"
233>htmlDocPtr</A
234> <A
235HREF="gnome-xml-htmlparser.html#HTMLSAXPARSEDOC"
236>htmlSAXParseDoc</A
237> (<A
Daniel Veillarddd6b3671999-09-23 22:19:22 +0000238HREF="gnome-xml-tree.html#XMLCHAR"
239>xmlChar</A
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000240> *cur,
241 const char *encoding,
242 <A
243HREF="gnome-xml-htmlparser.html#HTMLSAXHANDLERPTR"
244>htmlSAXHandlerPtr</A
245> sax,
246 void *userData);
247<A
248HREF="gnome-xml-htmlparser.html#HTMLDOCPTR"
249>htmlDocPtr</A
250> <A
251HREF="gnome-xml-htmlparser.html#HTMLPARSEDOC"
252>htmlParseDoc</A
253> (<A
Daniel Veillarddd6b3671999-09-23 22:19:22 +0000254HREF="gnome-xml-tree.html#XMLCHAR"
255>xmlChar</A
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000256> *cur,
257 const char *encoding);
258<A
259HREF="gnome-xml-htmlparser.html#HTMLDOCPTR"
260>htmlDocPtr</A
261> <A
262HREF="gnome-xml-htmlparser.html#HTMLSAXPARSEFILE"
263>htmlSAXParseFile</A
264> (const char *filename,
265 const char *encoding,
266 <A
267HREF="gnome-xml-htmlparser.html#HTMLSAXHANDLERPTR"
268>htmlSAXHandlerPtr</A
269> sax,
270 void *userData);
271<A
272HREF="gnome-xml-htmlparser.html#HTMLDOCPTR"
273>htmlDocPtr</A
274> <A
275HREF="gnome-xml-htmlparser.html#HTMLPARSEFILE"
276>htmlParseFile</A
277> (const char *filename,
Daniel Veillard71b656e2000-01-05 14:46:17 +0000278 const char *encoding);</PRE
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000279></TD
280></TR
281></TABLE
282></DIV
283><DIV
284CLASS="REFSECT1"
285><A
Daniel Veillard71b656e2000-01-05 14:46:17 +0000286NAME="AEN7227"
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000287></A
288><H2
289>Description</H2
290><P
291></P
292></DIV
293><DIV
294CLASS="REFSECT1"
295><A
Daniel Veillard71b656e2000-01-05 14:46:17 +0000296NAME="AEN7230"
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000297></A
298><H2
299>Details</H2
300><DIV
301CLASS="REFSECT2"
302><A
Daniel Veillard71b656e2000-01-05 14:46:17 +0000303NAME="AEN7232"
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000304></A
305><H3
306><A
307NAME="HTMLPARSERCTXT"
308></A
309>htmlParserCtxt</H3
310><P
311></P
312></DIV
313><HR><DIV
314CLASS="REFSECT2"
315><A
Daniel Veillard71b656e2000-01-05 14:46:17 +0000316NAME="AEN7236"
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000317></A
318><H3
319><A
320NAME="HTMLPARSERCTXTPTR"
321></A
322>htmlParserCtxtPtr</H3
323><P
324></P
325></DIV
326><HR><DIV
327CLASS="REFSECT2"
328><A
Daniel Veillard71b656e2000-01-05 14:46:17 +0000329NAME="AEN7240"
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000330></A
331><H3
332><A
333NAME="HTMLPARSERNODEINFO"
334></A
335>htmlParserNodeInfo</H3
336><P
337></P
338></DIV
339><HR><DIV
340CLASS="REFSECT2"
341><A
Daniel Veillard71b656e2000-01-05 14:46:17 +0000342NAME="AEN7244"
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000343></A
344><H3
345><A
346NAME="HTMLSAXHANDLER"
347></A
348>htmlSAXHandler</H3
349><P
350></P
351></DIV
352><HR><DIV
353CLASS="REFSECT2"
354><A
Daniel Veillard71b656e2000-01-05 14:46:17 +0000355NAME="AEN7248"
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000356></A
357><H3
358><A
359NAME="HTMLSAXHANDLERPTR"
360></A
361>htmlSAXHandlerPtr</H3
362><P
363></P
364></DIV
365><HR><DIV
366CLASS="REFSECT2"
367><A
Daniel Veillard71b656e2000-01-05 14:46:17 +0000368NAME="AEN7252"
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000369></A
370><H3
371><A
372NAME="HTMLPARSERINPUT"
373></A
374>htmlParserInput</H3
375><P
376></P
377></DIV
378><HR><DIV
379CLASS="REFSECT2"
380><A
Daniel Veillard71b656e2000-01-05 14:46:17 +0000381NAME="AEN7256"
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000382></A
383><H3
384><A
385NAME="HTMLPARSERINPUTPTR"
386></A
387>htmlParserInputPtr</H3
388><P
389></P
390></DIV
391><HR><DIV
392CLASS="REFSECT2"
393><A
Daniel Veillard71b656e2000-01-05 14:46:17 +0000394NAME="AEN7260"
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000395></A
396><H3
397><A
398NAME="HTMLDOCPTR"
399></A
400>htmlDocPtr</H3
401><P
402></P
403></DIV
404><HR><DIV
405CLASS="REFSECT2"
406><A
Daniel Veillard71b656e2000-01-05 14:46:17 +0000407NAME="AEN7264"
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000408></A
409><H3
410><A
411NAME="HTMLNODEPTR"
412></A
413>htmlNodePtr</H3
414><P
415></P
416></DIV
417><HR><DIV
418CLASS="REFSECT2"
419><A
Daniel Veillard71b656e2000-01-05 14:46:17 +0000420NAME="AEN7268"
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000421></A
422><H3
423><A
424NAME="HTMLTAGLOOKUP"
425></A
426>htmlTagLookup ()</H3
427><TABLE
428BORDER="0"
429BGCOLOR="#D6E8FF"
430WIDTH="100%"
431CELLPADDING="6"
432><TR
433><TD
434><PRE
435CLASS="PROGRAMLISTING"
436><GTKDOCLINK
437HREF="HTMLELEMDESCPTR"
438>htmlElemDescPtr</GTKDOCLINK
439> htmlTagLookup (const <A
Daniel Veillarddd6b3671999-09-23 22:19:22 +0000440HREF="gnome-xml-tree.html#XMLCHAR"
441>xmlChar</A
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000442> *tag);</PRE
443></TD
444></TR
445></TABLE
446><P
447>Lookup the HTML tag in the ElementTable</P
448><P
449></P
450><DIV
451CLASS="INFORMALTABLE"
452><P
453></P
454><TABLE
455BORDER="0"
456WIDTH="100%"
457BGCOLOR="#FFD0D0"
458CELLSPACING="0"
459CELLPADDING="4"
460CLASS="CALSTABLE"
461><TR
462><TD
463WIDTH="20%"
464ALIGN="RIGHT"
465VALIGN="TOP"
466><TT
467CLASS="PARAMETER"
468><I
469>tag</I
470></TT
471>&nbsp;:</TD
472><TD
473WIDTH="80%"
474ALIGN="LEFT"
475VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +0000476>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000477></TR
478><TR
479><TD
480WIDTH="20%"
481ALIGN="RIGHT"
482VALIGN="TOP"
483><I
484CLASS="EMPHASIS"
485>Returns</I
486> :</TD
487><TD
488WIDTH="80%"
489ALIGN="LEFT"
490VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +0000491>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000492></TR
493></TABLE
494><P
495></P
496></DIV
497></DIV
498><HR><DIV
499CLASS="REFSECT2"
500><A
Daniel Veillard71b656e2000-01-05 14:46:17 +0000501NAME="AEN7289"
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000502></A
503><H3
504><A
505NAME="HTMLENTITYLOOKUP"
506></A
507>htmlEntityLookup ()</H3
508><TABLE
509BORDER="0"
510BGCOLOR="#D6E8FF"
511WIDTH="100%"
512CELLPADDING="6"
513><TR
514><TD
515><PRE
516CLASS="PROGRAMLISTING"
517><GTKDOCLINK
518HREF="HTMLENTITYDESCPTR"
519>htmlEntityDescPtr</GTKDOCLINK
520> htmlEntityLookup (const <A
Daniel Veillarddd6b3671999-09-23 22:19:22 +0000521HREF="gnome-xml-tree.html#XMLCHAR"
522>xmlChar</A
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000523> *name);</PRE
524></TD
525></TR
526></TABLE
527><P
528>Lookup the given entity in EntitiesTable</P
529><P
530>TODO: the linear scan is really ugly, a hash table is really needed.</P
531><P
532></P
533><DIV
534CLASS="INFORMALTABLE"
535><P
536></P
537><TABLE
538BORDER="0"
539WIDTH="100%"
540BGCOLOR="#FFD0D0"
541CELLSPACING="0"
542CELLPADDING="4"
543CLASS="CALSTABLE"
544><TR
545><TD
546WIDTH="20%"
547ALIGN="RIGHT"
548VALIGN="TOP"
549><TT
550CLASS="PARAMETER"
551><I
552>name</I
553></TT
554>&nbsp;:</TD
555><TD
556WIDTH="80%"
557ALIGN="LEFT"
558VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +0000559>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000560></TR
561><TR
562><TD
563WIDTH="20%"
564ALIGN="RIGHT"
565VALIGN="TOP"
566><I
567CLASS="EMPHASIS"
568>Returns</I
569> :</TD
570><TD
571WIDTH="80%"
572ALIGN="LEFT"
573VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +0000574>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000575></TR
576></TABLE
577><P
578></P
579></DIV
580></DIV
581><HR><DIV
582CLASS="REFSECT2"
583><A
Daniel Veillard71b656e2000-01-05 14:46:17 +0000584NAME="AEN7311"
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000585></A
586><H3
587><A
588NAME="HTMLPARSEENTITYREF"
589></A
590>htmlParseEntityRef ()</H3
591><TABLE
592BORDER="0"
593BGCOLOR="#D6E8FF"
594WIDTH="100%"
595CELLPADDING="6"
596><TR
597><TD
598><PRE
599CLASS="PROGRAMLISTING"
600><GTKDOCLINK
601HREF="HTMLENTITYDESCPTR"
602>htmlEntityDescPtr</GTKDOCLINK
603> htmlParseEntityRef (<A
604HREF="gnome-xml-htmlparser.html#HTMLPARSERCTXTPTR"
605>htmlParserCtxtPtr</A
606> ctxt,
607 <A
Daniel Veillarddd6b3671999-09-23 22:19:22 +0000608HREF="gnome-xml-tree.html#XMLCHAR"
609>xmlChar</A
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000610> **str);</PRE
611></TD
612></TR
613></TABLE
614><P
615>parse an HTML ENTITY reference</P
616><P
617>[68] EntityRef ::= '&amp;' Name ';'</P
618><P
619></P
620><DIV
621CLASS="INFORMALTABLE"
622><P
623></P
624><TABLE
625BORDER="0"
626WIDTH="100%"
627BGCOLOR="#FFD0D0"
628CELLSPACING="0"
629CELLPADDING="4"
630CLASS="CALSTABLE"
631><TR
632><TD
633WIDTH="20%"
634ALIGN="RIGHT"
635VALIGN="TOP"
636><TT
637CLASS="PARAMETER"
638><I
639>ctxt</I
640></TT
641>&nbsp;:</TD
642><TD
643WIDTH="80%"
644ALIGN="LEFT"
645VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +0000646>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000647></TR
648><TR
649><TD
650WIDTH="20%"
651ALIGN="RIGHT"
652VALIGN="TOP"
653><TT
654CLASS="PARAMETER"
655><I
656>str</I
657></TT
658>&nbsp;:</TD
659><TD
660WIDTH="80%"
661ALIGN="LEFT"
662VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +0000663>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000664></TR
665><TR
666><TD
667WIDTH="20%"
668ALIGN="RIGHT"
669VALIGN="TOP"
670><I
671CLASS="EMPHASIS"
672>Returns</I
673> :</TD
674><TD
675WIDTH="80%"
676ALIGN="LEFT"
677VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +0000678>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000679></TR
680></TABLE
681><P
682></P
683></DIV
684></DIV
685><HR><DIV
686CLASS="REFSECT2"
687><A
Daniel Veillard71b656e2000-01-05 14:46:17 +0000688NAME="AEN7338"
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000689></A
690><H3
691><A
692NAME="HTMLPARSECHARREF"
693></A
694>htmlParseCharRef ()</H3
695><TABLE
696BORDER="0"
697BGCOLOR="#D6E8FF"
698WIDTH="100%"
699CELLPADDING="6"
700><TR
701><TD
702><PRE
703CLASS="PROGRAMLISTING"
704>int htmlParseCharRef (<A
705HREF="gnome-xml-htmlparser.html#HTMLPARSERCTXTPTR"
706>htmlParserCtxtPtr</A
707> ctxt);</PRE
708></TD
709></TR
710></TABLE
711><P
712>parse Reference declarations</P
713><P
714>[66] CharRef ::= '&amp;#' [0-9]+ ';' |
715'&amp;#x' [0-9a-fA-F]+ ';'</P
719><P
720></P
721><DIV
722CLASS="INFORMALTABLE"
723><P
724></P
725><TABLE
726BORDER="0"
727WIDTH="100%"
728BGCOLOR="#FFD0D0"
729CELLSPACING="0"
730CELLPADDING="4"
731CLASS="CALSTABLE"
732><TR
733><TD
734WIDTH="20%"
735ALIGN="RIGHT"
736VALIGN="TOP"
737><TT
738CLASS="PARAMETER"
739><I
740>ctxt</I
741></TT
742>&nbsp;:</TD
743><TD
744WIDTH="80%"
745ALIGN="LEFT"
746VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +0000747>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000748></TR
749><TR
750><TD
751WIDTH="20%"
752ALIGN="RIGHT"
753VALIGN="TOP"
754><I
755CLASS="EMPHASIS"
756>Returns</I
757> :</TD
758><TD
759WIDTH="80%"
760ALIGN="LEFT"
761VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +0000762>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000763></TR
764></TABLE
765><P
766></P
767></DIV
768></DIV
769><HR><DIV
770CLASS="REFSECT2"
771><A
Daniel Veillard71b656e2000-01-05 14:46:17 +0000772NAME="AEN7360"
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000773></A
774><H3
775><A
776NAME="HTMLPARSEELEMENT"
777></A
778>htmlParseElement ()</H3
779><TABLE
780BORDER="0"
781BGCOLOR="#D6E8FF"
782WIDTH="100%"
783CELLPADDING="6"
784><TR
785><TD
786><PRE
787CLASS="PROGRAMLISTING"
788>void htmlParseElement (<A
789HREF="gnome-xml-htmlparser.html#HTMLPARSERCTXTPTR"
790>htmlParserCtxtPtr</A
791> ctxt);</PRE
792></TD
793></TR
794></TABLE
795><P
796>parse an HTML element, this is highly recursive</P
797><P
798>[39] element ::= EmptyElemTag | STag content ETag</P
799><P
800>[41] Attribute ::= Name Eq AttValue</P
801><P
802></P
803><DIV
804CLASS="INFORMALTABLE"
805><P
806></P
807><TABLE
808BORDER="0"
809WIDTH="100%"
810BGCOLOR="#FFD0D0"
811CELLSPACING="0"
812CELLPADDING="4"
813CLASS="CALSTABLE"
814><TR
815><TD
816WIDTH="20%"
817ALIGN="RIGHT"
818VALIGN="TOP"
819><TT
820CLASS="PARAMETER"
821><I
822>ctxt</I
823></TT
824>&nbsp;:</TD
825><TD
826WIDTH="80%"
827ALIGN="LEFT"
828VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +0000829>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000830></TR
831></TABLE
832><P
833></P
834></DIV
835></DIV
836><HR><DIV
837CLASS="REFSECT2"
838><A
Daniel Veillard71b656e2000-01-05 14:46:17 +0000839NAME="AEN7378"
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000840></A
841><H3
842><A
843NAME="HTMLSAXPARSEDOC"
844></A
845>htmlSAXParseDoc ()</H3
846><TABLE
847BORDER="0"
848BGCOLOR="#D6E8FF"
849WIDTH="100%"
850CELLPADDING="6"
851><TR
852><TD
853><PRE
854CLASS="PROGRAMLISTING"
855><A
856HREF="gnome-xml-htmlparser.html#HTMLDOCPTR"
857>htmlDocPtr</A
858> htmlSAXParseDoc (<A
Daniel Veillarddd6b3671999-09-23 22:19:22 +0000859HREF="gnome-xml-tree.html#XMLCHAR"
860>xmlChar</A
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000861> *cur,
862 const char *encoding,
863 <A
864HREF="gnome-xml-htmlparser.html#HTMLSAXHANDLERPTR"
865>htmlSAXHandlerPtr</A
866> sax,
867 void *userData);</PRE
868></TD
869></TR
870></TABLE
871><P
872>parse an HTML in-memory document and build a tree.
873It uses the given SAX function block to handle the parsing callback.
874If sax is NULL, fall back to the default DOM tree building routines.</P
875><P
876></P
877><DIV
878CLASS="INFORMALTABLE"
879><P
880></P
881><TABLE
882BORDER="0"
883WIDTH="100%"
884BGCOLOR="#FFD0D0"
885CELLSPACING="0"
886CELLPADDING="4"
887CLASS="CALSTABLE"
888><TR
889><TD
890WIDTH="20%"
891ALIGN="RIGHT"
892VALIGN="TOP"
893><TT
894CLASS="PARAMETER"
895><I
896>cur</I
897></TT
898>&nbsp;:</TD
899><TD
900WIDTH="80%"
901ALIGN="LEFT"
902VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +0000903>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000904></TR
905><TR
906><TD
907WIDTH="20%"
908ALIGN="RIGHT"
909VALIGN="TOP"
910><TT
911CLASS="PARAMETER"
912><I
913>encoding</I
914></TT
915>&nbsp;:</TD
916><TD
917WIDTH="80%"
918ALIGN="LEFT"
919VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +0000920>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000921></TR
922><TR
923><TD
924WIDTH="20%"
925ALIGN="RIGHT"
926VALIGN="TOP"
927><TT
928CLASS="PARAMETER"
929><I
930>sax</I
931></TT
932>&nbsp;:</TD
933><TD
934WIDTH="80%"
935ALIGN="LEFT"
936VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +0000937>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000938></TR
939><TR
940><TD
941WIDTH="20%"
942ALIGN="RIGHT"
943VALIGN="TOP"
944><TT
945CLASS="PARAMETER"
946><I
947>userData</I
948></TT
949>&nbsp;:</TD
950><TD
951WIDTH="80%"
952ALIGN="LEFT"
953VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +0000954>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000955></TR
956><TR
957><TD
958WIDTH="20%"
959ALIGN="RIGHT"
960VALIGN="TOP"
961><I
962CLASS="EMPHASIS"
963>Returns</I
964> :</TD
965><TD
966WIDTH="80%"
967ALIGN="LEFT"
968VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +0000969>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000970></TR
971></TABLE
972><P
973></P
974></DIV
975></DIV
976><HR><DIV
977CLASS="REFSECT2"
978><A
Daniel Veillard71b656e2000-01-05 14:46:17 +0000979NAME="AEN7412"
Daniel Veillard1566d3a1999-07-15 14:24:29 +0000980></A
981><H3
982><A
983NAME="HTMLPARSEDOC"
984></A
985>htmlParseDoc ()</H3
986><TABLE
987BORDER="0"
988BGCOLOR="#D6E8FF"
989WIDTH="100%"
990CELLPADDING="6"
991><TR
992><TD
993><PRE
994CLASS="PROGRAMLISTING"
995><A
996HREF="gnome-xml-htmlparser.html#HTMLDOCPTR"
997>htmlDocPtr</A
998> htmlParseDoc (<A
Daniel Veillarddd6b3671999-09-23 22:19:22 +0000999HREF="gnome-xml-tree.html#XMLCHAR"
1000>xmlChar</A
Daniel Veillard1566d3a1999-07-15 14:24:29 +00001001> *cur,
1002 const char *encoding);</PRE
1003></TD
1004></TR
1005></TABLE
1006><P
1007>parse an HTML in-memory document and build a tree.</P
1008><P
1009></P
1010><DIV
1011CLASS="INFORMALTABLE"
1012><P
1013></P
1014><TABLE
1015BORDER="0"
1016WIDTH="100%"
1017BGCOLOR="#FFD0D0"
1018CELLSPACING="0"
1019CELLPADDING="4"
1020CLASS="CALSTABLE"
1021><TR
1022><TD
1023WIDTH="20%"
1024ALIGN="RIGHT"
1025VALIGN="TOP"
1026><TT
1027CLASS="PARAMETER"
1028><I
1029>cur</I
1030></TT
1031>&nbsp;:</TD
1032><TD
1033WIDTH="80%"
1034ALIGN="LEFT"
1035VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +00001036>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +00001037></TR
1038><TR
1039><TD
1040WIDTH="20%"
1041ALIGN="RIGHT"
1042VALIGN="TOP"
1043><TT
1044CLASS="PARAMETER"
1045><I
1046>encoding</I
1047></TT
1048>&nbsp;:</TD
1049><TD
1050WIDTH="80%"
1051ALIGN="LEFT"
1052VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +00001053>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +00001054></TR
1055><TR
1056><TD
1057WIDTH="20%"
1058ALIGN="RIGHT"
1059VALIGN="TOP"
1060><I
1061CLASS="EMPHASIS"
1062>Returns</I
1063> :</TD
1064><TD
1065WIDTH="80%"
1066ALIGN="LEFT"
1067VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +00001068>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +00001069></TR
1070></TABLE
1071><P
1072></P
1073></DIV
1074></DIV
1075><HR><DIV
1076CLASS="REFSECT2"
1077><A
Daniel Veillard71b656e2000-01-05 14:46:17 +00001078NAME="AEN7437"
Daniel Veillard1566d3a1999-07-15 14:24:29 +00001079></A
1080><H3
1081><A
1082NAME="HTMLSAXPARSEFILE"
1083></A
1084>htmlSAXParseFile ()</H3
1085><TABLE
1086BORDER="0"
1087BGCOLOR="#D6E8FF"
1088WIDTH="100%"
1089CELLPADDING="6"
1090><TR
1091><TD
1092><PRE
1093CLASS="PROGRAMLISTING"
1094><A
1095HREF="gnome-xml-htmlparser.html#HTMLDOCPTR"
1096>htmlDocPtr</A
1097> htmlSAXParseFile (const char *filename,
1098 const char *encoding,
1099 <A
1100HREF="gnome-xml-htmlparser.html#HTMLSAXHANDLERPTR"
1101>htmlSAXHandlerPtr</A
1102> sax,
1103 void *userData);</PRE
1104></TD
1105></TR
1106></TABLE
1107><P
1108>parse an HTML file and build a tree. Automatic support for ZLIB/Compress
1109compressed document is provided by default if found at compile-time.
1110It uses the given SAX function block to handle the parsing callback.
1111If sax is NULL, fall back to the default DOM tree building routines.</P
1112><P
1113></P
1114><DIV
1115CLASS="INFORMALTABLE"
1116><P
1117></P
1118><TABLE
1119BORDER="0"
1120WIDTH="100%"
1121BGCOLOR="#FFD0D0"
1122CELLSPACING="0"
1123CELLPADDING="4"
1124CLASS="CALSTABLE"
1125><TR
1126><TD
1127WIDTH="20%"
1128ALIGN="RIGHT"
1129VALIGN="TOP"
1130><TT
1131CLASS="PARAMETER"
1132><I
1133>filename</I
1134></TT
1135>&nbsp;:</TD
1136><TD
1137WIDTH="80%"
1138ALIGN="LEFT"
1139VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +00001140>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +00001141></TR
1142><TR
1143><TD
1144WIDTH="20%"
1145ALIGN="RIGHT"
1146VALIGN="TOP"
1147><TT
1148CLASS="PARAMETER"
1149><I
1150>encoding</I
1151></TT
1152>&nbsp;:</TD
1153><TD
1154WIDTH="80%"
1155ALIGN="LEFT"
1156VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +00001157>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +00001158></TR
1159><TR
1160><TD
1161WIDTH="20%"
1162ALIGN="RIGHT"
1163VALIGN="TOP"
1164><TT
1165CLASS="PARAMETER"
1166><I
1167>sax</I
1168></TT
1169>&nbsp;:</TD
1170><TD
1171WIDTH="80%"
1172ALIGN="LEFT"
1173VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +00001174>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +00001175></TR
1176><TR
1177><TD
1178WIDTH="20%"
1179ALIGN="RIGHT"
1180VALIGN="TOP"
1181><TT
1182CLASS="PARAMETER"
1183><I
1184>userData</I
1185></TT
1186>&nbsp;:</TD
1187><TD
1188WIDTH="80%"
1189ALIGN="LEFT"
1190VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +00001191>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +00001192></TR
1193><TR
1194><TD
1195WIDTH="20%"
1196ALIGN="RIGHT"
1197VALIGN="TOP"
1198><I
1199CLASS="EMPHASIS"
1200>Returns</I
1201> :</TD
1202><TD
1203WIDTH="80%"
1204ALIGN="LEFT"
1205VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +00001206>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +00001207></TR
1208></TABLE
1209><P
1210></P
1211></DIV
1212></DIV
1213><HR><DIV
1214CLASS="REFSECT2"
1215><A
Daniel Veillard71b656e2000-01-05 14:46:17 +00001216NAME="AEN7470"
Daniel Veillard1566d3a1999-07-15 14:24:29 +00001217></A
1218><H3
1219><A
1220NAME="HTMLPARSEFILE"
1221></A
1222>htmlParseFile ()</H3
1223><TABLE
1224BORDER="0"
1225BGCOLOR="#D6E8FF"
1226WIDTH="100%"
1227CELLPADDING="6"
1228><TR
1229><TD
1230><PRE
1231CLASS="PROGRAMLISTING"
1232><A
1233HREF="gnome-xml-htmlparser.html#HTMLDOCPTR"
1234>htmlDocPtr</A
1235> htmlParseFile (const char *filename,
1236 const char *encoding);</PRE
1237></TD
1238></TR
1239></TABLE
1240><P
1241>parse an HTML file and build a tree. Automatic support for ZLIB/Compress
1242compressed document is provided by default if found at compile-time.</P
1243><P
1244></P
1245><DIV
1246CLASS="INFORMALTABLE"
1247><P
1248></P
1249><TABLE
1250BORDER="0"
1251WIDTH="100%"
1252BGCOLOR="#FFD0D0"
1253CELLSPACING="0"
1254CELLPADDING="4"
1255CLASS="CALSTABLE"
1256><TR
1257><TD
1258WIDTH="20%"
1259ALIGN="RIGHT"
1260VALIGN="TOP"
1261><TT
1262CLASS="PARAMETER"
1263><I
1264>filename</I
1265></TT
1266>&nbsp;:</TD
1267><TD
1268WIDTH="80%"
1269ALIGN="LEFT"
1270VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +00001271>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +00001272></TR
1273><TR
1274><TD
1275WIDTH="20%"
1276ALIGN="RIGHT"
1277VALIGN="TOP"
1278><TT
1279CLASS="PARAMETER"
1280><I
1281>encoding</I
1282></TT
1283>&nbsp;:</TD
1284><TD
1285WIDTH="80%"
1286ALIGN="LEFT"
1287VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +00001288>&nbsp;</TD
Daniel Veillard1566d3a1999-07-15 14:24:29 +00001289></TR
1290><TR
1291><TD
1292WIDTH="20%"
1293ALIGN="RIGHT"
1294VALIGN="TOP"
1295><I
1296CLASS="EMPHASIS"
1297>Returns</I
1298> :</TD
1299><TD
1300WIDTH="80%"
1301ALIGN="LEFT"
1302VALIGN="TOP"
Daniel Veillard71b656e2000-01-05 14:46:17 +00001303>&nbsp;</TD
Daniel Veillard437b87b2000-01-03 17:30:46 +00001304></TR
1305></TABLE
1306><P
1307></P
1308></DIV
1309></DIV
Daniel Veillard1566d3a1999-07-15 14:24:29 +00001310></DIV
1311><DIV
1312CLASS="NAVFOOTER"
Daniel Veillard00fdf371999-10-08 09:40:39 +00001313><BR
1314CLEAR="all"><BR><TABLE
Daniel Veillard1566d3a1999-07-15 14:24:29 +00001315WIDTH="100%"
1316BORDER="0"
1317BGCOLOR="#000000"
1318CELLPADDING="1"
1319CELLSPACING="0"
1320><TR
1321><TD
1322WIDTH="25%"
1323BGCOLOR="#C00000"
1324ALIGN="left"
1325><A
Daniel Veillard6bd26dc1999-09-03 14:28:40 +00001326HREF="gnome-xml-xml-error.html"
Daniel Veillard1566d3a1999-07-15 14:24:29 +00001327><FONT
1328COLOR="#FFFFFF"
1329SIZE="3"
1330><B
1331>&#60;&#60;&#60; Previous Page</B
1332></FONT
1333></A
1334></TD
1335><TD
1336WIDTH="25%"
1337BGCOLOR="#0000C0"
1338ALIGN="center"
1339><FONT
1340COLOR="#FFFFFF"
1341SIZE="3"
1342><B
1343><A
1344HREF="book1.html"
1345><FONT
1346COLOR="#FFFFFF"
1347SIZE="3"
1348><B
1349>Home</B
1350></FONT
1351></A
1352></B
1353></FONT
1354></TD
1355><TD
1356WIDTH="25%"
1357BGCOLOR="#00C000"
1358ALIGN="center"
1359><FONT
1360COLOR="#FFFFFF"
1361SIZE="3"
1362><B
1363><A
Daniel Veillard35008381999-10-25 13:15:52 +00001364HREF="libxml-lib.html"
Daniel Veillard1566d3a1999-07-15 14:24:29 +00001365><FONT
1366COLOR="#FFFFFF"
1367SIZE="3"
1368><B
1369>Up</B
1370></FONT
1371></A
1372></B
1373></FONT
1374></TD
1375><TD
1376WIDTH="25%"
1377BGCOLOR="#C00000"
1378ALIGN="right"
1379><A
1380HREF="gnome-xml-htmltree.html"
1381><FONT
1382COLOR="#FFFFFF"
1383SIZE="3"
1384><B
1385>Next Page &#62;&#62;&#62;</B
1386></FONT
1387></A
1388></TD
1389></TR
1390><TR
1391><TD
1392COLSPAN="2"
1393ALIGN="left"
1394><FONT
1395COLOR="#FFFFFF"
1396SIZE="3"
1397><B
Daniel Veillard6bd26dc1999-09-03 14:28:40 +00001398>xml-error</B
Daniel Veillard1566d3a1999-07-15 14:24:29 +00001399></FONT
1400></TD
1401><TD
1402COLSPAN="2"
1403ALIGN="right"
1404><FONT
1405COLOR="#FFFFFF"
1406SIZE="3"
1407><B
1408>HTMLtree</B
1409></FONT
1410></TD
1411></TR
1412></TABLE
1413></DIV
1414></BODY
1415></HTML
1416>