/*
 * xmlreader.c: implements the xmlTextReader streaming node API
 *
 * NOTE:
 *   The XmlTextReader.Normalization property won't be supported, since
 *   it makes the parser non-compliant with the XML recommendation.
 *
 * See Copyright for the status of this software.
 *
 * daniel@veillard.com
 */

/*
 * TODOs:
 *   - XML Schemas validation
 */
Daniel Veillarde1ca5032002-12-09 14:13:43 +000017#define IN_LIBXML
18#include "libxml.h"
19
Daniel Veillard81273902003-09-30 00:43:48 +000020#ifdef LIBXML_READER_ENABLED
Daniel Veillarde1ca5032002-12-09 14:13:43 +000021#include <string.h> /* for memset() only ! */
Daniel Veillard26f70262003-01-16 22:45:08 +000022#include <stdarg.h>
Daniel Veillarde1ca5032002-12-09 14:13:43 +000023
24#ifdef HAVE_CTYPE_H
25#include <ctype.h>
26#endif
27#ifdef HAVE_STDLIB_H
28#include <stdlib.h>
29#endif
30
31#include <libxml/xmlmemory.h>
32#include <libxml/xmlIO.h>
33#include <libxml/xmlreader.h>
Daniel Veillardfc8dc352003-10-18 09:07:46 +000034#include <libxml/parserInternals.h>
Daniel Veillardf4e55762003-04-15 23:32:22 +000035#include <libxml/relaxng.h>
Daniel Veillard198c1bf2003-10-20 17:07:41 +000036#include <libxml/uri.h>
Daniel Veillard7899c5c2003-11-03 12:31:38 +000037#ifdef LIBXML_XINCLUDE_ENABLED
38#include <libxml/xinclude.h>
39#endif
Daniel Veillard1e906612003-12-05 14:57:46 +000040#ifdef LIBXML_PATTERN_ENABLED
41#include <libxml/pattern.h>
42#endif
Daniel Veillarde1ca5032002-12-09 14:13:43 +000043
/*
 * Debugging switches, disabled by default:
 *   DEBUG_CALLBACKS makes the SAX wrapper callbacks print a trace line,
 *   DEBUG_READER    compiles xmlTextReaderDebug() and enables DUMP_READER.
 */
/* #define DEBUG_CALLBACKS */
/* #define DEBUG_READER */

/**
 * TODO:
 *
 * Macro flagging an unimplemented block: reports the source file and line
 * through xmlGenericError().  The expansion already ends with a semicolon.
 */
#define TODO								\
    xmlGenericError(xmlGenericErrorContext,				\
	    "Unimplemented block at %s:%d\n",				\
            __FILE__, __LINE__);

/**
 * DUMP_READER:
 *
 * Dumps the state of the variable named "reader" when DEBUG_READER is
 * defined, expands to nothing otherwise.
 */
#ifdef DEBUG_READER
#define DUMP_READER xmlTextReaderDebug(reader);
#else
#define DUMP_READER
#endif

/* Number of bytes handed to xmlParseChunk() per step in xmlTextReaderPushData() */
#define CHUNK_SIZE 512
/************************************************************************
 *									*
 *	The parser: maps the Text Reader API on top of the existing	*
 *	parsing routines building a tree				*
 *									*
 ************************************************************************/

/*
 * NOTE(review): these look like bit flags for the "allocs" field of the
 * reader (which structures it allocated) -- confirm at the use sites.
 */
#define XML_TEXTREADER_INPUT	1
#define XML_TEXTREADER_CTXT	2

/*
 * Internal state of the reader.  XML_TEXTREADER_NONE is the sentinel used
 * while pushing data; XML_TEXTREADER_ELEMENT is set by the start-element
 * SAX wrappers.
 */
typedef enum {
    XML_TEXTREADER_NONE      = -1,
    XML_TEXTREADER_START     = 0,
    XML_TEXTREADER_ELEMENT   = 1,
    XML_TEXTREADER_END       = 2,
    XML_TEXTREADER_EMPTY     = 3,
    XML_TEXTREADER_BACKTRACK = 4,
    XML_TEXTREADER_DONE      = 5,
    XML_TEXTREADER_ERROR     = 6
} xmlTextReaderState;

/* Kind of validation performed while reading, if any. */
typedef enum {
    XML_TEXTREADER_NOT_VALIDATE = 0,
    XML_TEXTREADER_VALIDATE_DTD = 1,
    XML_TEXTREADER_VALIDATE_RNG = 2
} xmlTextReaderValidate;

Daniel Veillarde1ca5032002-12-09 14:13:43 +000091struct _xmlTextReader {
92 int mode; /* the parsing mode */
Daniel Veillard198c1bf2003-10-20 17:07:41 +000093 xmlDocPtr doc; /* when walking an existing doc */
Daniel Veillardf4e55762003-04-15 23:32:22 +000094 xmlTextReaderValidate validate;/* is there any validation */
Daniel Veillarde1ca5032002-12-09 14:13:43 +000095 int allocs; /* what structure were deallocated */
96 xmlTextReaderState state;
97 xmlParserCtxtPtr ctxt; /* the parser context */
98 xmlSAXHandlerPtr sax; /* the parser SAX callbacks */
99 xmlParserInputBufferPtr input; /* the input */
100 startElementSAXFunc startElement;/* initial SAX callbacks */
101 endElementSAXFunc endElement; /* idem */
Daniel Veillard07cb8222003-09-10 10:51:05 +0000102 startElementNsSAX2Func startElementNs;/* idem */
Daniel Veillard9ee35f32003-09-28 00:19:54 +0000103 endElementNsSAX2Func endElementNs; /* idem */
Daniel Veillardea7751d2002-12-20 00:16:24 +0000104 charactersSAXFunc characters;
105 cdataBlockSAXFunc cdataBlock;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000106 unsigned int base; /* base of the segment in the input */
107 unsigned int cur; /* current position in the input */
108 xmlNodePtr node; /* current node */
Daniel Veillardda46d2d2002-12-15 23:36:49 +0000109 xmlNodePtr curnode;/* current attribute node */
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000110 int depth; /* depth of the current node */
Daniel Veillardbeb70bd2002-12-18 14:53:54 +0000111 xmlNodePtr faketext;/* fake xmlNs chld */
Daniel Veillard9ee35f32003-09-28 00:19:54 +0000112 int preserve;/* preserve the resulting document */
Daniel Veillard198c1bf2003-10-20 17:07:41 +0000113 xmlBufferPtr buffer; /* used to return const xmlChar * */
114 xmlDictPtr dict; /* the context dictionnary */
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000115
116 /* entity stack when traversing entities content */
117 xmlNodePtr ent; /* Current Entity Ref Node */
118 int entNr; /* Depth of the entities stack */
119 int entMax; /* Max depth of the entities stack */
120 xmlNodePtr *entTab; /* array of entities */
Daniel Veillard26f70262003-01-16 22:45:08 +0000121
122 /* error handling */
123 xmlTextReaderErrorFunc errorFunc; /* callback function */
124 void *errorFuncArg; /* callback function user argument */
Daniel Veillardf4e55762003-04-15 23:32:22 +0000125
126#ifdef LIBXML_SCHEMAS_ENABLED
127 /* Handling of RelaxNG validation */
Daniel Veillard7899c5c2003-11-03 12:31:38 +0000128 xmlRelaxNGPtr rngSchemas; /* The Relax NG schemas */
129 xmlRelaxNGValidCtxtPtr rngValidCtxt;/* The Relax NG validation context */
130 int rngValidErrors;/* The number of errors detected */
131 xmlNodePtr rngFullNode; /* the node if RNG not progressive */
132#endif
133#ifdef LIBXML_XINCLUDE_ENABLED
134 /* Handling of XInclude processing */
135 int xinclude; /* is xinclude asked for */
136 const xmlChar * xinclude_name; /* the xinclude name from dict */
137 xmlXIncludeCtxtPtr xincctxt; /* the xinclude context */
138 int in_xinclude; /* counts for xinclude */
Daniel Veillardf4e55762003-04-15 23:32:22 +0000139#endif
Daniel Veillard1e906612003-12-05 14:57:46 +0000140#ifdef LIBXML_PATTERN_ENABLED
141 int patternNr; /* number of preserve patterns */
142 int patternMax; /* max preserve patterns */
143 xmlPatternPtr *patternTab; /* array of preserve patterns */
144#endif
145 int preserves; /* level of preserves */
Daniel Veillarde74d2e12003-12-09 11:35:37 +0000146 int parserFlags; /* the set of options set */
William M. Brack93d004f2004-02-03 00:14:10 +0000147 /* Structured error handling */
148 xmlStructuredErrorFunc sErrorFunc; /* callback function */
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000149};
150
Daniel Veillarde8039df2003-10-27 11:25:13 +0000151#define NODE_IS_EMPTY 0x1
152#define NODE_IS_PRESERVED 0x2
Daniel Veillard1e906612003-12-05 14:57:46 +0000153#define NODE_IS_SPRESERVED 0x4
Daniel Veillard067bae52003-01-05 01:27:54 +0000154
Daniel Veillarde72c5082003-09-19 12:44:05 +0000155/**
156 * CONSTSTR:
157 *
158 * Macro used to return an interned string
159 */
Daniel Veillard198c1bf2003-10-20 17:07:41 +0000160#define CONSTSTR(str) xmlDictLookup(reader->dict, (str), -1)
161#define CONSTQSTR(p, str) xmlDictQLookup(reader->dict, (p), (str))
162
163static int xmlTextReaderReadTree(xmlTextReaderPtr reader);
164static int xmlTextReaderNextTree(xmlTextReaderPtr reader);
Daniel Veillarde72c5082003-09-19 12:44:05 +0000165
Daniel Veillard9f7eb0b2003-09-17 10:26:25 +0000166/************************************************************************
167 * *
Daniel Veillard9ee35f32003-09-28 00:19:54 +0000168 * Our own version of the freeing routines as we recycle nodes *
169 * *
170 ************************************************************************/
171/**
172 * DICT_FREE:
173 * @str: a string
174 *
175 * Free a string if it is not owned by the "dict" dictionnary in the
176 * current scope
177 */
178#define DICT_FREE(str) \
179 if ((str) && ((!dict) || \
180 (xmlDictOwns(dict, (const xmlChar *)(str)) == 0))) \
181 xmlFree((char *)(str));
182
183static void xmlTextReaderFreeNode(xmlTextReaderPtr reader, xmlNodePtr cur);
184static void xmlTextReaderFreeNodeList(xmlTextReaderPtr reader, xmlNodePtr cur);
185
186/**
Daniel Veillard8d7b5c72003-11-15 18:24:36 +0000187 * xmlFreeID:
188 * @not: A id
189 *
190 * Deallocate the memory used by an id definition
191 */
192static void
193xmlFreeID(xmlIDPtr id) {
194 xmlDictPtr dict = NULL;
195
196 if (id == NULL) return;
197
198 if (id->doc != NULL)
199 dict = id->doc->dict;
200
201 if (id->value != NULL)
202 DICT_FREE(id->value)
203 xmlFree(id);
204}
205
206/**
207 * xmlTextReaderRemoveID:
208 * @doc: the document
209 * @attr: the attribute
210 *
211 * Remove the given attribute from the ID table maintained internally.
212 *
213 * Returns -1 if the lookup failed and 0 otherwise
214 */
215static int
216xmlTextReaderRemoveID(xmlDocPtr doc, xmlAttrPtr attr) {
217 xmlIDTablePtr table;
218 xmlIDPtr id;
219 xmlChar *ID;
220
221 if (doc == NULL) return(-1);
222 if (attr == NULL) return(-1);
223 table = (xmlIDTablePtr) doc->ids;
224 if (table == NULL)
225 return(-1);
226
227 if (attr == NULL)
228 return(-1);
229 ID = xmlNodeListGetString(doc, attr->children, 1);
230 if (ID == NULL)
231 return(-1);
232 id = xmlHashLookup(table, ID);
233 xmlFree(ID);
234 if (id == NULL || id->attr != attr) {
235 return(-1);
236 }
237 id->name = attr->name;
238 id->attr = NULL;
239 return(0);
240}
241
242/**
Daniel Veillard9ee35f32003-09-28 00:19:54 +0000243 * xmlTextReaderFreeProp:
244 * @reader: the xmlTextReaderPtr used
245 * @cur: the node
246 *
247 * Free a node.
248 */
249static void
250xmlTextReaderFreeProp(xmlTextReaderPtr reader, xmlAttrPtr cur) {
251 xmlDictPtr dict;
252
253 dict = reader->ctxt->dict;
254 if (cur == NULL) return;
255
Daniel Veillarda2d51fc2004-04-30 22:25:59 +0000256 if ((__xmlRegisterCallbacks) && (xmlDeregisterNodeDefaultValue))
257 xmlDeregisterNodeDefaultValue((xmlNodePtr) cur);
258
Daniel Veillard9ee35f32003-09-28 00:19:54 +0000259 /* Check for ID removal -> leading to invalid references ! */
260 if ((cur->parent != NULL) && (cur->parent->doc != NULL) &&
261 ((cur->parent->doc->intSubset != NULL) ||
262 (cur->parent->doc->extSubset != NULL))) {
263 if (xmlIsID(cur->parent->doc, cur->parent, cur))
Daniel Veillard8d7b5c72003-11-15 18:24:36 +0000264 xmlTextReaderRemoveID(cur->parent->doc, cur);
Daniel Veillard9ee35f32003-09-28 00:19:54 +0000265 }
266 if (cur->children != NULL)
267 xmlTextReaderFreeNodeList(reader, cur->children);
268
269 DICT_FREE(cur->name);
270 if ((reader != NULL) && (reader->ctxt != NULL) &&
271 (reader->ctxt->freeAttrsNr < 100)) {
272 cur->next = reader->ctxt->freeAttrs;
273 reader->ctxt->freeAttrs = cur;
274 reader->ctxt->freeAttrsNr++;
275 } else {
276 xmlFree(cur);
277 }
278}
279
280/**
281 * xmlTextReaderFreePropList:
282 * @reader: the xmlTextReaderPtr used
283 * @cur: the first property in the list
284 *
285 * Free a property and all its siblings, all the children are freed too.
286 */
287static void
288xmlTextReaderFreePropList(xmlTextReaderPtr reader, xmlAttrPtr cur) {
289 xmlAttrPtr next;
290 if (cur == NULL) return;
291 while (cur != NULL) {
292 next = cur->next;
293 xmlTextReaderFreeProp(reader, cur);
294 cur = next;
295 }
296}
297
298/**
299 * xmlTextReaderFreeNodeList:
300 * @reader: the xmlTextReaderPtr used
301 * @cur: the first node in the list
302 *
303 * Free a node and all its siblings, this is a recursive behaviour, all
304 * the children are freed too.
305 */
306static void
307xmlTextReaderFreeNodeList(xmlTextReaderPtr reader, xmlNodePtr cur) {
308 xmlNodePtr next;
309 xmlDictPtr dict;
310
311 dict = reader->ctxt->dict;
312 if (cur == NULL) return;
313 if (cur->type == XML_NAMESPACE_DECL) {
314 xmlFreeNsList((xmlNsPtr) cur);
315 return;
316 }
317 if ((cur->type == XML_DOCUMENT_NODE) ||
318 (cur->type == XML_HTML_DOCUMENT_NODE)) {
319 xmlFreeDoc((xmlDocPtr) cur);
320 return;
321 }
322 while (cur != NULL) {
323 next = cur->next;
324 /* unroll to speed up freeing the document */
325 if (cur->type != XML_DTD_NODE) {
326
327 if ((cur->children != NULL) &&
Daniel Veillard1d211e22003-10-20 22:32:39 +0000328 (cur->type != XML_ENTITY_REF_NODE)) {
329 if (cur->children->parent == cur)
330 xmlTextReaderFreeNodeList(reader, cur->children);
331 cur->children = NULL;
332 }
Daniel Veillarda2d51fc2004-04-30 22:25:59 +0000333
334 if ((__xmlRegisterCallbacks) && (xmlDeregisterNodeDefaultValue))
335 xmlDeregisterNodeDefaultValue(cur);
336
Daniel Veillard9ee35f32003-09-28 00:19:54 +0000337 if (((cur->type == XML_ELEMENT_NODE) ||
338 (cur->type == XML_XINCLUDE_START) ||
339 (cur->type == XML_XINCLUDE_END)) &&
340 (cur->properties != NULL))
341 xmlTextReaderFreePropList(reader, cur->properties);
342 if ((cur->type != XML_ELEMENT_NODE) &&
343 (cur->type != XML_XINCLUDE_START) &&
344 (cur->type != XML_XINCLUDE_END) &&
345 (cur->type != XML_ENTITY_REF_NODE)) {
346 DICT_FREE(cur->content);
347 }
348 if (((cur->type == XML_ELEMENT_NODE) ||
349 (cur->type == XML_XINCLUDE_START) ||
350 (cur->type == XML_XINCLUDE_END)) &&
351 (cur->nsDef != NULL))
352 xmlFreeNsList(cur->nsDef);
353
354 /*
355 * we don't free element names here they are interned now
356 */
357 if ((cur->type != XML_TEXT_NODE) &&
358 (cur->type != XML_COMMENT_NODE))
359 DICT_FREE(cur->name);
360 if (((cur->type == XML_ELEMENT_NODE) ||
361 (cur->type == XML_TEXT_NODE)) &&
362 (reader != NULL) && (reader->ctxt != NULL) &&
363 (reader->ctxt->freeElemsNr < 100)) {
364 cur->next = reader->ctxt->freeElems;
365 reader->ctxt->freeElems = cur;
366 reader->ctxt->freeElemsNr++;
367 } else {
368 xmlFree(cur);
369 }
370 }
371 cur = next;
372 }
373}
374
375/**
376 * xmlTextReaderFreeNode:
377 * @reader: the xmlTextReaderPtr used
378 * @cur: the node
379 *
380 * Free a node, this is a recursive behaviour, all the children are freed too.
381 * This doesn't unlink the child from the list, use xmlUnlinkNode() first.
382 */
383static void
384xmlTextReaderFreeNode(xmlTextReaderPtr reader, xmlNodePtr cur) {
385 xmlDictPtr dict;
386
387 dict = reader->ctxt->dict;
388 if (cur->type == XML_DTD_NODE) {
389 xmlFreeDtd((xmlDtdPtr) cur);
390 return;
391 }
392 if (cur->type == XML_NAMESPACE_DECL) {
393 xmlFreeNs((xmlNsPtr) cur);
394 return;
395 }
396 if (cur->type == XML_ATTRIBUTE_NODE) {
397 xmlTextReaderFreeProp(reader, (xmlAttrPtr) cur);
398 return;
399 }
400
401 if ((cur->children != NULL) &&
Daniel Veillard1d211e22003-10-20 22:32:39 +0000402 (cur->type != XML_ENTITY_REF_NODE)) {
403 if (cur->children->parent == cur)
404 xmlTextReaderFreeNodeList(reader, cur->children);
405 cur->children = NULL;
406 }
Daniel Veillarda2d51fc2004-04-30 22:25:59 +0000407
408 if ((__xmlRegisterCallbacks) && (xmlDeregisterNodeDefaultValue))
409 xmlDeregisterNodeDefaultValue(cur);
410
Daniel Veillard9ee35f32003-09-28 00:19:54 +0000411 if (((cur->type == XML_ELEMENT_NODE) ||
412 (cur->type == XML_XINCLUDE_START) ||
413 (cur->type == XML_XINCLUDE_END)) &&
414 (cur->properties != NULL))
415 xmlTextReaderFreePropList(reader, cur->properties);
416 if ((cur->type != XML_ELEMENT_NODE) &&
417 (cur->type != XML_XINCLUDE_START) &&
418 (cur->type != XML_XINCLUDE_END) &&
419 (cur->type != XML_ENTITY_REF_NODE)) {
420 DICT_FREE(cur->content);
421 }
422 if (((cur->type == XML_ELEMENT_NODE) ||
423 (cur->type == XML_XINCLUDE_START) ||
424 (cur->type == XML_XINCLUDE_END)) &&
425 (cur->nsDef != NULL))
426 xmlFreeNsList(cur->nsDef);
427
428 /*
429 * we don't free names here they are interned now
430 */
431 if ((cur->type != XML_TEXT_NODE) &&
432 (cur->type != XML_COMMENT_NODE))
433 DICT_FREE(cur->name);
Daniel Veillarda2d51fc2004-04-30 22:25:59 +0000434
Daniel Veillard9ee35f32003-09-28 00:19:54 +0000435 if (((cur->type == XML_ELEMENT_NODE) ||
436 (cur->type == XML_TEXT_NODE)) &&
437 (reader != NULL) && (reader->ctxt != NULL) &&
438 (reader->ctxt->freeElemsNr < 100)) {
439 cur->next = reader->ctxt->freeElems;
440 reader->ctxt->freeElems = cur;
441 reader->ctxt->freeElemsNr++;
442 } else {
443 xmlFree(cur);
444 }
445}
446
447/**
Daniel Veillard8d7b5c72003-11-15 18:24:36 +0000448 * xmlTextReaderFreeIDTable:
449 * @table: An id table
450 *
451 * Deallocate the memory used by an ID hash table.
452 */
William M. Brack60f394e2003-11-16 06:25:42 +0000453static void
Daniel Veillard8d7b5c72003-11-15 18:24:36 +0000454xmlTextReaderFreeIDTable(xmlIDTablePtr table) {
455 xmlHashFree(table, (xmlHashDeallocator) xmlFreeID);
456}
457
458/**
Daniel Veillard9ee35f32003-09-28 00:19:54 +0000459 * xmlTextReaderFreeDoc:
460 * @reader: the xmlTextReaderPtr used
461 * @cur: pointer to the document
462 *
463 * Free up all the structures used by a document, tree included.
464 */
465static void
466xmlTextReaderFreeDoc(xmlTextReaderPtr reader, xmlDocPtr cur) {
467 xmlDtdPtr extSubset, intSubset;
468
469 if (cur == NULL) return;
470
Daniel Veillarda2d51fc2004-04-30 22:25:59 +0000471 if ((__xmlRegisterCallbacks) && (xmlDeregisterNodeDefaultValue))
472 xmlDeregisterNodeDefaultValue((xmlNodePtr) cur);
473
Daniel Veillard9ee35f32003-09-28 00:19:54 +0000474 /*
475 * Do this before freeing the children list to avoid ID lookups
476 */
Daniel Veillard8d7b5c72003-11-15 18:24:36 +0000477 if (cur->ids != NULL) xmlTextReaderFreeIDTable((xmlIDTablePtr) cur->ids);
Daniel Veillard9ee35f32003-09-28 00:19:54 +0000478 cur->ids = NULL;
479 if (cur->refs != NULL) xmlFreeRefTable((xmlRefTablePtr) cur->refs);
480 cur->refs = NULL;
481 extSubset = cur->extSubset;
482 intSubset = cur->intSubset;
483 if (intSubset == extSubset)
484 extSubset = NULL;
485 if (extSubset != NULL) {
486 xmlUnlinkNode((xmlNodePtr) cur->extSubset);
487 cur->extSubset = NULL;
488 xmlFreeDtd(extSubset);
489 }
490 if (intSubset != NULL) {
491 xmlUnlinkNode((xmlNodePtr) cur->intSubset);
492 cur->intSubset = NULL;
493 xmlFreeDtd(intSubset);
494 }
495
496 if (cur->children != NULL) xmlTextReaderFreeNodeList(reader, cur->children);
497
498 if (cur->version != NULL) xmlFree((char *) cur->version);
499 if (cur->name != NULL) xmlFree((char *) cur->name);
500 if (cur->encoding != NULL) xmlFree((char *) cur->encoding);
501 if (cur->oldNs != NULL) xmlFreeNsList(cur->oldNs);
502 if (cur->URL != NULL) xmlFree((char *) cur->URL);
Daniel Veillard500a1de2004-03-22 15:22:58 +0000503 if (cur->dict != NULL) xmlDictFree(cur->dict);
Daniel Veillarda2d51fc2004-04-30 22:25:59 +0000504
Daniel Veillard9ee35f32003-09-28 00:19:54 +0000505 xmlFree(cur);
506}
507
/************************************************************************
 *									*
 *			The reader core parser				*
 *									*
 ************************************************************************/
#ifdef DEBUG_READER
/**
 * xmlTextReaderDebug:
 * @reader:  the xmlTextReaderPtr used, may be NULL
 *
 * Debugging helper, only compiled when DEBUG_READER is defined: prints
 * the reader state, depth, current node name and input position on stderr,
 * followed by the not yet consumed input when LIBXML_DEBUG_ENABLED is set.
 */
static void
xmlTextReaderDebug(xmlTextReaderPtr reader) {
    if ((reader == NULL) || (reader->ctxt == NULL)) {
        fprintf(stderr, "xmlTextReader NULL\n");
        return;
    }
    fprintf(stderr, "xmlTextReader: state %d depth %d ",
            (int) reader->state, reader->depth);
    if (reader->node == NULL) {
        fprintf(stderr, "node = NULL\n");
    } else {
        fprintf(stderr, "node %s\n", (const char *) reader->node->name);
    }
    /* base and cur are unsigned int, so they are printed with %u */
    fprintf(stderr, "  input: base %u, cur %u, depth %d: ",
            reader->base, reader->cur, reader->ctxt->nodeNr);
    /* a reader without input has no buffer to dump either */
    if ((reader->input == NULL) || (reader->input->buffer == NULL)) {
        fprintf(stderr, "buffer is NULL\n");
    } else {
#ifdef LIBXML_DEBUG_ENABLED
        xmlDebugDumpString(stderr,
                &reader->input->buffer->content[reader->cur]);
#endif
        fprintf(stderr, "\n");
    }
}
#endif

541/**
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000542 * xmlTextReaderEntPush:
543 * @reader: the xmlTextReaderPtr used
544 * @value: the entity reference node
545 *
546 * Pushes a new entity reference node on top of the entities stack
547 *
548 * Returns 0 in case of error, the index in the stack otherwise
549 */
550static int
551xmlTextReaderEntPush(xmlTextReaderPtr reader, xmlNodePtr value)
552{
553 if (reader->entMax <= 0) {
554 reader->entMax = 10;
555 reader->entTab = (xmlNodePtr *) xmlMalloc(reader->entMax *
556 sizeof(reader->entTab[0]));
557 if (reader->entTab == NULL) {
558 xmlGenericError(xmlGenericErrorContext, "xmlMalloc failed !\n");
559 return (0);
560 }
561 }
562 if (reader->entNr >= reader->entMax) {
563 reader->entMax *= 2;
564 reader->entTab =
565 (xmlNodePtr *) xmlRealloc(reader->entTab,
566 reader->entMax *
567 sizeof(reader->entTab[0]));
568 if (reader->entTab == NULL) {
569 xmlGenericError(xmlGenericErrorContext, "xmlRealloc failed !\n");
570 return (0);
571 }
572 }
573 reader->entTab[reader->entNr] = value;
574 reader->ent = value;
575 return (reader->entNr++);
576}
577
578/**
579 * xmlTextReaderEntPop:
580 * @reader: the xmlTextReaderPtr used
581 *
582 * Pops the top element entity from the entities stack
583 *
584 * Returns the entity just removed
585 */
586static xmlNodePtr
587xmlTextReaderEntPop(xmlTextReaderPtr reader)
588{
589 xmlNodePtr ret;
590
591 if (reader->entNr <= 0)
592 return (0);
593 reader->entNr--;
594 if (reader->entNr > 0)
595 reader->ent = reader->entTab[reader->entNr - 1];
596 else
597 reader->ent = NULL;
598 ret = reader->entTab[reader->entNr];
599 reader->entTab[reader->entNr] = 0;
600 return (ret);
601}
602
603/**
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000604 * xmlTextReaderStartElement:
605 * @ctx: the user data (XML parser context)
606 * @fullname: The element name, including namespace prefix
607 * @atts: An array of name/value attributes pairs, NULL terminated
608 *
609 * called when an opening tag has been processed.
610 */
611static void
612xmlTextReaderStartElement(void *ctx, const xmlChar *fullname,
613 const xmlChar **atts) {
614 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
615 xmlTextReaderPtr reader = ctxt->_private;
616
617#ifdef DEBUG_CALLBACKS
618 printf("xmlTextReaderStartElement(%s)\n", fullname);
619#endif
Daniel Veillardea7751d2002-12-20 00:16:24 +0000620 if ((reader != NULL) && (reader->startElement != NULL)) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000621 reader->startElement(ctx, fullname, atts);
Daniel Veillard067bae52003-01-05 01:27:54 +0000622 if ((ctxt->node != NULL) && (ctxt->input != NULL) &&
623 (ctxt->input->cur != NULL) && (ctxt->input->cur[0] == '/') &&
624 (ctxt->input->cur[1] == '>'))
Daniel Veillarde8039df2003-10-27 11:25:13 +0000625 ctxt->node->extra = NODE_IS_EMPTY;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000626 }
Daniel Veillard9e395c22003-01-01 14:50:44 +0000627 if (reader != NULL)
628 reader->state = XML_TEXTREADER_ELEMENT;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000629}
630
631/**
632 * xmlTextReaderEndElement:
633 * @ctx: the user data (XML parser context)
634 * @fullname: The element name, including namespace prefix
635 *
636 * called when an ending tag has been processed.
637 */
638static void
639xmlTextReaderEndElement(void *ctx, const xmlChar *fullname) {
640 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
641 xmlTextReaderPtr reader = ctxt->_private;
642
643#ifdef DEBUG_CALLBACKS
644 printf("xmlTextReaderEndElement(%s)\n", fullname);
645#endif
Daniel Veillardea7751d2002-12-20 00:16:24 +0000646 if ((reader != NULL) && (reader->endElement != NULL)) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000647 reader->endElement(ctx, fullname);
Daniel Veillardea7751d2002-12-20 00:16:24 +0000648 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000649}
650
651/**
Daniel Veillard07cb8222003-09-10 10:51:05 +0000652 * xmlTextReaderStartElementNs:
653 * @ctx: the user data (XML parser context)
654 * @localname: the local name of the element
655 * @prefix: the element namespace prefix if available
656 * @URI: the element namespace name if available
657 * @nb_namespaces: number of namespace definitions on that node
658 * @namespaces: pointer to the array of prefix/URI pairs namespace definitions
659 * @nb_attributes: the number of attributes on that node
660 * nb_defaulted: the number of defaulted attributes.
661 * @attributes: pointer to the array of (localname/prefix/URI/value/end)
662 * attribute values.
663 *
664 * called when an opening tag has been processed.
665 */
666static void
667xmlTextReaderStartElementNs(void *ctx,
668 const xmlChar *localname,
669 const xmlChar *prefix,
670 const xmlChar *URI,
671 int nb_namespaces,
672 const xmlChar **namespaces,
673 int nb_attributes,
674 int nb_defaulted,
675 const xmlChar **attributes)
676{
677 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
678 xmlTextReaderPtr reader = ctxt->_private;
679
680#ifdef DEBUG_CALLBACKS
Daniel Veillard198c1bf2003-10-20 17:07:41 +0000681 printf("xmlTextReaderStartElementNs(%s)\n", localname);
Daniel Veillard07cb8222003-09-10 10:51:05 +0000682#endif
683 if ((reader != NULL) && (reader->startElementNs != NULL)) {
684 reader->startElementNs(ctx, localname, prefix, URI, nb_namespaces,
685 namespaces, nb_attributes, nb_defaulted,
686 attributes);
687 if ((ctxt->node != NULL) && (ctxt->input != NULL) &&
688 (ctxt->input->cur != NULL) && (ctxt->input->cur[0] == '/') &&
689 (ctxt->input->cur[1] == '>'))
Daniel Veillarde8039df2003-10-27 11:25:13 +0000690 ctxt->node->extra = NODE_IS_EMPTY;
Daniel Veillard07cb8222003-09-10 10:51:05 +0000691 }
692 if (reader != NULL)
693 reader->state = XML_TEXTREADER_ELEMENT;
694}
695
696/**
697 * xmlTextReaderEndElementNs:
698 * @ctx: the user data (XML parser context)
699 * @localname: the local name of the element
700 * @prefix: the element namespace prefix if available
701 * @URI: the element namespace name if available
702 *
703 * called when an ending tag has been processed.
704 */
705static void
706xmlTextReaderEndElementNs(void *ctx,
707 const xmlChar * localname,
708 const xmlChar * prefix,
709 const xmlChar * URI)
710{
711 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
712 xmlTextReaderPtr reader = ctxt->_private;
713
714#ifdef DEBUG_CALLBACKS
Daniel Veillard198c1bf2003-10-20 17:07:41 +0000715 printf("xmlTextReaderEndElementNs(%s)\n", localname);
Daniel Veillard07cb8222003-09-10 10:51:05 +0000716#endif
717 if ((reader != NULL) && (reader->endElementNs != NULL)) {
718 reader->endElementNs(ctx, localname, prefix, URI);
719 }
720}
721
722
723/**
Daniel Veillardea7751d2002-12-20 00:16:24 +0000724 * xmlTextReaderCharacters:
725 * @ctx: the user data (XML parser context)
726 * @ch: a xmlChar string
727 * @len: the number of xmlChar
728 *
729 * receiving some chars from the parser.
730 */
731static void
732xmlTextReaderCharacters(void *ctx, const xmlChar *ch, int len)
733{
734 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
735 xmlTextReaderPtr reader = ctxt->_private;
736
737#ifdef DEBUG_CALLBACKS
738 printf("xmlTextReaderCharacters()\n");
739#endif
740 if ((reader != NULL) && (reader->characters != NULL)) {
741 reader->characters(ctx, ch, len);
Daniel Veillardea7751d2002-12-20 00:16:24 +0000742 }
743}
744
745/**
746 * xmlTextReaderCDataBlock:
747 * @ctx: the user data (XML parser context)
748 * @value: The pcdata content
749 * @len: the block length
750 *
751 * called when a pcdata block has been parsed
752 */
753static void
754xmlTextReaderCDataBlock(void *ctx, const xmlChar *ch, int len)
755{
756 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
757 xmlTextReaderPtr reader = ctxt->_private;
758
759#ifdef DEBUG_CALLBACKS
760 printf("xmlTextReaderCDataBlock()\n");
761#endif
762 if ((reader != NULL) && (reader->cdataBlock != NULL)) {
763 reader->cdataBlock(ctx, ch, len);
Daniel Veillardea7751d2002-12-20 00:16:24 +0000764 }
765}
766
767/**
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000768 * xmlTextReaderPushData:
769 * @reader: the xmlTextReaderPtr used
770 *
771 * Push data down the progressive parser until a significant callback
772 * got raised.
773 *
774 * Returns -1 in case of failure, 0 otherwise
775 */
776static int
777xmlTextReaderPushData(xmlTextReaderPtr reader) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000778 xmlBufferPtr inbuf;
Daniel Veillarda880b122003-04-21 21:36:41 +0000779 int val, s;
William M. Brack779af002003-08-01 15:55:39 +0000780 xmlTextReaderState oldstate;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000781
782 if ((reader->input == NULL) || (reader->input->buffer == NULL))
783 return(-1);
784
Daniel Veillardea7751d2002-12-20 00:16:24 +0000785 oldstate = reader->state;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000786 reader->state = XML_TEXTREADER_NONE;
787 inbuf = reader->input->buffer;
Daniel Veillarda880b122003-04-21 21:36:41 +0000788
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000789 while (reader->state == XML_TEXTREADER_NONE) {
Daniel Veillarda880b122003-04-21 21:36:41 +0000790 if (inbuf->use < reader->cur + CHUNK_SIZE) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000791 /*
792 * Refill the buffer unless we are at the end of the stream
793 */
794 if (reader->mode != XML_TEXTREADER_MODE_EOF) {
795 val = xmlParserInputBufferRead(reader->input, 4096);
Daniel Veillard53350552003-09-18 13:35:51 +0000796 if ((val == 0) &&
797 (inbuf->alloc == XML_BUFFER_ALLOC_IMMUTABLE)) {
798 if (inbuf->use == reader->cur) {
799 reader->mode = XML_TEXTREADER_MODE_EOF;
800 reader->state = oldstate;
Daniel Veillard53350552003-09-18 13:35:51 +0000801 }
802 } else if (val < 0) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000803 reader->mode = XML_TEXTREADER_MODE_EOF;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000804 reader->state = oldstate;
Daniel Veillardaaa105b2002-12-30 11:42:17 +0000805 if ((oldstate != XML_TEXTREADER_START) ||
806 (reader->ctxt->myDoc != NULL))
807 return(val);
Daniel Veillard53350552003-09-18 13:35:51 +0000808 } else if (val == 0) {
809 /* mark the end of the stream and process the remains */
810 reader->mode = XML_TEXTREADER_MODE_EOF;
811 break;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000812 }
Daniel Veillarda880b122003-04-21 21:36:41 +0000813
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000814 } else
815 break;
816 }
Daniel Veillard067bae52003-01-05 01:27:54 +0000817 /*
Daniel Veillarda880b122003-04-21 21:36:41 +0000818 * parse by block of CHUNK_SIZE bytes, various tests show that
819 * it's the best tradeoff at least on a 1.2GH Duron
Daniel Veillard067bae52003-01-05 01:27:54 +0000820 */
Daniel Veillarda880b122003-04-21 21:36:41 +0000821 if (inbuf->use >= reader->cur + CHUNK_SIZE) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000822 val = xmlParseChunk(reader->ctxt,
823 (const char *) &inbuf->content[reader->cur],
Daniel Veillarda880b122003-04-21 21:36:41 +0000824 CHUNK_SIZE, 0);
825 reader->cur += CHUNK_SIZE;
William M. Brack9f797ab2004-07-28 07:40:12 +0000826 if ((val != 0) || (reader->ctxt->wellFormed == 0))
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000827 return(-1);
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000828 } else {
Daniel Veillarda880b122003-04-21 21:36:41 +0000829 s = inbuf->use - reader->cur;
830 val = xmlParseChunk(reader->ctxt,
831 (const char *) &inbuf->content[reader->cur],
832 s, 0);
833 reader->cur += s;
William M. Brack9f797ab2004-07-28 07:40:12 +0000834 if ((val != 0) || (reader->ctxt->wellFormed == 0))
Daniel Veillarda880b122003-04-21 21:36:41 +0000835 return(-1);
836 break;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000837 }
838 }
Daniel Veillarda880b122003-04-21 21:36:41 +0000839
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000840 /*
841 * Discard the consumed input when needed and possible
842 */
Daniel Veillard67df8092002-12-16 22:04:11 +0000843 if (reader->mode == XML_TEXTREADER_MODE_INTERACTIVE) {
Daniel Veillard21924522004-02-19 16:37:07 +0000844 if (inbuf->alloc != XML_BUFFER_ALLOC_IMMUTABLE) {
845 if ((reader->cur >= 4096) &&
846 (inbuf->use - reader->cur <= CHUNK_SIZE)) {
847 val = xmlBufferShrink(inbuf, reader->cur);
848 if (val >= 0) {
849 reader->cur -= val;
850 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000851 }
852 }
853 }
854
855 /*
856 * At the end of the stream signal that the work is done to the Push
857 * parser.
858 */
Daniel Veillarda880b122003-04-21 21:36:41 +0000859 else if (reader->mode == XML_TEXTREADER_MODE_EOF) {
Daniel Veillardea7751d2002-12-20 00:16:24 +0000860 if (reader->mode != XML_TEXTREADER_DONE) {
Daniel Veillarda880b122003-04-21 21:36:41 +0000861 s = inbuf->use - reader->cur;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000862 val = xmlParseChunk(reader->ctxt,
Daniel Veillard067bae52003-01-05 01:27:54 +0000863 (const char *) &inbuf->content[reader->cur],
Daniel Veillarda880b122003-04-21 21:36:41 +0000864 s, 1);
865 reader->cur = inbuf->use;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000866 reader->mode = XML_TEXTREADER_DONE;
William M. Brack9f797ab2004-07-28 07:40:12 +0000867 if ((val != 0) || (reader->ctxt->wellFormed == 0))
Daniel Veillard16ed5972003-11-20 18:22:31 +0000868 return(-1);
Daniel Veillardea7751d2002-12-20 00:16:24 +0000869 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000870 }
Daniel Veillardea7751d2002-12-20 00:16:24 +0000871 reader->state = oldstate;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000872 return(0);
873}
874
Daniel Veillarda9cce9c2003-09-29 13:20:24 +0000875#ifdef LIBXML_REGEXP_ENABLED
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000876/**
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000877 * xmlTextReaderValidatePush:
878 * @reader: the xmlTextReaderPtr used
879 *
880 * Push the current node for validation
881 */
882static void
Daniel Veillarda9cce9c2003-09-29 13:20:24 +0000883xmlTextReaderValidatePush(xmlTextReaderPtr reader ATTRIBUTE_UNUSED) {
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000884 xmlNodePtr node = reader->node;
885
Daniel Veillardf54cd532004-02-25 11:52:31 +0000886#ifdef LIBXML_VALID_ENABLED
Daniel Veillardf4e55762003-04-15 23:32:22 +0000887 if ((reader->validate == XML_TEXTREADER_VALIDATE_DTD) &&
888 (reader->ctxt != NULL) && (reader->ctxt->validate == 1)) {
889 if ((node->ns == NULL) || (node->ns->prefix == NULL)) {
890 reader->ctxt->valid &= xmlValidatePushElement(&reader->ctxt->vctxt,
891 reader->ctxt->myDoc, node, node->name);
892 } else {
893 /* TODO use the BuildQName interface */
894 xmlChar *qname;
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000895
Daniel Veillardf4e55762003-04-15 23:32:22 +0000896 qname = xmlStrdup(node->ns->prefix);
897 qname = xmlStrcat(qname, BAD_CAST ":");
898 qname = xmlStrcat(qname, node->name);
899 reader->ctxt->valid &= xmlValidatePushElement(&reader->ctxt->vctxt,
900 reader->ctxt->myDoc, node, qname);
901 if (qname != NULL)
902 xmlFree(qname);
903 }
Daniel Veillardf54cd532004-02-25 11:52:31 +0000904 }
905#endif /* LIBXML_VALID_ENABLED */
Daniel Veillardf4e55762003-04-15 23:32:22 +0000906#ifdef LIBXML_SCHEMAS_ENABLED
Daniel Veillardf54cd532004-02-25 11:52:31 +0000907 if ((reader->validate == XML_TEXTREADER_VALIDATE_RNG) &&
Daniel Veillardf4e55762003-04-15 23:32:22 +0000908 (reader->rngValidCtxt != NULL)) {
909 int ret;
910
911 if (reader->rngFullNode != NULL) return;
912 ret = xmlRelaxNGValidatePushElement(reader->rngValidCtxt,
913 reader->ctxt->myDoc,
914 node);
915 if (ret == 0) {
916 /*
917 * this element requires a full tree
918 */
919 node = xmlTextReaderExpand(reader);
920 if (node == NULL) {
921printf("Expand failed !\n");
922 ret = -1;
923 } else {
924 ret = xmlRelaxNGValidateFullElement(reader->rngValidCtxt,
925 reader->ctxt->myDoc,
926 node);
927 reader->rngFullNode = node;
928 }
929 }
930 if (ret != 1)
931 reader->rngValidErrors++;
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000932 }
Daniel Veillardf54cd532004-02-25 11:52:31 +0000933#endif
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000934}
Daniel Veillardf4e55762003-04-15 23:32:22 +0000935
936/**
937 * xmlTextReaderValidateCData:
938 * @reader: the xmlTextReaderPtr used
939 * @data: pointer to the CData
940 * @len: lenght of the CData block in bytes.
941 *
942 * Push some CData for validation
943 */
944static void
945xmlTextReaderValidateCData(xmlTextReaderPtr reader,
946 const xmlChar *data, int len) {
Daniel Veillardf54cd532004-02-25 11:52:31 +0000947#ifdef LIBXML_VALID_ENABLED
Daniel Veillardf4e55762003-04-15 23:32:22 +0000948 if ((reader->validate == XML_TEXTREADER_VALIDATE_DTD) &&
949 (reader->ctxt != NULL) && (reader->ctxt->validate == 1)) {
950 reader->ctxt->valid &= xmlValidatePushCData(&reader->ctxt->vctxt,
951 data, len);
Daniel Veillardf54cd532004-02-25 11:52:31 +0000952 }
953#endif /* LIBXML_VALID_ENABLED */
Daniel Veillardf4e55762003-04-15 23:32:22 +0000954#ifdef LIBXML_SCHEMAS_ENABLED
Daniel Veillardf54cd532004-02-25 11:52:31 +0000955 if ((reader->validate == XML_TEXTREADER_VALIDATE_RNG) &&
Daniel Veillardf4e55762003-04-15 23:32:22 +0000956 (reader->rngValidCtxt != NULL)) {
957 int ret;
958
959 if (reader->rngFullNode != NULL) return;
960 ret = xmlRelaxNGValidatePushCData(reader->rngValidCtxt, data, len);
961 if (ret != 1)
962 reader->rngValidErrors++;
Daniel Veillardf4e55762003-04-15 23:32:22 +0000963 }
Daniel Veillardf54cd532004-02-25 11:52:31 +0000964#endif
Daniel Veillardf4e55762003-04-15 23:32:22 +0000965}
966
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000967/**
968 * xmlTextReaderValidatePop:
969 * @reader: the xmlTextReaderPtr used
970 *
971 * Pop the current node from validation
972 */
973static void
974xmlTextReaderValidatePop(xmlTextReaderPtr reader) {
975 xmlNodePtr node = reader->node;
976
Daniel Veillardf54cd532004-02-25 11:52:31 +0000977#ifdef LIBXML_VALID_ENABLED
Daniel Veillardf4e55762003-04-15 23:32:22 +0000978 if ((reader->validate == XML_TEXTREADER_VALIDATE_DTD) &&
979 (reader->ctxt != NULL) && (reader->ctxt->validate == 1)) {
980 if ((node->ns == NULL) || (node->ns->prefix == NULL)) {
981 reader->ctxt->valid &= xmlValidatePopElement(&reader->ctxt->vctxt,
982 reader->ctxt->myDoc, node, node->name);
983 } else {
984 /* TODO use the BuildQName interface */
985 xmlChar *qname;
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000986
Daniel Veillardf4e55762003-04-15 23:32:22 +0000987 qname = xmlStrdup(node->ns->prefix);
988 qname = xmlStrcat(qname, BAD_CAST ":");
989 qname = xmlStrcat(qname, node->name);
990 reader->ctxt->valid &= xmlValidatePopElement(&reader->ctxt->vctxt,
991 reader->ctxt->myDoc, node, qname);
992 if (qname != NULL)
993 xmlFree(qname);
994 }
Daniel Veillardf54cd532004-02-25 11:52:31 +0000995 }
996#endif /* LIBXML_VALID_ENABLED */
Daniel Veillardf4e55762003-04-15 23:32:22 +0000997#ifdef LIBXML_SCHEMAS_ENABLED
Daniel Veillardf54cd532004-02-25 11:52:31 +0000998 if ((reader->validate == XML_TEXTREADER_VALIDATE_RNG) &&
Daniel Veillardf4e55762003-04-15 23:32:22 +0000999 (reader->rngValidCtxt != NULL)) {
1000 int ret;
1001
1002 if (reader->rngFullNode != NULL) {
1003 if (node == reader->rngFullNode)
1004 reader->rngFullNode = NULL;
1005 return;
1006 }
1007 ret = xmlRelaxNGValidatePopElement(reader->rngValidCtxt,
1008 reader->ctxt->myDoc,
1009 node);
1010 if (ret != 1)
1011 reader->rngValidErrors++;
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001012 }
Daniel Veillardf54cd532004-02-25 11:52:31 +00001013#endif
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001014}
Daniel Veillarda9cce9c2003-09-29 13:20:24 +00001015
Daniel Veillarda80ff6e2003-01-03 12:52:08 +00001016/**
1017 * xmlTextReaderValidateEntity:
1018 * @reader: the xmlTextReaderPtr used
1019 *
1020 * Handle the validation when an entity reference is encountered and
1021 * entity substitution is not activated. As a result the parser interface
1022 * must walk through the entity and do the validation calls
1023 */
1024static void
1025xmlTextReaderValidateEntity(xmlTextReaderPtr reader) {
1026 xmlNodePtr oldnode = reader->node;
1027 xmlNodePtr node = reader->node;
1028 xmlParserCtxtPtr ctxt = reader->ctxt;
1029
1030 do {
1031 if (node->type == XML_ENTITY_REF_NODE) {
1032 /*
1033 * Case where the underlying tree is not availble, lookup the entity
1034 * and walk it.
1035 */
1036 if ((node->children == NULL) && (ctxt->sax != NULL) &&
1037 (ctxt->sax->getEntity != NULL)) {
1038 node->children = (xmlNodePtr)
1039 ctxt->sax->getEntity(ctxt, node->name);
1040 }
1041
1042 if ((node->children != NULL) &&
1043 (node->children->type == XML_ENTITY_DECL) &&
1044 (node->children->children != NULL)) {
1045 xmlTextReaderEntPush(reader, node);
1046 node = node->children->children;
1047 continue;
1048 } else {
1049 /*
1050 * The error has probably be raised already.
1051 */
1052 if (node == oldnode)
1053 break;
1054 node = node->next;
1055 }
Daniel Veillarda9cce9c2003-09-29 13:20:24 +00001056#ifdef LIBXML_REGEXP_ENABLED
Daniel Veillarda80ff6e2003-01-03 12:52:08 +00001057 } else if (node->type == XML_ELEMENT_NODE) {
1058 reader->node = node;
1059 xmlTextReaderValidatePush(reader);
1060 } else if ((node->type == XML_TEXT_NODE) ||
1061 (node->type == XML_CDATA_SECTION_NODE)) {
Daniel Veillardf4e55762003-04-15 23:32:22 +00001062 xmlTextReaderValidateCData(reader, node->content,
1063 xmlStrlen(node->content));
Daniel Veillarda9cce9c2003-09-29 13:20:24 +00001064#endif
Daniel Veillarda80ff6e2003-01-03 12:52:08 +00001065 }
1066
1067 /*
1068 * go to next node
1069 */
1070 if (node->children != NULL) {
1071 node = node->children;
1072 continue;
Daniel Veillardef8dd7b2003-03-23 12:02:56 +00001073 } else if (node->type == XML_ELEMENT_NODE) {
1074 xmlTextReaderValidatePop(reader);
Daniel Veillarda80ff6e2003-01-03 12:52:08 +00001075 }
1076 if (node->next != NULL) {
1077 node = node->next;
1078 continue;
1079 }
1080 do {
1081 node = node->parent;
1082 if (node->type == XML_ELEMENT_NODE) {
Daniel Veillard9ee35f32003-09-28 00:19:54 +00001083 xmlNodePtr tmp;
Daniel Veillard1d211e22003-10-20 22:32:39 +00001084 if (reader->entNr == 0) {
1085 while ((tmp = node->last) != NULL) {
Daniel Veillarde8039df2003-10-27 11:25:13 +00001086 if ((tmp->extra & NODE_IS_PRESERVED) == 0) {
Daniel Veillard1d211e22003-10-20 22:32:39 +00001087 xmlUnlinkNode(tmp);
1088 xmlTextReaderFreeNode(reader, tmp);
1089 } else
1090 break;
1091 }
Daniel Veillard9ee35f32003-09-28 00:19:54 +00001092 }
Daniel Veillarda80ff6e2003-01-03 12:52:08 +00001093 reader->node = node;
1094 xmlTextReaderValidatePop(reader);
1095 }
1096 if ((node->type == XML_ENTITY_DECL) &&
1097 (reader->ent != NULL) && (reader->ent->children == node)) {
1098 node = xmlTextReaderEntPop(reader);
1099 }
1100 if (node == oldnode)
1101 break;
1102 if (node->next != NULL) {
1103 node = node->next;
1104 break;
1105 }
1106 } while ((node != NULL) && (node != oldnode));
1107 } while ((node != NULL) && (node != oldnode));
1108 reader->node = oldnode;
1109}
Daniel Veillarda9cce9c2003-09-29 13:20:24 +00001110#endif /* LIBXML_REGEXP_ENABLED */
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001111
1112
1113/**
Daniel Veillardc6cae7b2003-04-11 09:02:11 +00001114 * xmlTextReaderGetSuccessor:
1115 * @cur: the current node
1116 *
1117 * Get the successor of a node if available.
1118 *
1119 * Returns the successor node or NULL
1120 */
1121static xmlNodePtr
1122xmlTextReaderGetSuccessor(xmlNodePtr cur) {
1123 if (cur == NULL) return(NULL) ; /* ERROR */
1124 if (cur->next != NULL) return(cur->next) ;
1125 do {
1126 cur = cur->parent;
1127 if (cur == NULL) return(NULL);
1128 if (cur->next != NULL) return(cur->next);
1129 } while (cur != NULL);
1130 return(cur);
1131}
1132
1133/**
1134 * xmlTextReaderDoExpand:
1135 * @reader: the xmlTextReaderPtr used
1136 *
1137 * Makes sure that the current node is fully read as well as all its
1138 * descendant. It means the full DOM subtree must be available at the
1139 * end of the call.
1140 *
1141 * Returns 1 if the node was expanded successfully, 0 if there is no more
1142 * nodes to read, or -1 in case of error
1143 */
1144static int
1145xmlTextReaderDoExpand(xmlTextReaderPtr reader) {
1146 int val;
1147
1148 if ((reader == NULL) || (reader->node == NULL) || (reader->ctxt == NULL))
1149 return(-1);
Daniel Veillardc6cae7b2003-04-11 09:02:11 +00001150 do {
Daniel Veillardf96cf4e2003-10-01 09:05:25 +00001151 if (reader->ctxt->instate == XML_PARSER_EOF) return(1);
1152
Daniel Veillardc6cae7b2003-04-11 09:02:11 +00001153 if (xmlTextReaderGetSuccessor(reader->node) != NULL)
1154 return(1);
Daniel Veillardf96cf4e2003-10-01 09:05:25 +00001155 if (reader->ctxt->nodeNr < reader->depth)
Daniel Veillarda37aab82003-06-09 09:10:36 +00001156 return(1);
Daniel Veillardc6cae7b2003-04-11 09:02:11 +00001157 if (reader->mode == XML_TEXTREADER_MODE_EOF)
1158 return(1);
1159 val = xmlTextReaderPushData(reader);
1160 if (val < 0)
1161 return(-1);
1162 } while(reader->mode != XML_TEXTREADER_MODE_EOF);
1163 return(1);
1164}
1165
1166/**
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001167 * xmlTextReaderRead:
1168 * @reader: the xmlTextReaderPtr used
1169 *
1170 * Moves the position of the current instance to the next node in
1171 * the stream, exposing its properties.
1172 *
1173 * Returns 1 if the node was read successfully, 0 if there is no more
1174 * nodes to read, or -1 in case of error
1175 */
1176int
1177xmlTextReaderRead(xmlTextReaderPtr reader) {
Daniel Veillard067bae52003-01-05 01:27:54 +00001178 int val, olddepth = 0;
William M. Brack899e64a2003-09-26 18:03:42 +00001179 xmlTextReaderState oldstate = XML_TEXTREADER_START;
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001180 xmlNodePtr oldnode = NULL;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001181
William M. Brack1af55582004-07-22 17:18:00 +00001182
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001183 if (reader == NULL)
1184 return(-1);
William M. Brack1af55582004-07-22 17:18:00 +00001185 reader->curnode = NULL;
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001186 if (reader->doc != NULL)
1187 return(xmlTextReaderReadTree(reader));
1188 if (reader->ctxt == NULL)
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001189 return(-1);
1190 if (reader->ctxt->wellFormed != 1)
1191 return(-1);
1192
1193#ifdef DEBUG_READER
1194 fprintf(stderr, "\nREAD ");
1195 DUMP_READER
1196#endif
Daniel Veillard67df8092002-12-16 22:04:11 +00001197 if (reader->mode == XML_TEXTREADER_MODE_INITIAL) {
1198 reader->mode = XML_TEXTREADER_MODE_INTERACTIVE;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001199 /*
1200 * Initial state
1201 */
1202 do {
1203 val = xmlTextReaderPushData(reader);
1204 if (val < 0)
1205 return(-1);
1206 } while ((reader->ctxt->node == NULL) &&
Daniel Veillard067bae52003-01-05 01:27:54 +00001207 ((reader->mode != XML_TEXTREADER_MODE_EOF) &&
1208 (reader->mode != XML_TEXTREADER_DONE)));
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001209 if (reader->ctxt->node == NULL) {
Daniel Veillarddab8ea92003-01-02 14:16:45 +00001210 if (reader->ctxt->myDoc != NULL) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001211 reader->node = reader->ctxt->myDoc->children;
Daniel Veillarddab8ea92003-01-02 14:16:45 +00001212 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001213 if (reader->node == NULL)
1214 return(-1);
Daniel Veillarddab8ea92003-01-02 14:16:45 +00001215 reader->state = XML_TEXTREADER_ELEMENT;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001216 } else {
Daniel Veillard48ef4c92003-03-22 12:38:15 +00001217 if (reader->ctxt->myDoc != NULL) {
1218 reader->node = reader->ctxt->myDoc->children;
1219 }
1220 if (reader->node == NULL)
1221 reader->node = reader->ctxt->nodeTab[0];
Daniel Veillarde59494f2003-01-04 16:35:29 +00001222 reader->state = XML_TEXTREADER_ELEMENT;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001223 }
Daniel Veillard4d8db8a2002-12-30 18:40:42 +00001224 reader->depth = 0;
Daniel Veillard0df3bc32004-06-08 12:03:41 +00001225 reader->ctxt->parseMode = XML_PARSE_READER;
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001226 goto node_found;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001227 }
1228 oldstate = reader->state;
1229 olddepth = reader->ctxt->nodeNr;
1230 oldnode = reader->node;
Daniel Veillarddf512f42002-12-23 15:56:21 +00001231
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001232get_next_node:
Daniel Veillard6f379a72004-04-29 18:45:42 +00001233 if (reader->node == NULL) {
1234 if (reader->mode == XML_TEXTREADER_DONE)
1235 return(0);
1236 else
1237 return(-1);
1238 }
Daniel Veillarde2161a62004-04-29 17:14:25 +00001239
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001240 /*
1241 * If we are not backtracking on ancestors or examined nodes,
1242 * that the parser didn't finished or that we arent at the end
1243 * of stream, continue processing.
1244 */
Daniel Veillarde2161a62004-04-29 17:14:25 +00001245 while ((reader->node != NULL) && (reader->node->next == NULL) &&
Daniel Veillarda880b122003-04-21 21:36:41 +00001246 (reader->ctxt->nodeNr == olddepth) &&
1247 ((oldstate == XML_TEXTREADER_BACKTRACK) ||
Daniel Veillardea7751d2002-12-20 00:16:24 +00001248 (reader->node->children == NULL) ||
1249 (reader->node->type == XML_ENTITY_REF_NODE) ||
Daniel Veillard409a8142003-07-18 15:16:57 +00001250 ((reader->node->children != NULL) &&
1251 (reader->node->children->type == XML_TEXT_NODE) &&
1252 (reader->node->children->next == NULL)) ||
Daniel Veillard4dbe77a2003-01-14 00:17:42 +00001253 (reader->node->type == XML_DTD_NODE) ||
1254 (reader->node->type == XML_DOCUMENT_NODE) ||
1255 (reader->node->type == XML_HTML_DOCUMENT_NODE)) &&
Daniel Veillard4dbe77a2003-01-14 00:17:42 +00001256 ((reader->ctxt->node == NULL) ||
1257 (reader->ctxt->node == reader->node) ||
1258 (reader->ctxt->node == reader->node->parent)) &&
Daniel Veillardea7751d2002-12-20 00:16:24 +00001259 (reader->ctxt->instate != XML_PARSER_EOF)) {
1260 val = xmlTextReaderPushData(reader);
1261 if (val < 0)
1262 return(-1);
1263 if (reader->node == NULL)
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001264 goto node_end;
Daniel Veillardea7751d2002-12-20 00:16:24 +00001265 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001266 if (oldstate != XML_TEXTREADER_BACKTRACK) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001267 if ((reader->node->children != NULL) &&
1268 (reader->node->type != XML_ENTITY_REF_NODE) &&
Daniel Veillard7899c5c2003-11-03 12:31:38 +00001269 (reader->node->type != XML_XINCLUDE_START) &&
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001270 (reader->node->type != XML_DTD_NODE)) {
1271 reader->node = reader->node->children;
1272 reader->depth++;
Daniel Veillarddf512f42002-12-23 15:56:21 +00001273 reader->state = XML_TEXTREADER_ELEMENT;
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001274 goto node_found;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001275 }
1276 }
1277 if (reader->node->next != NULL) {
1278 if ((oldstate == XML_TEXTREADER_ELEMENT) &&
Daniel Veillarddf512f42002-12-23 15:56:21 +00001279 (reader->node->type == XML_ELEMENT_NODE) &&
Daniel Veillard067bae52003-01-05 01:27:54 +00001280 (reader->node->children == NULL) &&
Daniel Veillard96b6cd22004-01-08 16:49:50 +00001281 ((reader->node->extra & NODE_IS_EMPTY) == 0)
1282#ifdef LIBXML_XINCLUDE_ENABLED
1283 && (reader->in_xinclude <= 0)
1284#endif
1285 ) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001286 reader->state = XML_TEXTREADER_END;
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001287 goto node_found;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001288 }
Daniel Veillarda9cce9c2003-09-29 13:20:24 +00001289#ifdef LIBXML_REGEXP_ENABLED
Daniel Veillardf4e55762003-04-15 23:32:22 +00001290 if ((reader->validate) &&
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001291 (reader->node->type == XML_ELEMENT_NODE))
1292 xmlTextReaderValidatePop(reader);
Daniel Veillarda9cce9c2003-09-29 13:20:24 +00001293#endif /* LIBXML_REGEXP_ENABLED */
Daniel Veillard1e906612003-12-05 14:57:46 +00001294 if ((reader->preserves > 0) &&
1295 (reader->node->extra & NODE_IS_SPRESERVED))
1296 reader->preserves--;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001297 reader->node = reader->node->next;
1298 reader->state = XML_TEXTREADER_ELEMENT;
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001299
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001300 /*
1301 * Cleanup of the old node
1302 */
Daniel Veillard1e906612003-12-05 14:57:46 +00001303 if ((reader->preserves == 0) &&
Daniel Veillard96b6cd22004-01-08 16:49:50 +00001304#ifdef LIBXML_XINCLUDE_ENABLED
Daniel Veillard1e906612003-12-05 14:57:46 +00001305 (reader->in_xinclude == 0) &&
Daniel Veillard96b6cd22004-01-08 16:49:50 +00001306#endif
Daniel Veillard1e906612003-12-05 14:57:46 +00001307 (reader->entNr == 0) &&
1308 (reader->node->prev != NULL) &&
Daniel Veillard1d211e22003-10-20 22:32:39 +00001309 (reader->node->prev->type != XML_DTD_NODE) &&
1310 (reader->entNr == 0)) {
Daniel Veillard4dbe77a2003-01-14 00:17:42 +00001311 xmlNodePtr tmp = reader->node->prev;
Daniel Veillarde8039df2003-10-27 11:25:13 +00001312 if ((tmp->extra & NODE_IS_PRESERVED) == 0) {
Daniel Veillard9ee35f32003-09-28 00:19:54 +00001313 xmlUnlinkNode(tmp);
1314 xmlTextReaderFreeNode(reader, tmp);
1315 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001316 }
1317
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001318 goto node_found;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001319 }
Daniel Veillardea7751d2002-12-20 00:16:24 +00001320 if ((oldstate == XML_TEXTREADER_ELEMENT) &&
Daniel Veillard571b8892002-12-30 12:37:59 +00001321 (reader->node->type == XML_ELEMENT_NODE) &&
Daniel Veillard067bae52003-01-05 01:27:54 +00001322 (reader->node->children == NULL) &&
Daniel Veillarde8039df2003-10-27 11:25:13 +00001323 ((reader->node->extra & NODE_IS_EMPTY) == 0)) {;
Daniel Veillardea7751d2002-12-20 00:16:24 +00001324 reader->state = XML_TEXTREADER_END;
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001325 goto node_found;
Daniel Veillardea7751d2002-12-20 00:16:24 +00001326 }
Daniel Veillarda9cce9c2003-09-29 13:20:24 +00001327#ifdef LIBXML_REGEXP_ENABLED
Daniel Veillardf4e55762003-04-15 23:32:22 +00001328 if ((reader->validate) && (reader->node->type == XML_ELEMENT_NODE))
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001329 xmlTextReaderValidatePop(reader);
Daniel Veillarda9cce9c2003-09-29 13:20:24 +00001330#endif /* LIBXML_REGEXP_ENABLED */
Daniel Veillard1e906612003-12-05 14:57:46 +00001331 if ((reader->preserves > 0) &&
1332 (reader->node->extra & NODE_IS_SPRESERVED))
1333 reader->preserves--;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001334 reader->node = reader->node->parent;
1335 if ((reader->node == NULL) ||
1336 (reader->node->type == XML_DOCUMENT_NODE) ||
1337#ifdef LIBXML_DOCB_ENABLED
1338 (reader->node->type == XML_DOCB_DOCUMENT_NODE) ||
1339#endif
1340 (reader->node->type == XML_HTML_DOCUMENT_NODE)) {
Daniel Veillardea7751d2002-12-20 00:16:24 +00001341 if (reader->mode != XML_TEXTREADER_DONE) {
1342 val = xmlParseChunk(reader->ctxt, "", 0, 1);
1343 reader->mode = XML_TEXTREADER_DONE;
William M. Brack9f797ab2004-07-28 07:40:12 +00001344 if (val != 0)
1345 return(-1);
Daniel Veillardea7751d2002-12-20 00:16:24 +00001346 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001347 reader->node = NULL;
Daniel Veillard4d8db8a2002-12-30 18:40:42 +00001348 reader->depth = -1;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001349
1350 /*
1351 * Cleanup of the old node
1352 */
Daniel Veillard1e906612003-12-05 14:57:46 +00001353 if ((reader->preserves == 0) &&
Daniel Veillard96b6cd22004-01-08 16:49:50 +00001354#ifdef LIBXML_XINCLUDE_ENABLED
Daniel Veillard1e906612003-12-05 14:57:46 +00001355 (reader->in_xinclude == 0) &&
Daniel Veillard96b6cd22004-01-08 16:49:50 +00001356#endif
Daniel Veillard1e906612003-12-05 14:57:46 +00001357 (reader->entNr == 0) &&
1358 (oldnode->type != XML_DTD_NODE) &&
Daniel Veillarde8039df2003-10-27 11:25:13 +00001359 ((oldnode->extra & NODE_IS_PRESERVED) == 0) &&
Daniel Veillard1d211e22003-10-20 22:32:39 +00001360 (reader->entNr == 0)) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001361 xmlUnlinkNode(oldnode);
Daniel Veillard9ee35f32003-09-28 00:19:54 +00001362 xmlTextReaderFreeNode(reader, oldnode);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001363 }
1364
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001365 goto node_end;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001366 }
Daniel Veillard1e906612003-12-05 14:57:46 +00001367 if ((reader->preserves == 0) &&
Daniel Veillard96b6cd22004-01-08 16:49:50 +00001368#ifdef LIBXML_XINCLUDE_ENABLED
Daniel Veillard1e906612003-12-05 14:57:46 +00001369 (reader->in_xinclude == 0) &&
Daniel Veillard96b6cd22004-01-08 16:49:50 +00001370#endif
Daniel Veillard1e906612003-12-05 14:57:46 +00001371 (reader->entNr == 0) &&
1372 (reader->node->last != NULL) &&
1373 ((reader->node->last->extra & NODE_IS_PRESERVED) == 0)) {
1374 xmlNodePtr tmp = reader->node->last;
1375 xmlUnlinkNode(tmp);
1376 xmlTextReaderFreeNode(reader, tmp);
1377 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001378 reader->depth--;
1379 reader->state = XML_TEXTREADER_BACKTRACK;
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001380
1381node_found:
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001382 DUMP_READER
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001383
1384 /*
Daniel Veillarda880b122003-04-21 21:36:41 +00001385 * If we are in the middle of a piece of CDATA make sure it's finished
1386 */
1387 if ((reader->node != NULL) &&
Daniel Veillardccc4d2b2003-09-17 21:27:31 +00001388 (reader->node->next == NULL) &&
Daniel Veillarda880b122003-04-21 21:36:41 +00001389 ((reader->node->type == XML_TEXT_NODE) ||
1390 (reader->node->type == XML_CDATA_SECTION_NODE))) {
William M. Brack42331a92004-07-29 07:07:16 +00001391 if (xmlTextReaderExpand(reader) == NULL)
1392 return -1;
Daniel Veillarda880b122003-04-21 21:36:41 +00001393 }
1394
Daniel Veillard7899c5c2003-11-03 12:31:38 +00001395#ifdef LIBXML_XINCLUDE_ENABLED
1396 /*
1397 * Handle XInclude if asked for
1398 */
1399 if ((reader->xinclude) && (reader->node != NULL) &&
1400 (reader->node->type == XML_ELEMENT_NODE) &&
1401 (reader->node->ns != NULL) &&
Daniel Veillardb5fa0202003-12-08 17:41:29 +00001402 ((xmlStrEqual(reader->node->ns->href, XINCLUDE_NS)) ||
1403 (xmlStrEqual(reader->node->ns->href, XINCLUDE_OLD_NS)))) {
Daniel Veillard7899c5c2003-11-03 12:31:38 +00001404 if (reader->xincctxt == NULL) {
1405 reader->xincctxt = xmlXIncludeNewContext(reader->ctxt->myDoc);
Daniel Veillardc14c3892004-08-16 12:34:50 +00001406 xmlXIncludeSetFlags(reader->xincctxt,
1407 reader->parserFlags & (~XML_PARSE_NOXINCNODE));
Daniel Veillard7899c5c2003-11-03 12:31:38 +00001408 }
1409 /*
1410 * expand that node and process it
1411 */
William M. Brack42331a92004-07-29 07:07:16 +00001412 if (xmlTextReaderExpand(reader) == NULL)
1413 return -1;
Daniel Veillard7899c5c2003-11-03 12:31:38 +00001414 xmlXIncludeProcessNode(reader->xincctxt, reader->node);
1415 }
1416 if (reader->node->type == XML_XINCLUDE_START) {
1417 reader->in_xinclude++;
1418 goto get_next_node;
1419 }
1420 if (reader->node->type == XML_XINCLUDE_END) {
1421 reader->in_xinclude--;
1422 goto get_next_node;
1423 }
1424#endif
Daniel Veillarda880b122003-04-21 21:36:41 +00001425 /*
Daniel Veillarda80ff6e2003-01-03 12:52:08 +00001426 * Handle entities enter and exit when in entity replacement mode
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001427 */
1428 if ((reader->node != NULL) &&
1429 (reader->node->type == XML_ENTITY_REF_NODE) &&
1430 (reader->ctxt != NULL) && (reader->ctxt->replaceEntities == 1)) {
1431 /*
1432 * Case where the underlying tree is not availble, lookup the entity
1433 * and walk it.
1434 */
1435 if ((reader->node->children == NULL) && (reader->ctxt->sax != NULL) &&
1436 (reader->ctxt->sax->getEntity != NULL)) {
1437 reader->node->children = (xmlNodePtr)
1438 reader->ctxt->sax->getEntity(reader->ctxt, reader->node->name);
1439 }
1440
1441 if ((reader->node->children != NULL) &&
1442 (reader->node->children->type == XML_ENTITY_DECL) &&
1443 (reader->node->children->children != NULL)) {
1444 xmlTextReaderEntPush(reader, reader->node);
1445 reader->node = reader->node->children->children;
1446 }
Daniel Veillarda9cce9c2003-09-29 13:20:24 +00001447#ifdef LIBXML_REGEXP_ENABLED
Daniel Veillarda80ff6e2003-01-03 12:52:08 +00001448 } else if ((reader->node != NULL) &&
1449 (reader->node->type == XML_ENTITY_REF_NODE) &&
Daniel Veillardf4e55762003-04-15 23:32:22 +00001450 (reader->ctxt != NULL) && (reader->validate)) {
Daniel Veillarda80ff6e2003-01-03 12:52:08 +00001451 xmlTextReaderValidateEntity(reader);
Daniel Veillarda9cce9c2003-09-29 13:20:24 +00001452#endif /* LIBXML_REGEXP_ENABLED */
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001453 }
1454 if ((reader->node != NULL) &&
1455 (reader->node->type == XML_ENTITY_DECL) &&
1456 (reader->ent != NULL) && (reader->ent->children == reader->node)) {
1457 reader->node = xmlTextReaderEntPop(reader);
1458 reader->depth++;
1459 goto get_next_node;
1460 }
Daniel Veillard0e298ad2003-02-04 16:14:33 +00001461#ifdef LIBXML_REGEXP_ENABLED
Daniel Veillardf4e55762003-04-15 23:32:22 +00001462 if ((reader->validate) && (reader->node != NULL)) {
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001463 xmlNodePtr node = reader->node;
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001464
1465 if ((node->type == XML_ELEMENT_NODE) &&
1466 ((reader->state != XML_TEXTREADER_END) &&
1467 (reader->state != XML_TEXTREADER_BACKTRACK))) {
1468 xmlTextReaderValidatePush(reader);
1469 } else if ((node->type == XML_TEXT_NODE) ||
1470 (node->type == XML_CDATA_SECTION_NODE)) {
Daniel Veillardf4e55762003-04-15 23:32:22 +00001471 xmlTextReaderValidateCData(reader, node->content,
1472 xmlStrlen(node->content));
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001473 }
1474 }
Daniel Veillard0e298ad2003-02-04 16:14:33 +00001475#endif /* LIBXML_REGEXP_ENABLED */
Daniel Veillard1e906612003-12-05 14:57:46 +00001476#ifdef LIBXML_PATTERN_ENABLED
1477 if ((reader->patternNr > 0) && (reader->state != XML_TEXTREADER_END) &&
1478 (reader->state != XML_TEXTREADER_BACKTRACK)) {
1479 int i;
1480 for (i = 0;i < reader->patternNr;i++) {
1481 if (xmlPatternMatch(reader->patternTab[i], reader->node) == 1) {
1482 xmlTextReaderPreserve(reader);
1483 break;
1484 }
1485 }
1486 }
1487#endif /* LIBXML_PATTERN_ENABLED */
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001488 return(1);
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001489node_end:
Daniel Veillardc6cae7b2003-04-11 09:02:11 +00001490 reader->mode = XML_TEXTREADER_DONE;
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001491 return(0);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001492}
1493
Daniel Veillard67df8092002-12-16 22:04:11 +00001494/**
1495 * xmlTextReaderReadState:
1496 * @reader: the xmlTextReaderPtr used
1497 *
1498 * Gets the read state of the reader.
1499 *
1500 * Returns the state value, or -1 in case of error
1501 */
1502int
1503xmlTextReaderReadState(xmlTextReaderPtr reader) {
1504 if (reader == NULL)
1505 return(-1);
1506 return(reader->mode);
1507}
1508
1509/**
Daniel Veillardc6cae7b2003-04-11 09:02:11 +00001510 * xmlTextReaderExpand:
1511 * @reader: the xmlTextReaderPtr used
1512 *
1513 * Reads the contents of the current node and the full subtree. It then makes
Daniel Veillard61c52202003-04-30 12:20:34 +00001514 * the subtree available until the next xmlTextReaderRead() call
Daniel Veillardc6cae7b2003-04-11 09:02:11 +00001515 *
1516 * Returns a node pointer valid until the next xmlTextReaderRead() call
1517 * or NULL in case of error.
1518 */
1519xmlNodePtr
1520xmlTextReaderExpand(xmlTextReaderPtr reader) {
Daniel Veillardf40c1ce2003-12-19 17:26:28 +00001521 if ((reader == NULL) || (reader->node == NULL))
Daniel Veillardc6cae7b2003-04-11 09:02:11 +00001522 return(NULL);
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001523 if (reader->doc != NULL)
1524 return(reader->node);
Daniel Veillardf40c1ce2003-12-19 17:26:28 +00001525 if (reader->ctxt == NULL)
1526 return(NULL);
Daniel Veillardc6cae7b2003-04-11 09:02:11 +00001527 if (xmlTextReaderDoExpand(reader) < 0)
1528 return(NULL);
1529 return(reader->node);
1530}
1531
1532/**
1533 * xmlTextReaderNext:
1534 * @reader: the xmlTextReaderPtr used
1535 *
1536 * Skip to the node following the current one in document order while
1537 * avoiding the subtree if any.
1538 *
1539 * Returns 1 if the node was read successfully, 0 if there is no more
1540 * nodes to read, or -1 in case of error
1541 */
1542int
1543xmlTextReaderNext(xmlTextReaderPtr reader) {
1544 int ret;
1545 xmlNodePtr cur;
1546
1547 if (reader == NULL)
1548 return(-1);
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001549 if (reader->doc != NULL)
1550 return(xmlTextReaderNextTree(reader));
Daniel Veillardc6cae7b2003-04-11 09:02:11 +00001551 cur = reader->node;
1552 if ((cur == NULL) || (cur->type != XML_ELEMENT_NODE))
1553 return(xmlTextReaderRead(reader));
1554 if (reader->state == XML_TEXTREADER_END)
1555 return(xmlTextReaderRead(reader));
Daniel Veillarde8039df2003-10-27 11:25:13 +00001556 if (cur->extra & NODE_IS_EMPTY)
Daniel Veillard9ee35f32003-09-28 00:19:54 +00001557 return(xmlTextReaderRead(reader));
Daniel Veillardc6cae7b2003-04-11 09:02:11 +00001558 do {
1559 ret = xmlTextReaderRead(reader);
1560 if (ret != 1)
1561 return(ret);
1562 } while (reader->node != cur);
1563 return(xmlTextReaderRead(reader));
1564}
1565
1566/**
Daniel Veillard67df8092002-12-16 22:04:11 +00001567 * xmlTextReaderReadInnerXml:
1568 * @reader: the xmlTextReaderPtr used
1569 *
1570 * Reads the contents of the current node, including child nodes and markup.
1571 *
1572 * Returns a string containing the XML content, or NULL if the current node
1573 * is neither an element nor attribute, or has no child nodes. The
1574 * string must be deallocated by the caller.
1575 */
1576xmlChar *
Daniel Veillard33300b42003-04-17 09:09:19 +00001577xmlTextReaderReadInnerXml(xmlTextReaderPtr reader ATTRIBUTE_UNUSED) {
Daniel Veillard67df8092002-12-16 22:04:11 +00001578 TODO
1579 return(NULL);
1580}
1581
1582/**
1583 * xmlTextReaderReadOuterXml:
1584 * @reader: the xmlTextReaderPtr used
1585 *
1586 * Reads the contents of the current node, including child nodes and markup.
1587 *
1588 * Returns a string containing the XML content, or NULL if the current node
1589 * is neither an element nor attribute, or has no child nodes. The
1590 * string must be deallocated by the caller.
1591 */
1592xmlChar *
Daniel Veillard33300b42003-04-17 09:09:19 +00001593xmlTextReaderReadOuterXml(xmlTextReaderPtr reader ATTRIBUTE_UNUSED) {
Daniel Veillard67df8092002-12-16 22:04:11 +00001594 TODO
1595 return(NULL);
1596}
1597
1598/**
1599 * xmlTextReaderReadString:
1600 * @reader: the xmlTextReaderPtr used
1601 *
1602 * Reads the contents of an element or a text node as a string.
1603 *
1604 * Returns a string containing the contents of the Element or Text node,
1605 * or NULL if the reader is positioned on any other type of node.
1606 * The string must be deallocated by the caller.
1607 */
1608xmlChar *
Daniel Veillard33300b42003-04-17 09:09:19 +00001609xmlTextReaderReadString(xmlTextReaderPtr reader ATTRIBUTE_UNUSED) {
Daniel Veillard67df8092002-12-16 22:04:11 +00001610 TODO
1611 return(NULL);
1612}
1613
Daniel Veillard9f7eb0b2003-09-17 10:26:25 +00001614#if 0
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00001615/**
1616 * xmlTextReaderReadBase64:
1617 * @reader: the xmlTextReaderPtr used
1618 * @array: a byte array to store the content.
1619 * @offset: the zero-based index into array where the method should
1620 * begin to write.
1621 * @len: the number of bytes to write.
1622 *
1623 * Reads and decodes the Base64 encoded contents of an element and
1624 * stores the result in a byte buffer.
1625 *
1626 * Returns the number of bytes written to array, or zero if the current
1627 * instance is not positioned on an element or -1 in case of error.
1628 */
1629int
Daniel Veillard9f7eb0b2003-09-17 10:26:25 +00001630xmlTextReaderReadBase64(xmlTextReaderPtr reader,
1631 unsigned char *array ATTRIBUTE_UNUSED,
1632 int offset ATTRIBUTE_UNUSED,
1633 int len ATTRIBUTE_UNUSED) {
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00001634 if ((reader == NULL) || (reader->ctxt == NULL))
1635 return(-1);
1636 if (reader->ctxt->wellFormed != 1)
1637 return(-1);
1638
1639 if ((reader->node == NULL) || (reader->node->type == XML_ELEMENT_NODE))
1640 return(0);
1641 TODO
1642 return(0);
1643}
1644
1645/**
1646 * xmlTextReaderReadBinHex:
1647 * @reader: the xmlTextReaderPtr used
1648 * @array: a byte array to store the content.
1649 * @offset: the zero-based index into array where the method should
1650 * begin to write.
1651 * @len: the number of bytes to write.
1652 *
1653 * Reads and decodes the BinHex encoded contents of an element and
1654 * stores the result in a byte buffer.
1655 *
1656 * Returns the number of bytes written to array, or zero if the current
1657 * instance is not positioned on an element or -1 in case of error.
1658 */
1659int
Daniel Veillard9f7eb0b2003-09-17 10:26:25 +00001660xmlTextReaderReadBinHex(xmlTextReaderPtr reader,
1661 unsigned char *array ATTRIBUTE_UNUSED,
1662 int offset ATTRIBUTE_UNUSED,
1663 int len ATTRIBUTE_UNUSED) {
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00001664 if ((reader == NULL) || (reader->ctxt == NULL))
1665 return(-1);
1666 if (reader->ctxt->wellFormed != 1)
1667 return(-1);
1668
1669 if ((reader->node == NULL) || (reader->node->type == XML_ELEMENT_NODE))
1670 return(0);
1671 TODO
1672 return(0);
1673}
Daniel Veillard9f7eb0b2003-09-17 10:26:25 +00001674#endif
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00001675
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001676/************************************************************************
1677 * *
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001678 * Operating on a preparsed tree *
1679 * *
1680 ************************************************************************/
1681static int
1682xmlTextReaderNextTree(xmlTextReaderPtr reader)
1683{
Daniel Veillard7899c5c2003-11-03 12:31:38 +00001684 if (reader == NULL)
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001685 return(-1);
1686
1687 if (reader->state == XML_TEXTREADER_END)
1688 return(0);
1689
Daniel Veillard7899c5c2003-11-03 12:31:38 +00001690 if (reader->node == NULL) {
1691 if (reader->doc->children == NULL) {
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001692 reader->state = XML_TEXTREADER_END;
1693 return(0);
1694 }
1695
1696 reader->node = reader->doc->children;
1697 reader->state = XML_TEXTREADER_START;
1698 return(1);
1699 }
1700
1701 if (reader->state != XML_TEXTREADER_BACKTRACK) {
1702 if (reader->node->children != 0) {
1703 reader->node = reader->node->children;
1704 reader->depth++;
1705 reader->state = XML_TEXTREADER_START;
1706 return(1);
1707 }
1708
1709 if ((reader->node->type == XML_ELEMENT_NODE) ||
1710 (reader->node->type == XML_ATTRIBUTE_NODE)) {
1711 reader->state = XML_TEXTREADER_BACKTRACK;
1712 return(1);
1713 }
1714 }
1715
1716 if (reader->node->next != 0) {
1717 reader->node = reader->node->next;
1718 reader->state = XML_TEXTREADER_START;
1719 return(1);
1720 }
1721
1722 if (reader->node->parent != 0) {
1723 if (reader->node->parent->type == XML_DOCUMENT_NODE) {
1724 reader->state = XML_TEXTREADER_END;
1725 return(0);
1726 }
1727
1728 reader->node = reader->node->parent;
1729 reader->depth--;
1730 reader->state = XML_TEXTREADER_BACKTRACK;
1731 return(1);
1732 }
1733
1734 reader->state = XML_TEXTREADER_END;
1735
1736 return(1);
1737}
1738
1739/**
1740 * xmlTextReaderReadTree:
1741 * @reader: the xmlTextReaderPtr used
1742 *
1743 * Moves the position of the current instance to the next node in
1744 * the stream, exposing its properties.
1745 *
1746 * Returns 1 if the node was read successfully, 0 if there is no more
1747 * nodes to read, or -1 in case of error
1748 */
1749static int
1750xmlTextReaderReadTree(xmlTextReaderPtr reader) {
1751 if (reader->state == XML_TEXTREADER_END)
1752 return(0);
1753
Daniel Veillard7899c5c2003-11-03 12:31:38 +00001754next_node:
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001755 if (reader->node == NULL) {
1756 if (reader->doc->children == NULL) {
1757 reader->state = XML_TEXTREADER_END;
1758 return(0);
1759 }
1760
1761 reader->node = reader->doc->children;
1762 reader->state = XML_TEXTREADER_START;
Daniel Veillard7899c5c2003-11-03 12:31:38 +00001763 goto found_node;
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001764 }
1765
Daniel Veillard7899c5c2003-11-03 12:31:38 +00001766 if ((reader->state != XML_TEXTREADER_BACKTRACK) &&
1767 (reader->node->type != XML_DTD_NODE) &&
1768 (reader->node->type != XML_XINCLUDE_START) &&
1769 (reader->node->type != XML_ENTITY_REF_NODE)) {
1770 if (reader->node->children != NULL) {
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001771 reader->node = reader->node->children;
1772 reader->depth++;
1773 reader->state = XML_TEXTREADER_START;
Daniel Veillard7899c5c2003-11-03 12:31:38 +00001774 goto found_node;
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001775 }
1776
Daniel Veillard7899c5c2003-11-03 12:31:38 +00001777 if (reader->node->type == XML_ATTRIBUTE_NODE) {
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001778 reader->state = XML_TEXTREADER_BACKTRACK;
Daniel Veillard7899c5c2003-11-03 12:31:38 +00001779 goto found_node;
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001780 }
1781 }
1782
Daniel Veillard7899c5c2003-11-03 12:31:38 +00001783 if (reader->node->next != NULL) {
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001784 reader->node = reader->node->next;
1785 reader->state = XML_TEXTREADER_START;
Daniel Veillard7899c5c2003-11-03 12:31:38 +00001786 goto found_node;
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001787 }
1788
Daniel Veillard7899c5c2003-11-03 12:31:38 +00001789 if (reader->node->parent != NULL) {
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001790 if ((reader->node->parent->type == XML_DOCUMENT_NODE) ||
1791 (reader->node->parent->type == XML_HTML_DOCUMENT_NODE)) {
1792 reader->state = XML_TEXTREADER_END;
1793 return(0);
1794 }
1795
1796 reader->node = reader->node->parent;
1797 reader->depth--;
1798 reader->state = XML_TEXTREADER_BACKTRACK;
Daniel Veillard7899c5c2003-11-03 12:31:38 +00001799 goto found_node;
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001800 }
1801
1802 reader->state = XML_TEXTREADER_END;
1803
Daniel Veillard7899c5c2003-11-03 12:31:38 +00001804found_node:
1805 if ((reader->node->type == XML_XINCLUDE_START) ||
1806 (reader->node->type == XML_XINCLUDE_END))
1807 goto next_node;
1808
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001809 return(1);
1810}
1811
1812/**
William M. Brackb1d53162003-11-18 06:54:40 +00001813 * xmlTextReaderNextSibling:
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001814 * @reader: the xmlTextReaderPtr used
1815 *
1816 * Skip to the node following the current one in document order while
1817 * avoiding the subtree if any.
1818 * Currently implemented only for Readers built on a document
1819 *
1820 * Returns 1 if the node was read successfully, 0 if there is no more
1821 * nodes to read, or -1 in case of error
1822 */
1823int
1824xmlTextReaderNextSibling(xmlTextReaderPtr reader) {
1825 if (reader == NULL)
1826 return(-1);
1827 if (reader->doc == NULL) {
Daniel Veillarddd6d3002004-11-03 14:20:29 +00001828 /* TODO */
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001829 return(-1);
1830 }
1831
1832 if (reader->state == XML_TEXTREADER_END)
1833 return(0);
1834
Daniel Veillard7899c5c2003-11-03 12:31:38 +00001835 if (reader->node == NULL)
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001836 return(xmlTextReaderNextTree(reader));
1837
Daniel Veillard7899c5c2003-11-03 12:31:38 +00001838 if (reader->node->next != NULL) {
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001839 reader->node = reader->node->next;
1840 reader->state = XML_TEXTREADER_START;
1841 return(1);
1842 }
1843
1844 return(0);
1845}
1846
1847/************************************************************************
1848 * *
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001849 * Constructor and destructors *
1850 * *
1851 ************************************************************************/
1852/**
1853 * xmlNewTextReader:
1854 * @input: the xmlParserInputBufferPtr used to read data
Daniel Veillardea7751d2002-12-20 00:16:24 +00001855 * @URI: the URI information for the source if available
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001856 *
1857 * Create an xmlTextReader structure fed with @input
1858 *
1859 * Returns the new xmlTextReaderPtr or NULL in case of error
1860 */
1861xmlTextReaderPtr
Daniel Veillardea7751d2002-12-20 00:16:24 +00001862xmlNewTextReader(xmlParserInputBufferPtr input, const char *URI) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001863 xmlTextReaderPtr ret;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001864
1865 if (input == NULL)
1866 return(NULL);
1867 ret = xmlMalloc(sizeof(xmlTextReader));
1868 if (ret == NULL) {
1869 xmlGenericError(xmlGenericErrorContext,
1870 "xmlNewTextReader : malloc failed\n");
1871 return(NULL);
1872 }
1873 memset(ret, 0, sizeof(xmlTextReader));
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001874 ret->doc = NULL;
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001875 ret->entTab = NULL;
1876 ret->entMax = 0;
1877 ret->entNr = 0;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001878 ret->input = input;
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001879 ret->buffer = xmlBufferCreateSize(100);
William M. Bracka3215c72004-07-31 16:24:01 +00001880 if (ret->buffer == NULL) {
1881 xmlFree(ret);
1882 xmlGenericError(xmlGenericErrorContext,
1883 "xmlNewTextReader : malloc failed\n");
1884 return(NULL);
1885 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001886 ret->sax = (xmlSAXHandler *) xmlMalloc(sizeof(xmlSAXHandler));
1887 if (ret->sax == NULL) {
William M. Brack42331a92004-07-29 07:07:16 +00001888 xmlBufferFree(ret->buffer);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001889 xmlFree(ret);
1890 xmlGenericError(xmlGenericErrorContext,
1891 "xmlNewTextReader : malloc failed\n");
1892 return(NULL);
1893 }
Daniel Veillard81273902003-09-30 00:43:48 +00001894 xmlSAXVersion(ret->sax, 2);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001895 ret->startElement = ret->sax->startElement;
1896 ret->sax->startElement = xmlTextReaderStartElement;
1897 ret->endElement = ret->sax->endElement;
1898 ret->sax->endElement = xmlTextReaderEndElement;
Daniel Veillard81273902003-09-30 00:43:48 +00001899#ifdef LIBXML_SAX1_ENABLED
Daniel Veillard07cb8222003-09-10 10:51:05 +00001900 if (ret->sax->initialized == XML_SAX2_MAGIC) {
Daniel Veillard81273902003-09-30 00:43:48 +00001901#endif /* LIBXML_SAX1_ENABLED */
Daniel Veillard07cb8222003-09-10 10:51:05 +00001902 ret->startElementNs = ret->sax->startElementNs;
1903 ret->sax->startElementNs = xmlTextReaderStartElementNs;
1904 ret->endElementNs = ret->sax->endElementNs;
1905 ret->sax->endElementNs = xmlTextReaderEndElementNs;
Daniel Veillard81273902003-09-30 00:43:48 +00001906#ifdef LIBXML_SAX1_ENABLED
Daniel Veillard07cb8222003-09-10 10:51:05 +00001907 } else {
1908 ret->startElementNs = NULL;
1909 ret->endElementNs = NULL;
1910 }
Daniel Veillard81273902003-09-30 00:43:48 +00001911#endif /* LIBXML_SAX1_ENABLED */
Daniel Veillardea7751d2002-12-20 00:16:24 +00001912 ret->characters = ret->sax->characters;
1913 ret->sax->characters = xmlTextReaderCharacters;
Daniel Veillard40412cd2003-09-03 13:28:32 +00001914 ret->sax->ignorableWhitespace = xmlTextReaderCharacters;
Daniel Veillardea7751d2002-12-20 00:16:24 +00001915 ret->cdataBlock = ret->sax->cdataBlock;
1916 ret->sax->cdataBlock = xmlTextReaderCDataBlock;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001917
Daniel Veillard67df8092002-12-16 22:04:11 +00001918 ret->mode = XML_TEXTREADER_MODE_INITIAL;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001919 ret->node = NULL;
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001920 ret->curnode = NULL;
Daniel Veillard53350552003-09-18 13:35:51 +00001921 if (ret->input->buffer->use < 4) {
William M. Brack899e64a2003-09-26 18:03:42 +00001922 xmlParserInputBufferRead(input, 4);
Daniel Veillard53350552003-09-18 13:35:51 +00001923 }
1924 if (ret->input->buffer->use >= 4) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001925 ret->ctxt = xmlCreatePushParserCtxt(ret->sax, NULL,
Daniel Veillardea7751d2002-12-20 00:16:24 +00001926 (const char *) ret->input->buffer->content, 4, URI);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001927 ret->base = 0;
1928 ret->cur = 4;
1929 } else {
Daniel Veillardea7751d2002-12-20 00:16:24 +00001930 ret->ctxt = xmlCreatePushParserCtxt(ret->sax, NULL, NULL, 0, URI);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001931 ret->base = 0;
1932 ret->cur = 0;
1933 }
Daniel Veillard0df3bc32004-06-08 12:03:41 +00001934
Daniel Veillarda76fe5c2003-04-24 16:06:47 +00001935 if (ret->ctxt == NULL) {
1936 xmlGenericError(xmlGenericErrorContext,
1937 "xmlNewTextReader : malloc failed\n");
William M. Brack42331a92004-07-29 07:07:16 +00001938 xmlBufferFree(ret->buffer);
Daniel Veillarda76fe5c2003-04-24 16:06:47 +00001939 xmlFree(ret->sax);
1940 xmlFree(ret);
1941 return(NULL);
1942 }
Daniel Veillard0df3bc32004-06-08 12:03:41 +00001943 ret->ctxt->parseMode = XML_PARSE_READER;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001944 ret->ctxt->_private = ret;
Daniel Veillardea7751d2002-12-20 00:16:24 +00001945 ret->ctxt->linenumbers = 1;
Daniel Veillard9f7eb0b2003-09-17 10:26:25 +00001946 ret->ctxt->dictNames = 1;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001947 ret->allocs = XML_TEXTREADER_CTXT;
Daniel Veillard40412cd2003-09-03 13:28:32 +00001948 /*
1949 * use the parser dictionnary to allocate all elements and attributes names
1950 */
1951 ret->ctxt->docdict = 1;
Daniel Veillard198c1bf2003-10-20 17:07:41 +00001952 ret->dict = ret->ctxt->dict;
Daniel Veillard7899c5c2003-11-03 12:31:38 +00001953#ifdef LIBXML_XINCLUDE_ENABLED
1954 ret->xinclude = 0;
1955#endif
Daniel Veillard1e906612003-12-05 14:57:46 +00001956#ifdef LIBXML_PATTERN_ENABLED
1957 ret->patternMax = 0;
1958 ret->patternTab = NULL;
1959#endif
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001960 return(ret);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001961}
1962
1963/**
1964 * xmlNewTextReaderFilename:
1965 * @URI: the URI of the resource to process
1966 *
1967 * Create an xmlTextReader structure fed with the resource at @URI
1968 *
1969 * Returns the new xmlTextReaderPtr or NULL in case of error
1970 */
1971xmlTextReaderPtr
1972xmlNewTextReaderFilename(const char *URI) {
1973 xmlParserInputBufferPtr input;
1974 xmlTextReaderPtr ret;
Daniel Veillardea7751d2002-12-20 00:16:24 +00001975 char *directory = NULL;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001976
1977 input = xmlParserInputBufferCreateFilename(URI, XML_CHAR_ENCODING_NONE);
1978 if (input == NULL)
1979 return(NULL);
Daniel Veillardea7751d2002-12-20 00:16:24 +00001980 ret = xmlNewTextReader(input, URI);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001981 if (ret == NULL) {
1982 xmlFreeParserInputBuffer(input);
1983 return(NULL);
1984 }
1985 ret->allocs |= XML_TEXTREADER_INPUT;
Daniel Veillardea7751d2002-12-20 00:16:24 +00001986 if (ret->ctxt->directory == NULL)
1987 directory = xmlParserGetDirectory(URI);
1988 if ((ret->ctxt->directory == NULL) && (directory != NULL))
1989 ret->ctxt->directory = (char *) xmlStrdup((xmlChar *) directory);
1990 if (directory != NULL)
1991 xmlFree(directory);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001992 return(ret);
1993}
1994
1995/**
1996 * xmlFreeTextReader:
1997 * @reader: the xmlTextReaderPtr
1998 *
1999 * Deallocate all the resources associated to the reader
2000 */
2001void
2002xmlFreeTextReader(xmlTextReaderPtr reader) {
2003 if (reader == NULL)
2004 return;
Daniel Veillard37fc84d2003-05-09 19:38:15 +00002005#ifdef LIBXML_SCHEMAS_ENABLED
Daniel Veillardf4e55762003-04-15 23:32:22 +00002006 if (reader->rngSchemas != NULL) {
2007 xmlRelaxNGFree(reader->rngSchemas);
2008 reader->rngSchemas = NULL;
2009 }
2010 if (reader->rngValidCtxt != NULL) {
2011 xmlRelaxNGFreeValidCtxt(reader->rngValidCtxt);
2012 reader->rngValidCtxt = NULL;
2013 }
Daniel Veillard37fc84d2003-05-09 19:38:15 +00002014#endif
Daniel Veillard7899c5c2003-11-03 12:31:38 +00002015#ifdef LIBXML_XINCLUDE_ENABLED
2016 if (reader->xincctxt != NULL)
2017 xmlXIncludeFreeContext(reader->xincctxt);
2018#endif
Daniel Veillard1e906612003-12-05 14:57:46 +00002019#ifdef LIBXML_PATTERN_ENABLED
2020 if (reader->patternTab != NULL) {
2021 int i;
2022 for (i = 0;i < reader->patternNr;i++) {
2023 if (reader->patternTab[i] != NULL)
2024 xmlFreePattern(reader->patternTab[i]);
2025 }
2026 xmlFree(reader->patternTab);
2027 }
2028#endif
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002029 if (reader->ctxt != NULL) {
Daniel Veillard198c1bf2003-10-20 17:07:41 +00002030 if (reader->dict == reader->ctxt->dict)
2031 reader->dict = NULL;
Daniel Veillard9ee35f32003-09-28 00:19:54 +00002032 if (reader->ctxt->myDoc != NULL) {
2033 if (reader->preserve == 0)
2034 xmlTextReaderFreeDoc(reader, reader->ctxt->myDoc);
2035 reader->ctxt->myDoc = NULL;
2036 }
Daniel Veillard336fc7d2002-12-27 19:37:04 +00002037 if ((reader->ctxt->vctxt.vstateTab != NULL) &&
2038 (reader->ctxt->vctxt.vstateMax > 0)){
2039 xmlFree(reader->ctxt->vctxt.vstateTab);
2040 reader->ctxt->vctxt.vstateTab = 0;
2041 reader->ctxt->vctxt.vstateMax = 0;
2042 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002043 if (reader->allocs & XML_TEXTREADER_CTXT)
2044 xmlFreeParserCtxt(reader->ctxt);
2045 }
2046 if (reader->sax != NULL)
2047 xmlFree(reader->sax);
2048 if ((reader->input != NULL) && (reader->allocs & XML_TEXTREADER_INPUT))
2049 xmlFreeParserInputBuffer(reader->input);
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00002050 if (reader->faketext != NULL) {
2051 xmlFreeNode(reader->faketext);
2052 }
Daniel Veillard198c1bf2003-10-20 17:07:41 +00002053 if (reader->buffer != NULL)
2054 xmlBufferFree(reader->buffer);
Daniel Veillard1fdfd112003-01-03 01:18:43 +00002055 if (reader->entTab != NULL)
2056 xmlFree(reader->entTab);
Daniel Veillard198c1bf2003-10-20 17:07:41 +00002057 if (reader->dict != NULL)
2058 xmlDictFree(reader->dict);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002059 xmlFree(reader);
2060}
2061
2062/************************************************************************
2063 * *
Daniel Veillard0eb38c72002-12-14 23:00:35 +00002064 * Methods for XmlTextReader *
2065 * *
2066 ************************************************************************/
2067/**
2068 * xmlTextReaderClose:
2069 * @reader: the xmlTextReaderPtr used
2070 *
2071 * This method releases any resources allocated by the current instance
2072 * changes the state to Closed and close any underlying input.
2073 *
2074 * Returns 0 or -1 in case of error
2075 */
2076int
2077xmlTextReaderClose(xmlTextReaderPtr reader) {
2078 if (reader == NULL)
2079 return(-1);
2080 reader->node = NULL;
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002081 reader->curnode = NULL;
Daniel Veillard0eb38c72002-12-14 23:00:35 +00002082 reader->mode = XML_TEXTREADER_MODE_CLOSED;
2083 if (reader->ctxt != NULL) {
Daniel Veillardee1d6922004-04-18 14:58:57 +00002084 xmlStopParser(reader->ctxt);
Daniel Veillard0eb38c72002-12-14 23:00:35 +00002085 if (reader->ctxt->myDoc != NULL) {
Daniel Veillard9ee35f32003-09-28 00:19:54 +00002086 if (reader->preserve == 0)
2087 xmlTextReaderFreeDoc(reader, reader->ctxt->myDoc);
Daniel Veillard0eb38c72002-12-14 23:00:35 +00002088 reader->ctxt->myDoc = NULL;
2089 }
Daniel Veillard0eb38c72002-12-14 23:00:35 +00002090 }
2091 if ((reader->input != NULL) && (reader->allocs & XML_TEXTREADER_INPUT)) {
2092 xmlFreeParserInputBuffer(reader->input);
2093 reader->allocs -= XML_TEXTREADER_INPUT;
2094 }
2095 return(0);
2096}
2097
2098/**
2099 * xmlTextReaderGetAttributeNo:
2100 * @reader: the xmlTextReaderPtr used
2101 * @no: the zero-based index of the attribute relative to the containing element
2102 *
2103 * Provides the value of the attribute with the specified index relative
2104 * to the containing element.
2105 *
2106 * Returns a string containing the value of the specified attribute, or NULL
2107 * in case of error. The string must be deallocated by the caller.
2108 */
2109xmlChar *
2110xmlTextReaderGetAttributeNo(xmlTextReaderPtr reader, int no) {
2111 xmlChar *ret;
2112 int i;
2113 xmlAttrPtr cur;
2114 xmlNsPtr ns;
2115
2116 if (reader == NULL)
2117 return(NULL);
2118 if (reader->node == NULL)
2119 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002120 if (reader->curnode != NULL)
2121 return(NULL);
Daniel Veillard0eb38c72002-12-14 23:00:35 +00002122 /* TODO: handle the xmlDecl */
2123 if (reader->node->type != XML_ELEMENT_NODE)
2124 return(NULL);
2125
2126 ns = reader->node->nsDef;
2127 for (i = 0;(i < no) && (ns != NULL);i++) {
2128 ns = ns->next;
2129 }
2130 if (ns != NULL)
2131 return(xmlStrdup(ns->href));
2132
2133 cur = reader->node->properties;
2134 if (cur == NULL)
2135 return(NULL);
2136 for (;i < no;i++) {
2137 cur = cur->next;
2138 if (cur == NULL)
2139 return(NULL);
2140 }
2141 /* TODO walk the DTD if present */
2142
2143 ret = xmlNodeListGetString(reader->node->doc, cur->children, 1);
2144 if (ret == NULL) return(xmlStrdup((xmlChar *)""));
2145 return(ret);
2146}
2147
2148/**
2149 * xmlTextReaderGetAttribute:
2150 * @reader: the xmlTextReaderPtr used
2151 * @name: the qualified name of the attribute.
2152 *
2153 * Provides the value of the attribute with the specified qualified name.
2154 *
2155 * Returns a string containing the value of the specified attribute, or NULL
2156 * in case of error. The string must be deallocated by the caller.
2157 */
2158xmlChar *
2159xmlTextReaderGetAttribute(xmlTextReaderPtr reader, const xmlChar *name) {
2160 xmlChar *prefix = NULL;
2161 xmlChar *localname;
2162 xmlNsPtr ns;
2163 xmlChar *ret = NULL;
2164
2165 if ((reader == NULL) || (name == NULL))
2166 return(NULL);
2167 if (reader->node == NULL)
2168 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002169 if (reader->curnode != NULL)
2170 return(NULL);
Daniel Veillard0eb38c72002-12-14 23:00:35 +00002171
2172 /* TODO: handle the xmlDecl */
2173 if (reader->node->type != XML_ELEMENT_NODE)
2174 return(NULL);
2175
2176 localname = xmlSplitQName2(name, &prefix);
2177 if (localname == NULL)
2178 return(xmlGetProp(reader->node, name));
2179
2180 ns = xmlSearchNs(reader->node->doc, reader->node, prefix);
2181 if (ns != NULL)
2182 ret = xmlGetNsProp(reader->node, localname, ns->href);
2183
2184 if (localname != NULL)
2185 xmlFree(localname);
2186 if (prefix != NULL)
2187 xmlFree(prefix);
2188 return(ret);
2189}
2190
2191
2192/**
2193 * xmlTextReaderGetAttributeNs:
2194 * @reader: the xmlTextReaderPtr used
2195 * @localName: the local name of the attribute.
2196 * @namespaceURI: the namespace URI of the attribute.
2197 *
2198 * Provides the value of the specified attribute
2199 *
2200 * Returns a string containing the value of the specified attribute, or NULL
2201 * in case of error. The string must be deallocated by the caller.
2202 */
2203xmlChar *
2204xmlTextReaderGetAttributeNs(xmlTextReaderPtr reader, const xmlChar *localName,
2205 const xmlChar *namespaceURI) {
2206 if ((reader == NULL) || (localName == NULL))
2207 return(NULL);
2208 if (reader->node == NULL)
2209 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002210 if (reader->curnode != NULL)
2211 return(NULL);
Daniel Veillard0eb38c72002-12-14 23:00:35 +00002212
2213 /* TODO: handle the xmlDecl */
2214 if (reader->node->type != XML_ELEMENT_NODE)
2215 return(NULL);
2216
2217 return(xmlGetNsProp(reader->node, localName, namespaceURI));
2218}
2219
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002220/**
2221 * xmlTextReaderGetRemainder:
2222 * @reader: the xmlTextReaderPtr used
2223 *
2224 * Method to get the remainder of the buffered XML. this method stops the
2225 * parser, set its state to End Of File and return the input stream with
2226 * what is left that the parser did not use.
2227 *
Daniel Veillardee1d6922004-04-18 14:58:57 +00002228 * The implementation is not good, the parser certainly procgressed past
2229 * what's left in reader->input, and there is an allocation problem. Best
2230 * would be to rewrite it differently.
2231 *
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002232 * Returns the xmlParserInputBufferPtr attached to the XML or NULL
2233 * in case of error.
2234 */
2235xmlParserInputBufferPtr
2236xmlTextReaderGetRemainder(xmlTextReaderPtr reader) {
2237 xmlParserInputBufferPtr ret = NULL;
2238
2239 if (reader == NULL)
2240 return(NULL);
2241 if (reader->node == NULL)
2242 return(NULL);
2243
2244 reader->node = NULL;
2245 reader->curnode = NULL;
2246 reader->mode = XML_TEXTREADER_MODE_EOF;
2247 if (reader->ctxt != NULL) {
Daniel Veillardee1d6922004-04-18 14:58:57 +00002248 xmlStopParser(reader->ctxt);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002249 if (reader->ctxt->myDoc != NULL) {
Daniel Veillard9ee35f32003-09-28 00:19:54 +00002250 if (reader->preserve == 0)
2251 xmlTextReaderFreeDoc(reader, reader->ctxt->myDoc);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002252 reader->ctxt->myDoc = NULL;
2253 }
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002254 }
2255 if (reader->allocs & XML_TEXTREADER_INPUT) {
2256 ret = reader->input;
Daniel Veillardee1d6922004-04-18 14:58:57 +00002257 reader->input = NULL;
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002258 reader->allocs -= XML_TEXTREADER_INPUT;
2259 } else {
2260 /*
2261 * Hum, one may need to duplicate the data structure because
2262 * without reference counting the input may be freed twice:
2263 * - by the layer which allocated it.
2264 * - by the layer to which would have been returned to.
2265 */
2266 TODO
2267 return(NULL);
2268 }
2269 return(ret);
2270}
2271
2272/**
2273 * xmlTextReaderLookupNamespace:
2274 * @reader: the xmlTextReaderPtr used
2275 * @prefix: the prefix whose namespace URI is to be resolved. To return
2276 * the default namespace, specify NULL
2277 *
2278 * Resolves a namespace prefix in the scope of the current element.
2279 *
2280 * Returns a string containing the namespace URI to which the prefix maps
2281 * or NULL in case of error. The string must be deallocated by the caller.
2282 */
2283xmlChar *
2284xmlTextReaderLookupNamespace(xmlTextReaderPtr reader, const xmlChar *prefix) {
2285 xmlNsPtr ns;
2286
2287 if (reader == NULL)
2288 return(NULL);
2289 if (reader->node == NULL)
2290 return(NULL);
2291
2292 ns = xmlSearchNs(reader->node->doc, reader->node, prefix);
2293 if (ns == NULL)
2294 return(NULL);
2295 return(xmlStrdup(ns->href));
2296}
2297
2298/**
2299 * xmlTextReaderMoveToAttributeNo:
2300 * @reader: the xmlTextReaderPtr used
2301 * @no: the zero-based index of the attribute relative to the containing
2302 * element.
2303 *
2304 * Moves the position of the current instance to the attribute with
2305 * the specified index relative to the containing element.
2306 *
2307 * Returns 1 in case of success, -1 in case of error, 0 if not found
2308 */
2309int
2310xmlTextReaderMoveToAttributeNo(xmlTextReaderPtr reader, int no) {
2311 int i;
2312 xmlAttrPtr cur;
2313 xmlNsPtr ns;
2314
2315 if (reader == NULL)
2316 return(-1);
2317 if (reader->node == NULL)
2318 return(-1);
2319 /* TODO: handle the xmlDecl */
2320 if (reader->node->type != XML_ELEMENT_NODE)
2321 return(-1);
2322
2323 reader->curnode = NULL;
2324
2325 ns = reader->node->nsDef;
2326 for (i = 0;(i < no) && (ns != NULL);i++) {
2327 ns = ns->next;
2328 }
2329 if (ns != NULL) {
2330 reader->curnode = (xmlNodePtr) ns;
2331 return(1);
2332 }
2333
2334 cur = reader->node->properties;
2335 if (cur == NULL)
2336 return(0);
2337 for (;i < no;i++) {
2338 cur = cur->next;
2339 if (cur == NULL)
2340 return(0);
2341 }
2342 /* TODO walk the DTD if present */
2343
2344 reader->curnode = (xmlNodePtr) cur;
2345 return(1);
2346}
2347
2348/**
2349 * xmlTextReaderMoveToAttribute:
2350 * @reader: the xmlTextReaderPtr used
2351 * @name: the qualified name of the attribute.
2352 *
2353 * Moves the position of the current instance to the attribute with
2354 * the specified qualified name.
2355 *
2356 * Returns 1 in case of success, -1 in case of error, 0 if not found
2357 */
2358int
2359xmlTextReaderMoveToAttribute(xmlTextReaderPtr reader, const xmlChar *name) {
2360 xmlChar *prefix = NULL;
2361 xmlChar *localname;
2362 xmlNsPtr ns;
2363 xmlAttrPtr prop;
2364
2365 if ((reader == NULL) || (name == NULL))
2366 return(-1);
2367 if (reader->node == NULL)
2368 return(-1);
2369
2370 /* TODO: handle the xmlDecl */
2371 if (reader->node->type != XML_ELEMENT_NODE)
2372 return(0);
2373
2374 localname = xmlSplitQName2(name, &prefix);
2375 if (localname == NULL) {
2376 /*
2377 * Namespace default decl
2378 */
2379 if (xmlStrEqual(name, BAD_CAST "xmlns")) {
2380 ns = reader->node->nsDef;
2381 while (ns != NULL) {
2382 if (ns->prefix == NULL) {
2383 reader->curnode = (xmlNodePtr) ns;
2384 return(1);
2385 }
2386 ns = ns->next;
2387 }
2388 return(0);
2389 }
2390
2391 prop = reader->node->properties;
2392 while (prop != NULL) {
2393 /*
2394 * One need to have
2395 * - same attribute names
2396 * - and the attribute carrying that namespace
2397 */
2398 if ((xmlStrEqual(prop->name, name)) &&
2399 ((prop->ns == NULL) || (prop->ns->prefix == NULL))) {
2400 reader->curnode = (xmlNodePtr) prop;
2401 return(1);
2402 }
2403 prop = prop->next;
2404 }
2405 return(0);
2406 }
2407
2408 /*
2409 * Namespace default decl
2410 */
2411 if (xmlStrEqual(prefix, BAD_CAST "xmlns")) {
2412 ns = reader->node->nsDef;
2413 while (ns != NULL) {
2414 if ((ns->prefix != NULL) && (xmlStrEqual(ns->prefix, localname))) {
2415 reader->curnode = (xmlNodePtr) ns;
2416 goto found;
2417 }
2418 ns = ns->next;
2419 }
2420 goto not_found;
2421 }
2422 prop = reader->node->properties;
2423 while (prop != NULL) {
2424 /*
2425 * One need to have
2426 * - same attribute names
2427 * - and the attribute carrying that namespace
2428 */
2429 if ((xmlStrEqual(prop->name, localname)) &&
2430 (prop->ns != NULL) && (xmlStrEqual(prop->ns->prefix, prefix))) {
2431 reader->curnode = (xmlNodePtr) prop;
2432 goto found;
2433 }
2434 prop = prop->next;
2435 }
2436not_found:
2437 if (localname != NULL)
2438 xmlFree(localname);
2439 if (prefix != NULL)
2440 xmlFree(prefix);
2441 return(0);
2442
2443found:
2444 if (localname != NULL)
2445 xmlFree(localname);
2446 if (prefix != NULL)
2447 xmlFree(prefix);
2448 return(1);
2449}
2450
2451/**
2452 * xmlTextReaderMoveToAttributeNs:
2453 * @reader: the xmlTextReaderPtr used
2454 * @localName: the local name of the attribute.
2455 * @namespaceURI: the namespace URI of the attribute.
2456 *
2457 * Moves the position of the current instance to the attribute with the
2458 * specified local name and namespace URI.
2459 *
2460 * Returns 1 in case of success, -1 in case of error, 0 if not found
2461 */
2462int
2463xmlTextReaderMoveToAttributeNs(xmlTextReaderPtr reader,
2464 const xmlChar *localName, const xmlChar *namespaceURI) {
2465 xmlAttrPtr prop;
2466 xmlNodePtr node;
2467
2468 if ((reader == NULL) || (localName == NULL) || (namespaceURI == NULL))
2469 return(-1);
2470 if (reader->node == NULL)
2471 return(-1);
2472 if (reader->node->type != XML_ELEMENT_NODE)
2473 return(0);
2474 node = reader->node;
2475
2476 /*
2477 * A priori reading http://www.w3.org/TR/REC-xml-names/ there is no
2478 * namespace name associated to "xmlns"
2479 */
2480 prop = node->properties;
2481 while (prop != NULL) {
2482 /*
2483 * One need to have
2484 * - same attribute names
2485 * - and the attribute carrying that namespace
2486 */
2487 if (xmlStrEqual(prop->name, localName) &&
2488 ((prop->ns != NULL) &&
2489 (xmlStrEqual(prop->ns->href, namespaceURI)))) {
2490 reader->curnode = (xmlNodePtr) prop;
2491 return(1);
2492 }
2493 prop = prop->next;
2494 }
2495 return(0);
2496}
2497
2498/**
2499 * xmlTextReaderMoveToFirstAttribute:
2500 * @reader: the xmlTextReaderPtr used
2501 *
2502 * Moves the position of the current instance to the first attribute
2503 * associated with the current node.
2504 *
2505 * Returns 1 in case of success, -1 in case of error, 0 if not found
2506 */
2507int
2508xmlTextReaderMoveToFirstAttribute(xmlTextReaderPtr reader) {
2509 if (reader == NULL)
2510 return(-1);
2511 if (reader->node == NULL)
2512 return(-1);
2513 if (reader->node->type != XML_ELEMENT_NODE)
2514 return(0);
2515
2516 if (reader->node->nsDef != NULL) {
2517 reader->curnode = (xmlNodePtr) reader->node->nsDef;
2518 return(1);
2519 }
2520 if (reader->node->properties != NULL) {
2521 reader->curnode = (xmlNodePtr) reader->node->properties;
2522 return(1);
2523 }
2524 return(0);
2525}
2526
2527/**
2528 * xmlTextReaderMoveToNextAttribute:
2529 * @reader: the xmlTextReaderPtr used
2530 *
2531 * Moves the position of the current instance to the next attribute
2532 * associated with the current node.
2533 *
2534 * Returns 1 in case of success, -1 in case of error, 0 if not found
2535 */
2536int
2537xmlTextReaderMoveToNextAttribute(xmlTextReaderPtr reader) {
2538 if (reader == NULL)
2539 return(-1);
2540 if (reader->node == NULL)
2541 return(-1);
2542 if (reader->node->type != XML_ELEMENT_NODE)
2543 return(0);
2544 if (reader->curnode == NULL)
2545 return(xmlTextReaderMoveToFirstAttribute(reader));
2546
2547 if (reader->curnode->type == XML_NAMESPACE_DECL) {
2548 xmlNsPtr ns = (xmlNsPtr) reader->curnode;
2549 if (ns->next != NULL) {
2550 reader->curnode = (xmlNodePtr) ns->next;
2551 return(1);
2552 }
2553 if (reader->node->properties != NULL) {
2554 reader->curnode = (xmlNodePtr) reader->node->properties;
2555 return(1);
2556 }
2557 return(0);
2558 } else if ((reader->curnode->type == XML_ATTRIBUTE_NODE) &&
2559 (reader->curnode->next != NULL)) {
2560 reader->curnode = reader->curnode->next;
2561 return(1);
2562 }
2563 return(0);
2564}
2565
2566/**
2567 * xmlTextReaderMoveToElement:
2568 * @reader: the xmlTextReaderPtr used
2569 *
2570 * Moves the position of the current instance to the node that
2571 * contains the current Attribute node.
2572 *
2573 * Returns 1 in case of success, -1 in case of error, 0 if not moved
2574 */
2575int
2576xmlTextReaderMoveToElement(xmlTextReaderPtr reader) {
2577 if (reader == NULL)
2578 return(-1);
2579 if (reader->node == NULL)
2580 return(-1);
2581 if (reader->node->type != XML_ELEMENT_NODE)
2582 return(0);
2583 if (reader->curnode != NULL) {
2584 reader->curnode = NULL;
2585 return(1);
2586 }
2587 return(0);
2588}
2589
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00002590/**
2591 * xmlTextReaderReadAttributeValue:
2592 * @reader: the xmlTextReaderPtr used
2593 *
2594 * Parses an attribute value into one or more Text and EntityReference nodes.
2595 *
2596 * Returns 1 in case of success, 0 if the reader was not positionned on an
2597 * ttribute node or all the attribute values have been read, or -1
2598 * in case of error.
2599 */
2600int
2601xmlTextReaderReadAttributeValue(xmlTextReaderPtr reader) {
2602 if (reader == NULL)
2603 return(-1);
2604 if (reader->node == NULL)
2605 return(-1);
2606 if (reader->curnode == NULL)
2607 return(0);
2608 if (reader->curnode->type == XML_ATTRIBUTE_NODE) {
2609 if (reader->curnode->children == NULL)
2610 return(0);
2611 reader->curnode = reader->curnode->children;
2612 } else if (reader->curnode->type == XML_NAMESPACE_DECL) {
2613 xmlNsPtr ns = (xmlNsPtr) reader->curnode;
2614
2615 if (reader->faketext == NULL) {
2616 reader->faketext = xmlNewDocText(reader->node->doc,
2617 ns->href);
2618 } else {
2619 if (reader->faketext->content != NULL)
2620 xmlFree(reader->faketext->content);
2621 reader->faketext->content = xmlStrdup(ns->href);
2622 }
2623 reader->curnode = reader->faketext;
2624 } else {
2625 if (reader->curnode->next == NULL)
2626 return(0);
2627 reader->curnode = reader->curnode->next;
2628 }
2629 return(1);
2630}
2631
Daniel Veillarde2811272004-10-19 09:04:23 +00002632/**
2633 * xmlTextReaderConstEncoding:
2634 * @reader: the xmlTextReaderPtr used
2635 *
2636 * Determine the encoding of the document being read.
2637 *
2638 * Returns a string containing the encoding of the document or NULL in
2639 * case of error. The string is deallocated with the reader.
2640 */
2641const xmlChar *
2642xmlTextReaderConstEncoding(xmlTextReaderPtr reader) {
2643 xmlDocPtr doc = NULL;
2644 if (reader == NULL)
2645 return(NULL);
2646 if (reader->doc != NULL)
2647 doc = reader->doc;
2648 else if (reader->ctxt != NULL)
2649 doc = reader->ctxt->myDoc;
2650 if (doc == NULL)
2651 return(NULL);
2652
2653 if (doc->encoding == NULL)
2654 return(NULL);
2655 else
2656 return(CONSTSTR(doc->encoding));
2657}
2658
2659
Daniel Veillard0eb38c72002-12-14 23:00:35 +00002660/************************************************************************
2661 * *
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002662 * Access API to the current node *
2663 * *
2664 ************************************************************************/
2665/**
2666 * xmlTextReaderAttributeCount:
2667 * @reader: the xmlTextReaderPtr used
2668 *
Daniel Veillarda9b66d02002-12-11 14:23:49 +00002669 * Provides the number of attributes of the current node
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002670 *
2671 * Returns 0 i no attributes, -1 in case of error or the attribute count
2672 */
2673int
2674xmlTextReaderAttributeCount(xmlTextReaderPtr reader) {
2675 int ret;
2676 xmlAttrPtr attr;
Daniel Veillard67df8092002-12-16 22:04:11 +00002677 xmlNsPtr ns;
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002678 xmlNodePtr node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002679
2680 if (reader == NULL)
2681 return(-1);
2682 if (reader->node == NULL)
2683 return(0);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002684
2685 if (reader->curnode != NULL)
2686 node = reader->curnode;
2687 else
2688 node = reader->node;
2689
2690 if (node->type != XML_ELEMENT_NODE)
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002691 return(0);
2692 if ((reader->state == XML_TEXTREADER_END) ||
2693 (reader->state == XML_TEXTREADER_BACKTRACK))
2694 return(0);
2695 ret = 0;
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002696 attr = node->properties;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002697 while (attr != NULL) {
2698 ret++;
2699 attr = attr->next;
2700 }
Daniel Veillard67df8092002-12-16 22:04:11 +00002701 ns = node->nsDef;
2702 while (ns != NULL) {
2703 ret++;
2704 ns = ns->next;
2705 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002706 return(ret);
2707}
2708
2709/**
2710 * xmlTextReaderNodeType:
2711 * @reader: the xmlTextReaderPtr used
2712 *
2713 * Get the node type of the current node
2714 * Reference:
2715 * http://dotgnu.org/pnetlib-doc/System/Xml/XmlNodeType.html
2716 *
2717 * Returns the xmlNodeType of the current node or -1 in case of error
2718 */
2719int
2720xmlTextReaderNodeType(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002721 xmlNodePtr node;
Daniel Veillardd6038e02003-07-30 16:37:18 +00002722
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002723 if (reader == NULL)
2724 return(-1);
2725 if (reader->node == NULL)
Daniel Veillardd6038e02003-07-30 16:37:18 +00002726 return(XML_READER_TYPE_NONE);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002727 if (reader->curnode != NULL)
2728 node = reader->curnode;
2729 else
2730 node = reader->node;
2731 switch (node->type) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002732 case XML_ELEMENT_NODE:
2733 if ((reader->state == XML_TEXTREADER_END) ||
2734 (reader->state == XML_TEXTREADER_BACKTRACK))
Daniel Veillardd6038e02003-07-30 16:37:18 +00002735 return(XML_READER_TYPE_END_ELEMENT);
2736 return(XML_READER_TYPE_ELEMENT);
Daniel Veillardecaba492002-12-30 10:55:29 +00002737 case XML_NAMESPACE_DECL:
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002738 case XML_ATTRIBUTE_NODE:
Daniel Veillardd6038e02003-07-30 16:37:18 +00002739 return(XML_READER_TYPE_ATTRIBUTE);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002740 case XML_TEXT_NODE:
Daniel Veillardd6038e02003-07-30 16:37:18 +00002741 if (xmlIsBlankNode(reader->node)) {
2742 if (xmlNodeGetSpacePreserve(reader->node))
2743 return(XML_READER_TYPE_SIGNIFICANT_WHITESPACE);
2744 else
2745 return(XML_READER_TYPE_WHITESPACE);
2746 } else {
2747 return(XML_READER_TYPE_TEXT);
2748 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002749 case XML_CDATA_SECTION_NODE:
Daniel Veillardd6038e02003-07-30 16:37:18 +00002750 return(XML_READER_TYPE_CDATA);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002751 case XML_ENTITY_REF_NODE:
Daniel Veillardd6038e02003-07-30 16:37:18 +00002752 return(XML_READER_TYPE_ENTITY_REFERENCE);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002753 case XML_ENTITY_NODE:
Daniel Veillardd6038e02003-07-30 16:37:18 +00002754 return(XML_READER_TYPE_ENTITY);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002755 case XML_PI_NODE:
Daniel Veillardd6038e02003-07-30 16:37:18 +00002756 return(XML_READER_TYPE_PROCESSING_INSTRUCTION);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002757 case XML_COMMENT_NODE:
Daniel Veillardd6038e02003-07-30 16:37:18 +00002758 return(XML_READER_TYPE_COMMENT);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002759 case XML_DOCUMENT_NODE:
2760 case XML_HTML_DOCUMENT_NODE:
2761#ifdef LIBXML_DOCB_ENABLED
2762 case XML_DOCB_DOCUMENT_NODE:
2763#endif
Daniel Veillardd6038e02003-07-30 16:37:18 +00002764 return(XML_READER_TYPE_DOCUMENT);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002765 case XML_DOCUMENT_FRAG_NODE:
Daniel Veillardd6038e02003-07-30 16:37:18 +00002766 return(XML_READER_TYPE_DOCUMENT_FRAGMENT);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002767 case XML_NOTATION_NODE:
Daniel Veillardd6038e02003-07-30 16:37:18 +00002768 return(XML_READER_TYPE_NOTATION);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002769 case XML_DOCUMENT_TYPE_NODE:
2770 case XML_DTD_NODE:
Daniel Veillardd6038e02003-07-30 16:37:18 +00002771 return(XML_READER_TYPE_DOCUMENT_TYPE);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002772
2773 case XML_ELEMENT_DECL:
2774 case XML_ATTRIBUTE_DECL:
2775 case XML_ENTITY_DECL:
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002776 case XML_XINCLUDE_START:
2777 case XML_XINCLUDE_END:
Daniel Veillardd6038e02003-07-30 16:37:18 +00002778 return(XML_READER_TYPE_NONE);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002779 }
2780 return(-1);
2781}
2782
2783/**
Daniel Veillard01c13b52002-12-10 15:19:08 +00002784 * xmlTextReaderIsEmptyElement:
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002785 * @reader: the xmlTextReaderPtr used
2786 *
2787 * Check if the current node is empty
2788 *
2789 * Returns 1 if empty, 0 if not and -1 in case of error
2790 */
2791int
2792xmlTextReaderIsEmptyElement(xmlTextReaderPtr reader) {
2793 if ((reader == NULL) || (reader->node == NULL))
2794 return(-1);
Daniel Veillarddf512f42002-12-23 15:56:21 +00002795 if (reader->node->type != XML_ELEMENT_NODE)
2796 return(0);
Daniel Veillarde3c036e2003-01-01 15:11:05 +00002797 if (reader->curnode != NULL)
2798 return(0);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002799 if (reader->node->children != NULL)
2800 return(0);
Daniel Veillarddab8ea92003-01-02 14:16:45 +00002801 if (reader->state == XML_TEXTREADER_END)
2802 return(0);
Daniel Veillard7899c5c2003-11-03 12:31:38 +00002803 if (reader->doc != NULL)
2804 return(1);
Daniel Veillard96b6cd22004-01-08 16:49:50 +00002805#ifdef LIBXML_XINCLUDE_ENABLED
Daniel Veillard7899c5c2003-11-03 12:31:38 +00002806 if (reader->in_xinclude > 0)
2807 return(1);
Daniel Veillard96b6cd22004-01-08 16:49:50 +00002808#endif
Daniel Veillarde8039df2003-10-27 11:25:13 +00002809 return((reader->node->extra & NODE_IS_EMPTY) != 0);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002810}
2811
2812/**
2813 * xmlTextReaderLocalName:
2814 * @reader: the xmlTextReaderPtr used
2815 *
2816 * The local name of the node.
2817 *
2818 * Returns the local name or NULL if not available
2819 */
2820xmlChar *
2821xmlTextReaderLocalName(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002822 xmlNodePtr node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002823 if ((reader == NULL) || (reader->node == NULL))
2824 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002825 if (reader->curnode != NULL)
2826 node = reader->curnode;
2827 else
2828 node = reader->node;
2829 if (node->type == XML_NAMESPACE_DECL) {
2830 xmlNsPtr ns = (xmlNsPtr) node;
2831 if (ns->prefix == NULL)
2832 return(xmlStrdup(BAD_CAST "xmlns"));
2833 else
2834 return(xmlStrdup(ns->prefix));
2835 }
2836 if ((node->type != XML_ELEMENT_NODE) &&
2837 (node->type != XML_ATTRIBUTE_NODE))
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002838 return(xmlTextReaderName(reader));
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002839 return(xmlStrdup(node->name));
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002840}
2841
2842/**
Daniel Veillarde72c5082003-09-19 12:44:05 +00002843 * xmlTextReaderConstLocalName:
2844 * @reader: the xmlTextReaderPtr used
2845 *
2846 * The local name of the node.
2847 *
2848 * Returns the local name or NULL if not available, the
2849 * string will be deallocated with the reader.
2850 */
2851const xmlChar *
2852xmlTextReaderConstLocalName(xmlTextReaderPtr reader) {
2853 xmlNodePtr node;
2854 if ((reader == NULL) || (reader->node == NULL))
2855 return(NULL);
2856 if (reader->curnode != NULL)
2857 node = reader->curnode;
2858 else
2859 node = reader->node;
2860 if (node->type == XML_NAMESPACE_DECL) {
2861 xmlNsPtr ns = (xmlNsPtr) node;
2862 if (ns->prefix == NULL)
2863 return(CONSTSTR(BAD_CAST "xmlns"));
2864 else
2865 return(ns->prefix);
2866 }
2867 if ((node->type != XML_ELEMENT_NODE) &&
2868 (node->type != XML_ATTRIBUTE_NODE))
2869 return(xmlTextReaderConstName(reader));
2870 return(node->name);
2871}
2872
2873/**
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002874 * xmlTextReaderName:
2875 * @reader: the xmlTextReaderPtr used
2876 *
2877 * The qualified name of the node, equal to Prefix :LocalName.
2878 *
2879 * Returns the local name or NULL if not available
2880 */
2881xmlChar *
2882xmlTextReaderName(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002883 xmlNodePtr node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002884 xmlChar *ret;
2885
2886 if ((reader == NULL) || (reader->node == NULL))
2887 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002888 if (reader->curnode != NULL)
2889 node = reader->curnode;
2890 else
2891 node = reader->node;
2892 switch (node->type) {
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002893 case XML_ELEMENT_NODE:
2894 case XML_ATTRIBUTE_NODE:
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002895 if ((node->ns == NULL) ||
2896 (node->ns->prefix == NULL))
2897 return(xmlStrdup(node->name));
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002898
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002899 ret = xmlStrdup(node->ns->prefix);
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002900 ret = xmlStrcat(ret, BAD_CAST ":");
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002901 ret = xmlStrcat(ret, node->name);
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002902 return(ret);
2903 case XML_TEXT_NODE:
2904 return(xmlStrdup(BAD_CAST "#text"));
2905 case XML_CDATA_SECTION_NODE:
2906 return(xmlStrdup(BAD_CAST "#cdata-section"));
2907 case XML_ENTITY_NODE:
2908 case XML_ENTITY_REF_NODE:
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002909 return(xmlStrdup(node->name));
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002910 case XML_PI_NODE:
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002911 return(xmlStrdup(node->name));
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002912 case XML_COMMENT_NODE:
2913 return(xmlStrdup(BAD_CAST "#comment"));
2914 case XML_DOCUMENT_NODE:
2915 case XML_HTML_DOCUMENT_NODE:
2916#ifdef LIBXML_DOCB_ENABLED
2917 case XML_DOCB_DOCUMENT_NODE:
2918#endif
2919 return(xmlStrdup(BAD_CAST "#document"));
2920 case XML_DOCUMENT_FRAG_NODE:
2921 return(xmlStrdup(BAD_CAST "#document-fragment"));
2922 case XML_NOTATION_NODE:
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002923 return(xmlStrdup(node->name));
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002924 case XML_DOCUMENT_TYPE_NODE:
2925 case XML_DTD_NODE:
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002926 return(xmlStrdup(node->name));
2927 case XML_NAMESPACE_DECL: {
2928 xmlNsPtr ns = (xmlNsPtr) node;
2929
2930 ret = xmlStrdup(BAD_CAST "xmlns");
2931 if (ns->prefix == NULL)
2932 return(ret);
2933 ret = xmlStrcat(ret, BAD_CAST ":");
2934 ret = xmlStrcat(ret, ns->prefix);
2935 return(ret);
2936 }
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002937
2938 case XML_ELEMENT_DECL:
2939 case XML_ATTRIBUTE_DECL:
2940 case XML_ENTITY_DECL:
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002941 case XML_XINCLUDE_START:
2942 case XML_XINCLUDE_END:
2943 return(NULL);
2944 }
2945 return(NULL);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002946}
2947
2948/**
Daniel Veillarde72c5082003-09-19 12:44:05 +00002949 * xmlTextReaderConstName:
2950 * @reader: the xmlTextReaderPtr used
2951 *
2952 * The qualified name of the node, equal to Prefix :LocalName.
2953 *
2954 * Returns the local name or NULL if not available, the string is
2955 * deallocated with the reader.
2956 */
2957const xmlChar *
2958xmlTextReaderConstName(xmlTextReaderPtr reader) {
2959 xmlNodePtr node;
2960
2961 if ((reader == NULL) || (reader->node == NULL))
2962 return(NULL);
2963 if (reader->curnode != NULL)
2964 node = reader->curnode;
2965 else
2966 node = reader->node;
2967 switch (node->type) {
2968 case XML_ELEMENT_NODE:
2969 case XML_ATTRIBUTE_NODE:
2970 if ((node->ns == NULL) ||
2971 (node->ns->prefix == NULL))
2972 return(node->name);
2973 return(CONSTQSTR(node->ns->prefix, node->name));
2974 case XML_TEXT_NODE:
2975 return(CONSTSTR(BAD_CAST "#text"));
2976 case XML_CDATA_SECTION_NODE:
2977 return(CONSTSTR(BAD_CAST "#cdata-section"));
2978 case XML_ENTITY_NODE:
2979 case XML_ENTITY_REF_NODE:
2980 return(CONSTSTR(node->name));
2981 case XML_PI_NODE:
2982 return(CONSTSTR(node->name));
2983 case XML_COMMENT_NODE:
2984 return(CONSTSTR(BAD_CAST "#comment"));
2985 case XML_DOCUMENT_NODE:
2986 case XML_HTML_DOCUMENT_NODE:
2987#ifdef LIBXML_DOCB_ENABLED
2988 case XML_DOCB_DOCUMENT_NODE:
2989#endif
2990 return(CONSTSTR(BAD_CAST "#document"));
2991 case XML_DOCUMENT_FRAG_NODE:
2992 return(CONSTSTR(BAD_CAST "#document-fragment"));
2993 case XML_NOTATION_NODE:
2994 return(CONSTSTR(node->name));
2995 case XML_DOCUMENT_TYPE_NODE:
2996 case XML_DTD_NODE:
2997 return(CONSTSTR(node->name));
2998 case XML_NAMESPACE_DECL: {
2999 xmlNsPtr ns = (xmlNsPtr) node;
3000
3001 if (ns->prefix == NULL)
3002 return(CONSTSTR(BAD_CAST "xmlns"));
3003 return(CONSTQSTR(BAD_CAST "xmlns", ns->prefix));
3004 }
3005
3006 case XML_ELEMENT_DECL:
3007 case XML_ATTRIBUTE_DECL:
3008 case XML_ENTITY_DECL:
3009 case XML_XINCLUDE_START:
3010 case XML_XINCLUDE_END:
3011 return(NULL);
3012 }
3013 return(NULL);
3014}
3015
3016/**
Daniel Veillarde1ca5032002-12-09 14:13:43 +00003017 * xmlTextReaderPrefix:
3018 * @reader: the xmlTextReaderPtr used
3019 *
3020 * A shorthand reference to the namespace associated with the node.
3021 *
3022 * Returns the prefix or NULL if not available
3023 */
3024xmlChar *
3025xmlTextReaderPrefix(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00003026 xmlNodePtr node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00003027 if ((reader == NULL) || (reader->node == NULL))
3028 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00003029 if (reader->curnode != NULL)
3030 node = reader->curnode;
3031 else
3032 node = reader->node;
3033 if (node->type == XML_NAMESPACE_DECL) {
3034 xmlNsPtr ns = (xmlNsPtr) node;
3035 if (ns->prefix == NULL)
3036 return(NULL);
3037 return(xmlStrdup(BAD_CAST "xmlns"));
3038 }
3039 if ((node->type != XML_ELEMENT_NODE) &&
3040 (node->type != XML_ATTRIBUTE_NODE))
Daniel Veillarde1ca5032002-12-09 14:13:43 +00003041 return(NULL);
Daniel Veillard952379b2003-03-17 15:37:12 +00003042 if ((node->ns != NULL) && (node->ns->prefix != NULL))
Daniel Veillardda46d2d2002-12-15 23:36:49 +00003043 return(xmlStrdup(node->ns->prefix));
Daniel Veillarde1ca5032002-12-09 14:13:43 +00003044 return(NULL);
3045}
3046
3047/**
Daniel Veillarde72c5082003-09-19 12:44:05 +00003048 * xmlTextReaderConstPrefix:
3049 * @reader: the xmlTextReaderPtr used
3050 *
3051 * A shorthand reference to the namespace associated with the node.
3052 *
3053 * Returns the prefix or NULL if not available, the string is deallocated
3054 * with the reader.
3055 */
3056const xmlChar *
3057xmlTextReaderConstPrefix(xmlTextReaderPtr reader) {
3058 xmlNodePtr node;
3059 if ((reader == NULL) || (reader->node == NULL))
3060 return(NULL);
3061 if (reader->curnode != NULL)
3062 node = reader->curnode;
3063 else
3064 node = reader->node;
3065 if (node->type == XML_NAMESPACE_DECL) {
3066 xmlNsPtr ns = (xmlNsPtr) node;
3067 if (ns->prefix == NULL)
3068 return(NULL);
3069 return(CONSTSTR(BAD_CAST "xmlns"));
3070 }
3071 if ((node->type != XML_ELEMENT_NODE) &&
3072 (node->type != XML_ATTRIBUTE_NODE))
3073 return(NULL);
3074 if ((node->ns != NULL) && (node->ns->prefix != NULL))
3075 return(CONSTSTR(node->ns->prefix));
3076 return(NULL);
3077}
3078
3079/**
Daniel Veillarde1ca5032002-12-09 14:13:43 +00003080 * xmlTextReaderNamespaceUri:
3081 * @reader: the xmlTextReaderPtr used
3082 *
3083 * The URI defining the namespace associated with the node.
3084 *
3085 * Returns the namespace URI or NULL if not available
3086 */
3087xmlChar *
3088xmlTextReaderNamespaceUri(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00003089 xmlNodePtr node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00003090 if ((reader == NULL) || (reader->node == NULL))
3091 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00003092 if (reader->curnode != NULL)
3093 node = reader->curnode;
3094 else
3095 node = reader->node;
Daniel Veillardecaba492002-12-30 10:55:29 +00003096 if (node->type == XML_NAMESPACE_DECL)
3097 return(xmlStrdup(BAD_CAST "http://www.w3.org/2000/xmlns/"));
Daniel Veillardda46d2d2002-12-15 23:36:49 +00003098 if ((node->type != XML_ELEMENT_NODE) &&
3099 (node->type != XML_ATTRIBUTE_NODE))
Daniel Veillarde1ca5032002-12-09 14:13:43 +00003100 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00003101 if (node->ns != NULL)
3102 return(xmlStrdup(node->ns->href));
Daniel Veillarde1ca5032002-12-09 14:13:43 +00003103 return(NULL);
3104}
3105
3106/**
Daniel Veillarde72c5082003-09-19 12:44:05 +00003107 * xmlTextReaderConstNamespaceUri:
3108 * @reader: the xmlTextReaderPtr used
3109 *
3110 * The URI defining the namespace associated with the node.
3111 *
3112 * Returns the namespace URI or NULL if not available, the string
3113 * will be deallocated with the reader
3114 */
3115const xmlChar *
3116xmlTextReaderConstNamespaceUri(xmlTextReaderPtr reader) {
3117 xmlNodePtr node;
3118 if ((reader == NULL) || (reader->node == NULL))
3119 return(NULL);
3120 if (reader->curnode != NULL)
3121 node = reader->curnode;
3122 else
3123 node = reader->node;
3124 if (node->type == XML_NAMESPACE_DECL)
3125 return(CONSTSTR(BAD_CAST "http://www.w3.org/2000/xmlns/"));
3126 if ((node->type != XML_ELEMENT_NODE) &&
3127 (node->type != XML_ATTRIBUTE_NODE))
3128 return(NULL);
3129 if (node->ns != NULL)
3130 return(CONSTSTR(node->ns->href));
3131 return(NULL);
3132}
3133
3134/**
Daniel Veillarde1ca5032002-12-09 14:13:43 +00003135 * xmlTextReaderBaseUri:
3136 * @reader: the xmlTextReaderPtr used
3137 *
3138 * The base URI of the node.
3139 *
3140 * Returns the base URI or NULL if not available
3141 */
3142xmlChar *
3143xmlTextReaderBaseUri(xmlTextReaderPtr reader) {
3144 if ((reader == NULL) || (reader->node == NULL))
3145 return(NULL);
3146 return(xmlNodeGetBase(NULL, reader->node));
3147}
3148
3149/**
Daniel Veillarde72c5082003-09-19 12:44:05 +00003150 * xmlTextReaderConstBaseUri:
3151 * @reader: the xmlTextReaderPtr used
3152 *
3153 * The base URI of the node.
3154 *
3155 * Returns the base URI or NULL if not available, the string
3156 * will be deallocated with the reader
3157 */
3158const xmlChar *
3159xmlTextReaderConstBaseUri(xmlTextReaderPtr reader) {
3160 xmlChar *tmp;
3161 const xmlChar *ret;
3162
3163 if ((reader == NULL) || (reader->node == NULL))
3164 return(NULL);
3165 tmp = xmlNodeGetBase(NULL, reader->node);
3166 if (tmp == NULL)
3167 return(NULL);
3168 ret = CONSTSTR(tmp);
3169 xmlFree(tmp);
3170 return(ret);
3171}
3172
3173/**
Daniel Veillarde1ca5032002-12-09 14:13:43 +00003174 * xmlTextReaderDepth:
3175 * @reader: the xmlTextReaderPtr used
3176 *
3177 * The depth of the node in the tree.
3178 *
3179 * Returns the depth or -1 in case of error
3180 */
3181int
3182xmlTextReaderDepth(xmlTextReaderPtr reader) {
3183 if (reader == NULL)
3184 return(-1);
3185 if (reader->node == NULL)
3186 return(0);
3187
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00003188 if (reader->curnode != NULL) {
3189 if ((reader->curnode->type == XML_ATTRIBUTE_NODE) ||
3190 (reader->curnode->type == XML_NAMESPACE_DECL))
3191 return(reader->depth + 1);
3192 return(reader->depth + 2);
3193 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +00003194 return(reader->depth);
3195}
3196
3197/**
3198 * xmlTextReaderHasAttributes:
3199 * @reader: the xmlTextReaderPtr used
3200 *
3201 * Whether the node has attributes.
3202 *
3203 * Returns 1 if true, 0 if false, and -1 in case or error
3204 */
3205int
3206xmlTextReaderHasAttributes(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00003207 xmlNodePtr node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00003208 if (reader == NULL)
3209 return(-1);
3210 if (reader->node == NULL)
3211 return(0);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00003212 if (reader->curnode != NULL)
3213 node = reader->curnode;
3214 else
3215 node = reader->node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00003216
Daniel Veillardda46d2d2002-12-15 23:36:49 +00003217 if ((node->type == XML_ELEMENT_NODE) &&
Daniel Veillard6bb3e862004-11-24 12:39:00 +00003218 ((node->properties != NULL) || (node->nsDef != NULL)))
Daniel Veillarde1ca5032002-12-09 14:13:43 +00003219 return(1);
3220 /* TODO: handle the xmlDecl */
3221 return(0);
3222}
3223
3224/**
3225 * xmlTextReaderHasValue:
3226 * @reader: the xmlTextReaderPtr used
3227 *
3228 * Whether the node can have a text value.
3229 *
3230 * Returns 1 if true, 0 if false, and -1 in case or error
3231 */
3232int
3233xmlTextReaderHasValue(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00003234 xmlNodePtr node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00003235 if (reader == NULL)
3236 return(-1);
3237 if (reader->node == NULL)
3238 return(0);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00003239 if (reader->curnode != NULL)
3240 node = reader->curnode;
3241 else
3242 node = reader->node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00003243
Daniel Veillardda46d2d2002-12-15 23:36:49 +00003244 switch (node->type) {
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00003245 case XML_ATTRIBUTE_NODE:
3246 case XML_TEXT_NODE:
3247 case XML_CDATA_SECTION_NODE:
3248 case XML_PI_NODE:
3249 case XML_COMMENT_NODE:
Daniel Veillard9e077102003-04-10 13:36:54 +00003250 case XML_NAMESPACE_DECL:
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00003251 return(1);
3252 default:
Daniel Veillard2cfd9df2003-03-22 22:39:16 +00003253 break;
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00003254 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +00003255 return(0);
3256}
3257
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00003258/**
3259 * xmlTextReaderValue:
3260 * @reader: the xmlTextReaderPtr used
3261 *
3262 * Provides the text value of the node if present
3263 *
Daniel Veillard198c1bf2003-10-20 17:07:41 +00003264 * Returns the string or NULL if not available. The result must be deallocated
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00003265 * with xmlFree()
Daniel Veillarde1ca5032002-12-09 14:13:43 +00003266 */
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00003267xmlChar *
3268xmlTextReaderValue(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00003269 xmlNodePtr node;
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00003270 if (reader == NULL)
3271 return(NULL);
3272 if (reader->node == NULL)
3273 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00003274 if (reader->curnode != NULL)
3275 node = reader->curnode;
3276 else
3277 node = reader->node;
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00003278
Daniel Veillardda46d2d2002-12-15 23:36:49 +00003279 switch (node->type) {
3280 case XML_NAMESPACE_DECL:
3281 return(xmlStrdup(((xmlNsPtr) node)->href));
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00003282 case XML_ATTRIBUTE_NODE:{
Daniel Veillardda46d2d2002-12-15 23:36:49 +00003283 xmlAttrPtr attr = (xmlAttrPtr) node;
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00003284
3285 if (attr->parent != NULL)
3286 return (xmlNodeListGetString
3287 (attr->parent->doc, attr->children, 1));
3288 else
3289 return (xmlNodeListGetString(NULL, attr->children, 1));
3290 break;
3291 }
3292 case XML_TEXT_NODE:
3293 case XML_CDATA_SECTION_NODE:
3294 case XML_PI_NODE:
3295 case XML_COMMENT_NODE:
Daniel Veillardda46d2d2002-12-15 23:36:49 +00003296 if (node->content != NULL)
3297 return (xmlStrdup(node->content));
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00003298 default:
Daniel Veillard2cfd9df2003-03-22 22:39:16 +00003299 break;
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00003300 }
3301 return(NULL);
3302}
3303
3304/**
Daniel Veillard198c1bf2003-10-20 17:07:41 +00003305 * xmlTextReaderConstValue:
3306 * @reader: the xmlTextReaderPtr used
3307 *
3308 * Provides the text value of the node if present
3309 *
3310 * Returns the string or NULL if not available. The result will be
3311 * deallocated on the next Read() operation.
3312 */
3313const xmlChar *
3314xmlTextReaderConstValue(xmlTextReaderPtr reader) {
3315 xmlNodePtr node;
3316 if (reader == NULL)
3317 return(NULL);
3318 if (reader->node == NULL)
3319 return(NULL);
3320 if (reader->curnode != NULL)
3321 node = reader->curnode;
3322 else
3323 node = reader->node;
3324
3325 switch (node->type) {
3326 case XML_NAMESPACE_DECL:
3327 return(((xmlNsPtr) node)->href);
3328 case XML_ATTRIBUTE_NODE:{
3329 xmlAttrPtr attr = (xmlAttrPtr) node;
3330
3331 if ((attr->children != NULL) &&
3332 (attr->children->type == XML_TEXT_NODE) &&
3333 (attr->children->next == NULL))
3334 return(attr->children->content);
3335 else {
Daniel Veillard8165a6b2004-07-01 11:20:33 +00003336 if (reader->buffer == NULL)
3337 reader->buffer = xmlBufferCreateSize(100);
3338 if (reader->buffer == NULL) {
3339 xmlGenericError(xmlGenericErrorContext,
3340 "xmlTextReaderSetup : malloc failed\n");
3341 return (NULL);
3342 }
Daniel Veillard198c1bf2003-10-20 17:07:41 +00003343 reader->buffer->use = 0;
3344 xmlNodeBufGetContent(reader->buffer, node);
3345 return(reader->buffer->content);
3346 }
3347 break;
3348 }
3349 case XML_TEXT_NODE:
3350 case XML_CDATA_SECTION_NODE:
3351 case XML_PI_NODE:
3352 case XML_COMMENT_NODE:
3353 return(node->content);
3354 default:
3355 break;
3356 }
3357 return(NULL);
3358}
3359
3360/**
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00003361 * xmlTextReaderIsDefault:
3362 * @reader: the xmlTextReaderPtr used
3363 *
3364 * Whether an Attribute node was generated from the default value
3365 * defined in the DTD or schema.
3366 *
3367 * Returns 0 if not defaulted, 1 if defaulted, and -1 in case of error
3368 */
3369int
3370xmlTextReaderIsDefault(xmlTextReaderPtr reader) {
3371 if (reader == NULL)
3372 return(-1);
3373 return(0);
3374}
3375
3376/**
3377 * xmlTextReaderQuoteChar:
3378 * @reader: the xmlTextReaderPtr used
3379 *
3380 * The quotation mark character used to enclose the value of an attribute.
3381 *
3382 * Returns " or ' and -1 in case of error
3383 */
3384int
3385xmlTextReaderQuoteChar(xmlTextReaderPtr reader) {
3386 if (reader == NULL)
3387 return(-1);
3388 /* TODO maybe lookup the attribute value for " first */
3389 return((int) '"');
3390}
Daniel Veillarde1ca5032002-12-09 14:13:43 +00003391
3392/**
3393 * xmlTextReaderXmlLang:
3394 * @reader: the xmlTextReaderPtr used
3395 *
3396 * The xml:lang scope within which the node resides.
3397 *
3398 * Returns the xml:lang value or NULL if none exists.
3399 */
3400xmlChar *
3401xmlTextReaderXmlLang(xmlTextReaderPtr reader) {
3402 if (reader == NULL)
3403 return(NULL);
3404 if (reader->node == NULL)
3405 return(NULL);
3406 return(xmlNodeGetLang(reader->node));
3407}
3408
Daniel Veillard67df8092002-12-16 22:04:11 +00003409/**
Daniel Veillard7a02cfe2003-09-25 12:18:34 +00003410 * xmlTextReaderConstXmlLang:
Daniel Veillarde72c5082003-09-19 12:44:05 +00003411 * @reader: the xmlTextReaderPtr used
3412 *
3413 * The xml:lang scope within which the node resides.
3414 *
3415 * Returns the xml:lang value or NULL if none exists.
3416 */
3417const xmlChar *
3418xmlTextReaderConstXmlLang(xmlTextReaderPtr reader) {
3419 xmlChar *tmp;
3420 const xmlChar *ret;
3421
3422 if (reader == NULL)
3423 return(NULL);
3424 if (reader->node == NULL)
3425 return(NULL);
3426 tmp = xmlNodeGetLang(reader->node);
3427 if (tmp == NULL)
3428 return(NULL);
3429 ret = CONSTSTR(tmp);
3430 xmlFree(tmp);
3431 return(ret);
3432}
3433
3434/**
Daniel Veillardf85ce8e2003-09-22 10:24:45 +00003435 * xmlTextReaderConstString:
3436 * @reader: the xmlTextReaderPtr used
3437 * @str: the string to intern.
3438 *
3439 * Get an interned string from the reader, allows for example to
3440 * speedup string name comparisons
3441 *
3442 * Returns an interned copy of the string or NULL in case of error. The
3443 * string will be deallocated with the reader.
3444 */
3445const xmlChar *
3446xmlTextReaderConstString(xmlTextReaderPtr reader, const xmlChar *str) {
3447 if (reader == NULL)
3448 return(NULL);
3449 return(CONSTSTR(str));
3450}
3451
3452/**
Daniel Veillard67df8092002-12-16 22:04:11 +00003453 * xmlTextReaderNormalization:
3454 * @reader: the xmlTextReaderPtr used
3455 *
3456 * The value indicating whether to normalize white space and attribute values.
3457 * Since attribute value and end of line normalizations are a MUST in the XML
3458 * specification only the value true is accepted. The broken bahaviour of
3459 * accepting out of range character entities like &#0; is of course not
3460 * supported either.
3461 *
3462 * Returns 1 or -1 in case of error.
3463 */
3464int
3465xmlTextReaderNormalization(xmlTextReaderPtr reader) {
3466 if (reader == NULL)
3467 return(-1);
3468 return(1);
3469}
3470
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00003471/************************************************************************
3472 * *
3473 * Extensions to the base APIs *
3474 * *
3475 ************************************************************************/
3476
3477/**
3478 * xmlTextReaderSetParserProp:
3479 * @reader: the xmlTextReaderPtr used
3480 * @prop: the xmlParserProperties to set
3481 * @value: usually 0 or 1 to (de)activate it
3482 *
3483 * Change the parser processing behaviour by changing some of its internal
3484 * properties. Note that some properties can only be changed before any
3485 * read has been done.
3486 *
3487 * Returns 0 if the call was successful, or -1 in case of error
3488 */
3489int
3490xmlTextReaderSetParserProp(xmlTextReaderPtr reader, int prop, int value) {
3491 xmlParserProperties p = (xmlParserProperties) prop;
3492 xmlParserCtxtPtr ctxt;
3493
3494 if ((reader == NULL) || (reader->ctxt == NULL))
3495 return(-1);
3496 ctxt = reader->ctxt;
3497
3498 switch (p) {
3499 case XML_PARSER_LOADDTD:
3500 if (value != 0) {
3501 if (ctxt->loadsubset == 0) {
3502 if (reader->mode != XML_TEXTREADER_MODE_INITIAL)
3503 return(-1);
3504 ctxt->loadsubset = XML_DETECT_IDS;
3505 }
3506 } else {
3507 ctxt->loadsubset = 0;
3508 }
3509 return(0);
3510 case XML_PARSER_DEFAULTATTRS:
3511 if (value != 0) {
3512 ctxt->loadsubset |= XML_COMPLETE_ATTRS;
3513 } else {
3514 if (ctxt->loadsubset & XML_COMPLETE_ATTRS)
3515 ctxt->loadsubset -= XML_COMPLETE_ATTRS;
3516 }
3517 return(0);
3518 case XML_PARSER_VALIDATE:
3519 if (value != 0) {
3520 ctxt->validate = 1;
Daniel Veillardf4e55762003-04-15 23:32:22 +00003521 reader->validate = XML_TEXTREADER_VALIDATE_DTD;
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00003522 } else {
3523 ctxt->validate = 0;
3524 }
3525 return(0);
Daniel Veillarde18fc182002-12-28 22:56:33 +00003526 case XML_PARSER_SUBST_ENTITIES:
3527 if (value != 0) {
3528 ctxt->replaceEntities = 1;
3529 } else {
3530 ctxt->replaceEntities = 0;
3531 }
3532 return(0);
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00003533 }
3534 return(-1);
3535}
3536
3537/**
3538 * xmlTextReaderGetParserProp:
3539 * @reader: the xmlTextReaderPtr used
3540 * @prop: the xmlParserProperties to get
3541 *
3542 * Read the parser internal property.
3543 *
3544 * Returns the value, usually 0 or 1, or -1 in case of error.
3545 */
3546int
3547xmlTextReaderGetParserProp(xmlTextReaderPtr reader, int prop) {
3548 xmlParserProperties p = (xmlParserProperties) prop;
3549 xmlParserCtxtPtr ctxt;
3550
3551 if ((reader == NULL) || (reader->ctxt == NULL))
3552 return(-1);
3553 ctxt = reader->ctxt;
3554
3555 switch (p) {
3556 case XML_PARSER_LOADDTD:
3557 if ((ctxt->loadsubset != 0) || (ctxt->validate != 0))
3558 return(1);
3559 return(0);
3560 case XML_PARSER_DEFAULTATTRS:
3561 if (ctxt->loadsubset & XML_COMPLETE_ATTRS)
3562 return(1);
3563 return(0);
3564 case XML_PARSER_VALIDATE:
Daniel Veillardf4e55762003-04-15 23:32:22 +00003565 return(reader->validate);
Daniel Veillarde18fc182002-12-28 22:56:33 +00003566 case XML_PARSER_SUBST_ENTITIES:
3567 return(ctxt->replaceEntities);
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00003568 }
3569 return(-1);
3570}
3571
Daniel Veillarde18fc182002-12-28 22:56:33 +00003572/**
Aleksey Sanind671e282005-01-03 21:58:59 +00003573 * xmlTextReaderGetParserLineNumber:
3574 * @ctx: the user data (XML reader context)
3575 *
3576 * Provide the line number of the current parsing point.
3577 *
3578 * Returns an int
3579 */
3580int
3581xmlTextReaderGetParserLineNumber(xmlTextReaderPtr reader)
3582{
3583 if ((reader == NULL) || (reader->ctxt == NULL) || (reader->ctxt->input == NULL)) {
3584 return(0);
3585 }
3586 return(reader->ctxt->input->line);
3587}
3588
3589/**
3590 * xmlTextReaderGetParserColumnNumber:
3591 * @ctx: the user data (XML reader context)
3592 *
3593 * Provide the column number of the current parsing point.
3594 *
3595 * Returns an int
3596 */
3597int
3598xmlTextReaderGetParserColumnNumber(xmlTextReaderPtr reader)
3599{
3600 if ((reader == NULL) || (reader->ctxt == NULL) || (reader->ctxt->input == NULL)) {
3601 return(0);
3602 }
3603 return(reader->ctxt->input->col);
3604}
3605
3606/**
Daniel Veillarde18fc182002-12-28 22:56:33 +00003607 * xmlTextReaderCurrentNode:
3608 * @reader: the xmlTextReaderPtr used
3609 *
3610 * Hacking interface allowing to get the xmlNodePtr correponding to the
3611 * current node being accessed by the xmlTextReader. This is dangerous
3612 * because the underlying node may be destroyed on the next Reads.
3613 *
3614 * Returns the xmlNodePtr or NULL in case of error.
3615 */
3616xmlNodePtr
3617xmlTextReaderCurrentNode(xmlTextReaderPtr reader) {
3618 if (reader == NULL)
3619 return(NULL);
3620
3621 if (reader->curnode != NULL)
3622 return(reader->curnode);
3623 return(reader->node);
3624}
3625
3626/**
Daniel Veillard9ee35f32003-09-28 00:19:54 +00003627 * xmlTextReaderPreserve:
3628 * @reader: the xmlTextReaderPtr used
3629 *
Daniel Veillard4a14fb82004-06-14 19:58:20 +00003630 * This tells the XML Reader to preserve the current node.
3631 * The caller must also use xmlTextReaderCurrentDoc() to
3632 * keep an handle on the resulting document once parsing has finished
Daniel Veillard9ee35f32003-09-28 00:19:54 +00003633 *
3634 * Returns the xmlNodePtr or NULL in case of error.
3635 */
3636xmlNodePtr
3637xmlTextReaderPreserve(xmlTextReaderPtr reader) {
3638 xmlNodePtr cur, parent;
3639
3640 if (reader == NULL)
3641 return(NULL);
3642
3643 if (reader->curnode != NULL)
3644 cur = reader->curnode;
3645 else
3646 cur = reader->node;
3647 if (cur == NULL)
3648 return(NULL);
Daniel Veillard1e906612003-12-05 14:57:46 +00003649
Daniel Veillard4a14fb82004-06-14 19:58:20 +00003650 if ((cur->type != XML_DOCUMENT_NODE) && (cur->type != XML_DTD_NODE)) {
Daniel Veillard1e906612003-12-05 14:57:46 +00003651 cur->extra |= NODE_IS_PRESERVED;
3652 cur->extra |= NODE_IS_SPRESERVED;
3653 }
3654 reader->preserves++;
Daniel Veillard9ee35f32003-09-28 00:19:54 +00003655
3656 parent = cur->parent;;
3657 while (parent != NULL) {
Daniel Veillard1e906612003-12-05 14:57:46 +00003658 if (parent->type == XML_ELEMENT_NODE)
3659 parent->extra |= NODE_IS_PRESERVED;
Daniel Veillard9ee35f32003-09-28 00:19:54 +00003660 parent = parent->parent;
3661 }
3662 return(cur);
3663}
3664
Daniel Veillard1e906612003-12-05 14:57:46 +00003665#ifdef LIBXML_PATTERN_ENABLED
3666/**
3667 * xmlTextReaderPreservePattern:
3668 * @reader: the xmlTextReaderPtr used
3669 * @pattern: an XPath subset pattern
Daniel Veillardffa7b7e2003-12-05 16:10:21 +00003670 * @namespaces: the prefix definitions, array of [URI, prefix] or NULL
Daniel Veillard1e906612003-12-05 14:57:46 +00003671 *
3672 * This tells the XML Reader to preserve all nodes matched by the
3673 * pattern. The caller must also use xmlTextReaderCurrentDoc() to
3674 * keep an handle on the resulting document once parsing has finished
3675 *
3676 * Returns a positive number in case of success and -1 in case of error
3677 */
3678int
Daniel Veillardffa7b7e2003-12-05 16:10:21 +00003679xmlTextReaderPreservePattern(xmlTextReaderPtr reader, const xmlChar *pattern,
3680 const xmlChar **namespaces)
3681{
Daniel Veillard1e906612003-12-05 14:57:46 +00003682 xmlPatternPtr comp;
3683
3684 if ((reader == NULL) || (pattern == NULL))
3685 return(-1);
3686
Daniel Veillardffa7b7e2003-12-05 16:10:21 +00003687 comp = xmlPatterncompile(pattern, reader->dict, 0, namespaces);
Daniel Veillard1e906612003-12-05 14:57:46 +00003688 if (comp == NULL)
3689 return(-1);
3690
3691 if (reader->patternMax <= 0) {
3692 reader->patternMax = 4;
3693 reader->patternTab = (xmlPatternPtr *) xmlMalloc(reader->patternMax *
3694 sizeof(reader->patternTab[0]));
3695 if (reader->patternTab == NULL) {
3696 xmlGenericError(xmlGenericErrorContext, "xmlMalloc failed !\n");
3697 return (-1);
3698 }
3699 }
3700 if (reader->patternNr >= reader->patternMax) {
3701 xmlPatternPtr *tmp;
3702 reader->patternMax *= 2;
3703 tmp = (xmlPatternPtr *) xmlRealloc(reader->patternTab,
3704 reader->patternMax *
3705 sizeof(reader->patternTab[0]));
3706 if (tmp == NULL) {
3707 xmlGenericError(xmlGenericErrorContext, "xmlRealloc failed !\n");
3708 reader->patternMax /= 2;
3709 return (-1);
3710 }
3711 reader->patternTab = tmp;
3712 }
3713 reader->patternTab[reader->patternNr] = comp;
3714 return(reader->patternNr++);
3715}
3716#endif
3717
Daniel Veillard9ee35f32003-09-28 00:19:54 +00003718/**
Daniel Veillarde18fc182002-12-28 22:56:33 +00003719 * xmlTextReaderCurrentDoc:
3720 * @reader: the xmlTextReaderPtr used
3721 *
3722 * Hacking interface allowing to get the xmlDocPtr correponding to the
Daniel Veillard9ee35f32003-09-28 00:19:54 +00003723 * current document being accessed by the xmlTextReader.
3724 * NOTE: as a result of this call, the reader will not destroy the
3725 * associated XML document and calling xmlFreeDoc() on the result
3726 * is needed once the reader parsing has finished.
Daniel Veillarde18fc182002-12-28 22:56:33 +00003727 *
3728 * Returns the xmlDocPtr or NULL in case of error.
3729 */
3730xmlDocPtr
3731xmlTextReaderCurrentDoc(xmlTextReaderPtr reader) {
Daniel Veillard198c1bf2003-10-20 17:07:41 +00003732 if (reader == NULL)
3733 return(NULL);
3734 if (reader->doc != NULL)
3735 return(reader->doc);
Daniel Veillard9ee35f32003-09-28 00:19:54 +00003736 if ((reader == NULL) || (reader->ctxt == NULL) ||
3737 (reader->ctxt->myDoc == NULL))
Daniel Veillarde18fc182002-12-28 22:56:33 +00003738 return(NULL);
3739
Daniel Veillard9ee35f32003-09-28 00:19:54 +00003740 reader->preserve = 1;
Daniel Veillarde18fc182002-12-28 22:56:33 +00003741 return(reader->ctxt->myDoc);
3742}
3743
Daniel Veillard37fc84d2003-05-09 19:38:15 +00003744#ifdef LIBXML_SCHEMAS_ENABLED
Daniel Veillardf4e55762003-04-15 23:32:22 +00003745/**
Daniel Veillard33300b42003-04-17 09:09:19 +00003746 * xmlTextReaderRelaxNGSetSchema:
3747 * @reader: the xmlTextReaderPtr used
3748 * @schema: a precompiled RelaxNG schema
3749 *
3750 * Use RelaxNG to validate the document as it is processed.
3751 * Activation is only possible before the first Read().
3752 * if @schema is NULL, then RelaxNG validation is desactivated.
3753 @ The @schema should not be freed until the reader is deallocated
3754 * or its use has been deactivated.
3755 *
3756 * Returns 0 in case the RelaxNG validation could be (des)activated and
3757 * -1 in case of error.
3758 */
3759int
3760xmlTextReaderRelaxNGSetSchema(xmlTextReaderPtr reader, xmlRelaxNGPtr schema) {
Daniel Veillardce682bc2004-11-05 17:22:25 +00003761 if (reader == NULL)
3762 return(-1);
Daniel Veillard33300b42003-04-17 09:09:19 +00003763 if (schema == NULL) {
3764 if (reader->rngSchemas != NULL) {
3765 xmlRelaxNGFree(reader->rngSchemas);
3766 reader->rngSchemas = NULL;
3767 }
3768 if (reader->rngValidCtxt != NULL) {
3769 xmlRelaxNGFreeValidCtxt(reader->rngValidCtxt);
3770 reader->rngValidCtxt = NULL;
3771 }
3772 return(0);
3773 }
3774 if (reader->mode != XML_TEXTREADER_MODE_INITIAL)
3775 return(-1);
3776 if (reader->rngSchemas != NULL) {
3777 xmlRelaxNGFree(reader->rngSchemas);
3778 reader->rngSchemas = NULL;
3779 }
3780 if (reader->rngValidCtxt != NULL) {
3781 xmlRelaxNGFreeValidCtxt(reader->rngValidCtxt);
3782 reader->rngValidCtxt = NULL;
3783 }
3784 reader->rngValidCtxt = xmlRelaxNGNewValidCtxt(schema);
3785 if (reader->rngValidCtxt == NULL)
3786 return(-1);
3787 if (reader->errorFunc != NULL) {
3788 xmlRelaxNGSetValidErrors(reader->rngValidCtxt,
3789 (xmlRelaxNGValidityErrorFunc)reader->errorFunc,
3790 (xmlRelaxNGValidityWarningFunc) reader->errorFunc,
3791 reader->errorFuncArg);
3792 }
3793 reader->rngValidErrors = 0;
3794 reader->rngFullNode = NULL;
3795 reader->validate = XML_TEXTREADER_VALIDATE_RNG;
3796 return(0);
3797}
3798
3799/**
Daniel Veillardf4e55762003-04-15 23:32:22 +00003800 * xmlTextReaderRelaxNGValidate:
3801 * @reader: the xmlTextReaderPtr used
3802 * @rng: the path to a RelaxNG schema or NULL
3803 *
3804 * Use RelaxNG to validate the document as it is processed.
3805 * Activation is only possible before the first Read().
3806 * if @rng is NULL, then RelaxNG validation is desactivated.
3807 *
3808 * Returns 0 in case the RelaxNG validation could be (des)activated and
3809 * -1 in case of error.
3810 */
3811int
3812xmlTextReaderRelaxNGValidate(xmlTextReaderPtr reader, const char *rng) {
3813 xmlRelaxNGParserCtxtPtr ctxt;
3814
3815 if (reader == NULL)
3816 return(-1);
3817
3818 if (rng == NULL) {
3819 if (reader->rngSchemas != NULL) {
3820 xmlRelaxNGFree(reader->rngSchemas);
3821 reader->rngSchemas = NULL;
3822 }
3823 if (reader->rngValidCtxt != NULL) {
3824 xmlRelaxNGFreeValidCtxt(reader->rngValidCtxt);
3825 reader->rngValidCtxt = NULL;
3826 }
3827 return(0);
3828 }
3829 if (reader->mode != XML_TEXTREADER_MODE_INITIAL)
3830 return(-1);
Daniel Veillard33300b42003-04-17 09:09:19 +00003831 if (reader->rngSchemas != NULL) {
3832 xmlRelaxNGFree(reader->rngSchemas);
3833 reader->rngSchemas = NULL;
3834 }
3835 if (reader->rngValidCtxt != NULL) {
3836 xmlRelaxNGFreeValidCtxt(reader->rngValidCtxt);
3837 reader->rngValidCtxt = NULL;
3838 }
Daniel Veillardf4e55762003-04-15 23:32:22 +00003839 ctxt = xmlRelaxNGNewParserCtxt(rng);
3840 if (reader->errorFunc != NULL) {
3841 xmlRelaxNGSetParserErrors(ctxt,
3842 (xmlRelaxNGValidityErrorFunc) reader->errorFunc,
3843 (xmlRelaxNGValidityWarningFunc) reader->errorFunc,
3844 reader->errorFuncArg);
3845 }
3846 reader->rngSchemas = xmlRelaxNGParse(ctxt);
3847 xmlRelaxNGFreeParserCtxt(ctxt);
3848 if (reader->rngSchemas == NULL)
3849 return(-1);
3850 reader->rngValidCtxt = xmlRelaxNGNewValidCtxt(reader->rngSchemas);
3851 if (reader->rngValidCtxt == NULL)
3852 return(-1);
3853 if (reader->errorFunc != NULL) {
3854 xmlRelaxNGSetValidErrors(reader->rngValidCtxt,
3855 (xmlRelaxNGValidityErrorFunc)reader->errorFunc,
3856 (xmlRelaxNGValidityWarningFunc) reader->errorFunc,
3857 reader->errorFuncArg);
3858 }
3859 reader->rngValidErrors = 0;
3860 reader->rngFullNode = NULL;
3861 reader->validate = XML_TEXTREADER_VALIDATE_RNG;
3862 return(0);
3863}
Daniel Veillard37fc84d2003-05-09 19:38:15 +00003864#endif
Daniel Veillardf4e55762003-04-15 23:32:22 +00003865
Daniel Veillarde2811272004-10-19 09:04:23 +00003866/**
3867 * xmlTextReaderIsNamespaceDecl:
3868 * @reader: the xmlTextReaderPtr used
3869 *
3870 * Determine whether the current node is a namespace declaration
3871 * rather than a regular attribute.
3872 *
3873 * Returns 1 if the current node is a namespace declaration, 0 if it
3874 * is a regular attribute or other type of node, or -1 in case of
3875 * error.
3876 */
3877int
3878xmlTextReaderIsNamespaceDecl(xmlTextReaderPtr reader) {
3879 xmlNodePtr node;
3880 if (reader == NULL)
3881 return(-1);
3882 if (reader->node == NULL)
3883 return(-1);
3884 if (reader->curnode != NULL)
3885 node = reader->curnode;
3886 else
3887 node = reader->node;
3888
3889 if (XML_NAMESPACE_DECL == node->type)
3890 return(1);
3891 else
3892 return(0);
3893}
3894
3895/**
3896 * xmlTextReaderConstXmlVersion:
3897 * @reader: the xmlTextReaderPtr used
3898 *
3899 * Determine the XML version of the document being read.
3900 *
3901 * Returns a string containing the XML version of the document or NULL
3902 * in case of error. The string is deallocated with the reader.
3903 */
3904const xmlChar *
3905xmlTextReaderConstXmlVersion(xmlTextReaderPtr reader) {
3906 xmlDocPtr doc = NULL;
3907 if (reader == NULL)
3908 return(NULL);
3909 if (reader->doc != NULL)
3910 doc = reader->doc;
3911 else if (reader->ctxt != NULL)
3912 doc = reader->ctxt->myDoc;
3913 if (doc == NULL)
3914 return(NULL);
3915
3916 if (doc->version == NULL)
3917 return(NULL);
3918 else
3919 return(CONSTSTR(doc->version));
3920}
3921
3922/**
3923 * xmlTextReaderStandalone:
3924 * @reader: the xmlTextReaderPtr used
3925 *
3926 * Determine the standalone status of the document being read.
3927 *
3928 * Returns 1 if the document was declared to be standalone, 0 if it
3929 * was declared to be not standalone, or -1 if the document did not
3930 * specify its standalone status or in case of error.
3931 */
3932int
3933xmlTextReaderStandalone(xmlTextReaderPtr reader) {
3934 xmlDocPtr doc = NULL;
3935 if (reader == NULL)
3936 return(-1);
3937 if (reader->doc != NULL)
3938 doc = reader->doc;
3939 else if (reader->ctxt != NULL)
3940 doc = reader->ctxt->myDoc;
3941 if (doc == NULL)
3942 return(-1);
3943
3944 return(doc->standalone);
3945}
3946
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00003947/************************************************************************
3948 * *
Daniel Veillard26f70262003-01-16 22:45:08 +00003949 * Error Handling Extensions *
3950 * *
3951 ************************************************************************/
3952
3953/* helper to build a xmlMalloc'ed string from a format and va_list */
3954static char *
3955xmlTextReaderBuildMessage(const char *msg, va_list ap) {
3956 int size;
3957 int chars;
3958 char *larger;
3959 char *str;
3960
Daniel Veillard3c908dc2003-04-19 00:07:51 +00003961 str = (char *) xmlMallocAtomic(150);
Daniel Veillard26f70262003-01-16 22:45:08 +00003962 if (str == NULL) {
3963 xmlGenericError(xmlGenericErrorContext, "xmlMalloc failed !\n");
3964 return NULL;
3965 }
3966
3967 size = 150;
3968
3969 while (1) {
3970 chars = vsnprintf(str, size, msg, ap);
3971 if ((chars > -1) && (chars < size))
3972 break;
3973 if (chars > -1)
3974 size += chars + 1;
3975 else
3976 size += 100;
3977 if ((larger = (char *) xmlRealloc(str, size)) == NULL) {
3978 xmlGenericError(xmlGenericErrorContext, "xmlRealloc failed !\n");
3979 xmlFree(str);
3980 return NULL;
3981 }
3982 str = larger;
3983 }
3984
3985 return str;
3986}
3987
Daniel Veillard417be3a2003-01-20 21:26:34 +00003988/**
Daniel Veillard540a31a2003-01-21 11:21:07 +00003989 * xmlTextReaderLocatorLineNumber:
Daniel Veillard417be3a2003-01-20 21:26:34 +00003990 * @locator: the xmlTextReaderLocatorPtr used
3991 *
3992 * Obtain the line number for the given locator.
3993 *
3994 * Returns the line number or -1 in case of error.
3995 */
3996int
3997xmlTextReaderLocatorLineNumber(xmlTextReaderLocatorPtr locator) {
3998 /* we know that locator is a xmlParserCtxtPtr */
3999 xmlParserCtxtPtr ctx = (xmlParserCtxtPtr)locator;
4000 int ret = -1;
4001
Daniel Veillardce682bc2004-11-05 17:22:25 +00004002 if (locator == NULL)
4003 return(-1);
Daniel Veillard417be3a2003-01-20 21:26:34 +00004004 if (ctx->node != NULL) {
4005 ret = xmlGetLineNo(ctx->node);
4006 }
4007 else {
4008 /* inspired from error.c */
4009 xmlParserInputPtr input;
4010 input = ctx->input;
4011 if ((input->filename == NULL) && (ctx->inputNr > 1))
4012 input = ctx->inputTab[ctx->inputNr - 2];
4013 if (input != NULL) {
4014 ret = input->line;
4015 }
4016 else {
4017 ret = -1;
4018 }
4019 }
4020
4021 return ret;
4022}
4023
4024/**
Daniel Veillard540a31a2003-01-21 11:21:07 +00004025 * xmlTextReaderLocatorBaseURI:
Daniel Veillard417be3a2003-01-20 21:26:34 +00004026 * @locator: the xmlTextReaderLocatorPtr used
4027 *
4028 * Obtain the base URI for the given locator.
4029 *
4030 * Returns the base URI or NULL in case of error.
4031 */
4032xmlChar *
4033xmlTextReaderLocatorBaseURI(xmlTextReaderLocatorPtr locator) {
4034 /* we know that locator is a xmlParserCtxtPtr */
4035 xmlParserCtxtPtr ctx = (xmlParserCtxtPtr)locator;
4036 xmlChar *ret = NULL;
4037
Daniel Veillardce682bc2004-11-05 17:22:25 +00004038 if (locator == NULL)
4039 return(NULL);
Daniel Veillard417be3a2003-01-20 21:26:34 +00004040 if (ctx->node != NULL) {
4041 ret = xmlNodeGetBase(NULL,ctx->node);
4042 }
4043 else {
4044 /* inspired from error.c */
4045 xmlParserInputPtr input;
4046 input = ctx->input;
4047 if ((input->filename == NULL) && (ctx->inputNr > 1))
4048 input = ctx->inputTab[ctx->inputNr - 2];
4049 if (input != NULL) {
Daniel Veillard580ced82003-03-21 21:22:48 +00004050 ret = xmlStrdup(BAD_CAST input->filename);
Daniel Veillard417be3a2003-01-20 21:26:34 +00004051 }
4052 else {
4053 ret = NULL;
4054 }
4055 }
4056
4057 return ret;
4058}
4059
Daniel Veillard26f70262003-01-16 22:45:08 +00004060static void
William M. Brack899e64a2003-09-26 18:03:42 +00004061xmlTextReaderGenericError(void *ctxt, xmlParserSeverities severity, char *str) {
Daniel Veillard26f70262003-01-16 22:45:08 +00004062 xmlParserCtxtPtr ctx = (xmlParserCtxtPtr)ctxt;
4063 xmlTextReaderPtr reader = (xmlTextReaderPtr)ctx->_private;
4064
William M. Bracka3215c72004-07-31 16:24:01 +00004065 if (str != NULL) {
4066 if (reader->errorFunc)
Daniel Veillard26f70262003-01-16 22:45:08 +00004067 reader->errorFunc(reader->errorFuncArg,
4068 str,
Daniel Veillard417be3a2003-01-20 21:26:34 +00004069 severity,
4070 (xmlTextReaderLocatorPtr)ctx);
Daniel Veillard26f70262003-01-16 22:45:08 +00004071 xmlFree(str);
4072 }
4073}
4074
4075static void
William M. Brack93d004f2004-02-03 00:14:10 +00004076xmlTextReaderStructuredError(void *ctxt, xmlErrorPtr error) {
4077 xmlParserCtxtPtr ctx = (xmlParserCtxtPtr) ctxt;
4078 xmlTextReaderPtr reader = (xmlTextReaderPtr) ctx->_private;
4079
4080 if (error && reader->sErrorFunc) {
4081 reader->sErrorFunc(reader->errorFuncArg,
4082 (xmlErrorPtr) error);
4083 }
4084}
4085
4086static void
Daniel Veillard26f70262003-01-16 22:45:08 +00004087xmlTextReaderError(void *ctxt, const char *msg, ...) {
4088 va_list ap;
4089
4090 va_start(ap,msg);
4091 xmlTextReaderGenericError(ctxt,
Daniel Veillard417be3a2003-01-20 21:26:34 +00004092 XML_PARSER_SEVERITY_ERROR,
Daniel Veillard26f70262003-01-16 22:45:08 +00004093 xmlTextReaderBuildMessage(msg,ap));
4094 va_end(ap);
4095
4096}
4097
4098static void
4099xmlTextReaderWarning(void *ctxt, const char *msg, ...) {
4100 va_list ap;
4101
4102 va_start(ap,msg);
4103 xmlTextReaderGenericError(ctxt,
Daniel Veillard417be3a2003-01-20 21:26:34 +00004104 XML_PARSER_SEVERITY_WARNING,
Daniel Veillard26f70262003-01-16 22:45:08 +00004105 xmlTextReaderBuildMessage(msg,ap));
4106 va_end(ap);
4107}
4108
4109static void
4110xmlTextReaderValidityError(void *ctxt, const char *msg, ...) {
4111 va_list ap;
Daniel Veillard417be3a2003-01-20 21:26:34 +00004112 int len = xmlStrlen((const xmlChar *) msg);
Daniel Veillard26f70262003-01-16 22:45:08 +00004113
Daniel Veillard417be3a2003-01-20 21:26:34 +00004114 if ((len > 1) && (msg[len - 2] != ':')) {
4115 /*
4116 * some callbacks only report locator information:
4117 * skip them (mimicking behaviour in error.c)
4118 */
4119 va_start(ap,msg);
4120 xmlTextReaderGenericError(ctxt,
4121 XML_PARSER_SEVERITY_VALIDITY_ERROR,
4122 xmlTextReaderBuildMessage(msg,ap));
4123 va_end(ap);
4124 }
Daniel Veillard26f70262003-01-16 22:45:08 +00004125}
4126
4127static void
4128xmlTextReaderValidityWarning(void *ctxt, const char *msg, ...) {
4129 va_list ap;
Daniel Veillard417be3a2003-01-20 21:26:34 +00004130 int len = xmlStrlen((const xmlChar *) msg);
Daniel Veillard26f70262003-01-16 22:45:08 +00004131
Daniel Veillard417be3a2003-01-20 21:26:34 +00004132 if ((len != 0) && (msg[len - 1] != ':')) {
4133 /*
4134 * some callbacks only report locator information:
4135 * skip them (mimicking behaviour in error.c)
4136 */
4137 va_start(ap,msg);
4138 xmlTextReaderGenericError(ctxt,
4139 XML_PARSER_SEVERITY_VALIDITY_WARNING,
4140 xmlTextReaderBuildMessage(msg,ap));
4141 va_end(ap);
4142 }
Daniel Veillard26f70262003-01-16 22:45:08 +00004143}
4144
4145/**
4146 * xmlTextReaderSetErrorHandler:
4147 * @reader: the xmlTextReaderPtr used
4148 * @f: the callback function to call on error and warnings
4149 * @arg: a user argument to pass to the callback function
4150 *
Daniel Veillard417be3a2003-01-20 21:26:34 +00004151 * Register a callback function that will be called on error and warnings.
4152 *
Daniel Veillard26f70262003-01-16 22:45:08 +00004153 * If @f is NULL, the default error and warning handlers are restored.
4154 */
4155void
4156xmlTextReaderSetErrorHandler(xmlTextReaderPtr reader,
4157 xmlTextReaderErrorFunc f,
Daniel Veillard417be3a2003-01-20 21:26:34 +00004158 void *arg) {
Daniel Veillard26f70262003-01-16 22:45:08 +00004159 if (f != NULL) {
4160 reader->ctxt->sax->error = xmlTextReaderError;
William M. Brack93d004f2004-02-03 00:14:10 +00004161 reader->ctxt->sax->serror = NULL;
Daniel Veillard26f70262003-01-16 22:45:08 +00004162 reader->ctxt->vctxt.error = xmlTextReaderValidityError;
4163 reader->ctxt->sax->warning = xmlTextReaderWarning;
4164 reader->ctxt->vctxt.warning = xmlTextReaderValidityWarning;
4165 reader->errorFunc = f;
William M. Brack9f797ab2004-07-28 07:40:12 +00004166 reader->sErrorFunc = NULL;
Daniel Veillard26f70262003-01-16 22:45:08 +00004167 reader->errorFuncArg = arg;
4168 }
4169 else {
4170 /* restore defaults */
4171 reader->ctxt->sax->error = xmlParserError;
4172 reader->ctxt->vctxt.error = xmlParserValidityError;
4173 reader->ctxt->sax->warning = xmlParserWarning;
4174 reader->ctxt->vctxt.warning = xmlParserValidityWarning;
4175 reader->errorFunc = NULL;
William M. Brack93d004f2004-02-03 00:14:10 +00004176 reader->sErrorFunc = NULL;
Daniel Veillard26f70262003-01-16 22:45:08 +00004177 reader->errorFuncArg = NULL;
4178 }
4179}
4180
Daniel Veillard417be3a2003-01-20 21:26:34 +00004181/**
William M. Brack93d004f2004-02-03 00:14:10 +00004182* xmlTextReaderSetStructuredErrorHandler:
4183 * @reader: the xmlTextReaderPtr used
4184 * @f: the callback function to call on error and warnings
4185 * @arg: a user argument to pass to the callback function
4186 *
4187 * Register a callback function that will be called on error and warnings.
4188 *
4189 * If @f is NULL, the default error and warning handlers are restored.
4190 */
4191void
4192xmlTextReaderSetStructuredErrorHandler(xmlTextReaderPtr reader,
4193 xmlStructuredErrorFunc f,
4194 void *arg) {
4195 if (f != NULL) {
William M. Brack9f797ab2004-07-28 07:40:12 +00004196 reader->ctxt->sax->error = NULL;
William M. Brack93d004f2004-02-03 00:14:10 +00004197 reader->ctxt->sax->serror = xmlTextReaderStructuredError;
4198 reader->ctxt->vctxt.error = xmlTextReaderValidityError;
4199 reader->ctxt->sax->warning = xmlTextReaderWarning;
4200 reader->ctxt->vctxt.warning = xmlTextReaderValidityWarning;
4201 reader->sErrorFunc = f;
4202 reader->errorFunc = NULL;
4203 reader->errorFuncArg = arg;
4204 }
4205 else {
4206 /* restore defaults */
4207 reader->ctxt->sax->error = xmlParserError;
4208 reader->ctxt->sax->serror = NULL;
4209 reader->ctxt->vctxt.error = xmlParserValidityError;
4210 reader->ctxt->sax->warning = xmlParserWarning;
4211 reader->ctxt->vctxt.warning = xmlParserValidityWarning;
4212 reader->errorFunc = NULL;
4213 reader->sErrorFunc = NULL;
4214 reader->errorFuncArg = NULL;
4215 }
4216}
4217
4218/**
Daniel Veillardf6bad792003-04-11 19:38:54 +00004219 * xmlTextReaderIsValid:
4220 * @reader: the xmlTextReaderPtr used
4221 *
4222 * Retrieve the validity status from the parser context
4223 *
4224 * Returns the flag value 1 if valid, 0 if no, and -1 in case of error
4225 */
4226int
4227xmlTextReaderIsValid(xmlTextReaderPtr reader) {
Daniel Veillardf4e55762003-04-15 23:32:22 +00004228 if (reader == NULL) return(-1);
4229#ifdef LIBXML_SCHEMAS_ENABLED
4230 if (reader->validate == XML_TEXTREADER_VALIDATE_RNG)
4231 return(reader->rngValidErrors == 0);
4232#endif
Daniel Veillard16ed5972003-11-20 18:22:31 +00004233 if ((reader->ctxt != NULL) && (reader->ctxt->validate == 1))
Daniel Veillardf4e55762003-04-15 23:32:22 +00004234 return(reader->ctxt->valid);
4235 return(0);
Daniel Veillardf6bad792003-04-11 19:38:54 +00004236}
4237
4238/**
Daniel Veillard417be3a2003-01-20 21:26:34 +00004239 * xmlTextReaderGetErrorHandler:
4240 * @reader: the xmlTextReaderPtr used
4241 * @f: the callback function or NULL is no callback has been registered
4242 * @arg: a user argument
4243 *
4244 * Retrieve the error callback function and user argument.
4245 */
Daniel Veillard26f70262003-01-16 22:45:08 +00004246void
4247xmlTextReaderGetErrorHandler(xmlTextReaderPtr reader,
4248 xmlTextReaderErrorFunc *f,
Daniel Veillard417be3a2003-01-20 21:26:34 +00004249 void **arg) {
Daniel Veillardd5cc0f72004-11-06 19:24:28 +00004250 if (f != NULL) *f = reader->errorFunc;
4251 if (arg != NULL) *arg = reader->errorFuncArg;
Daniel Veillard26f70262003-01-16 22:45:08 +00004252}
4253
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004254
4255/************************************************************************
4256 * *
4257 * New set (2.6.0) of simpler and more flexible APIs *
4258 * *
4259 ************************************************************************/
4260
4261/**
4262 * xmlTextReaderSetup:
4263 * @reader: an XML reader
4264 * @URL: the base URL to use for the document
4265 * @encoding: the document encoding, or NULL
Daniel Veillard87ab1c12003-12-21 13:01:56 +00004266 * @options: a combination of xmlParserOption
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004267 * @reuse: keep the context for reuse
4268 *
4269 * Setup an XML reader with new options
4270 *
4271 * Returns 0 in case of success and -1 in case of error.
4272 */
4273static int
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004274xmlTextReaderSetup(xmlTextReaderPtr reader,
4275 xmlParserInputBufferPtr input, const char *URL,
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004276 const char *encoding, int options)
4277{
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004278 if (reader == NULL)
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004279 return (-1);
4280
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004281 reader->doc = NULL;
4282 reader->entNr = 0;
Daniel Veillarde74d2e12003-12-09 11:35:37 +00004283 reader->parserFlags = options;
Daniel Veillardc36965d2003-12-02 10:28:48 +00004284 reader->validate = XML_TEXTREADER_NOT_VALIDATE;
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004285 if ((input != NULL) && (reader->input != NULL) &&
4286 (reader->allocs & XML_TEXTREADER_INPUT)) {
4287 xmlFreeParserInputBuffer(reader->input);
4288 reader->input = NULL;
4289 reader->allocs -= XML_TEXTREADER_INPUT;
4290 }
4291 if (input != NULL) {
4292 reader->input = input;
4293 reader->allocs |= XML_TEXTREADER_INPUT;
4294 }
4295 if (reader->buffer == NULL)
4296 reader->buffer = xmlBufferCreateSize(100);
4297 if (reader->buffer == NULL) {
4298 xmlGenericError(xmlGenericErrorContext,
4299 "xmlTextReaderSetup : malloc failed\n");
4300 return (-1);
4301 }
4302 if (reader->sax == NULL)
4303 reader->sax = (xmlSAXHandler *) xmlMalloc(sizeof(xmlSAXHandler));
4304 if (reader->sax == NULL) {
4305 xmlGenericError(xmlGenericErrorContext,
4306 "xmlTextReaderSetup : malloc failed\n");
4307 return (-1);
4308 }
4309 xmlSAXVersion(reader->sax, 2);
4310 reader->startElement = reader->sax->startElement;
4311 reader->sax->startElement = xmlTextReaderStartElement;
4312 reader->endElement = reader->sax->endElement;
4313 reader->sax->endElement = xmlTextReaderEndElement;
4314#ifdef LIBXML_SAX1_ENABLED
4315 if (reader->sax->initialized == XML_SAX2_MAGIC) {
4316#endif /* LIBXML_SAX1_ENABLED */
4317 reader->startElementNs = reader->sax->startElementNs;
4318 reader->sax->startElementNs = xmlTextReaderStartElementNs;
4319 reader->endElementNs = reader->sax->endElementNs;
4320 reader->sax->endElementNs = xmlTextReaderEndElementNs;
4321#ifdef LIBXML_SAX1_ENABLED
4322 } else {
4323 reader->startElementNs = NULL;
4324 reader->endElementNs = NULL;
4325 }
4326#endif /* LIBXML_SAX1_ENABLED */
4327 reader->characters = reader->sax->characters;
4328 reader->sax->characters = xmlTextReaderCharacters;
4329 reader->sax->ignorableWhitespace = xmlTextReaderCharacters;
4330 reader->cdataBlock = reader->sax->cdataBlock;
4331 reader->sax->cdataBlock = xmlTextReaderCDataBlock;
4332
4333 reader->mode = XML_TEXTREADER_MODE_INITIAL;
4334 reader->node = NULL;
4335 reader->curnode = NULL;
4336 if (input != NULL) {
4337 if (reader->input->buffer->use < 4) {
4338 xmlParserInputBufferRead(input, 4);
4339 }
4340 if (reader->ctxt == NULL) {
4341 if (reader->input->buffer->use >= 4) {
4342 reader->ctxt = xmlCreatePushParserCtxt(reader->sax, NULL,
4343 (const char *) reader->input->buffer->content, 4, URL);
4344 reader->base = 0;
4345 reader->cur = 4;
4346 } else {
4347 reader->ctxt =
4348 xmlCreatePushParserCtxt(reader->sax, NULL, NULL, 0, URL);
4349 reader->base = 0;
4350 reader->cur = 0;
4351 }
4352 } else {
4353 xmlParserInputPtr inputStream;
4354 xmlParserInputBufferPtr buf;
4355 xmlCharEncoding enc = XML_CHAR_ENCODING_NONE;
4356
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004357 xmlCtxtReset(reader->ctxt);
4358 buf = xmlAllocParserInputBuffer(enc);
4359 if (buf == NULL) return(-1);
4360 inputStream = xmlNewInputStream(reader->ctxt);
4361 if (inputStream == NULL) {
4362 xmlFreeParserInputBuffer(buf);
4363 return(-1);
4364 }
4365
4366 if (URL == NULL)
4367 inputStream->filename = NULL;
4368 else
4369 inputStream->filename = (char *)
4370 xmlCanonicPath((const xmlChar *) URL);
4371 inputStream->buf = buf;
4372 inputStream->base = inputStream->buf->buffer->content;
4373 inputStream->cur = inputStream->buf->buffer->content;
4374 inputStream->end =
4375 &inputStream->buf->buffer->content[inputStream->buf->buffer->use];
4376
4377 inputPush(reader->ctxt, inputStream);
4378 reader->cur = 0;
4379 }
4380 if (reader->ctxt == NULL) {
4381 xmlGenericError(xmlGenericErrorContext,
4382 "xmlTextReaderSetup : malloc failed\n");
4383 return (-1);
4384 }
4385 }
4386 if (reader->dict != NULL) {
4387 if (reader->ctxt->dict != NULL) {
4388 if (reader->dict != reader->ctxt->dict) {
4389 xmlDictFree(reader->dict);
4390 reader->dict = reader->ctxt->dict;
4391 }
4392 } else {
4393 reader->ctxt->dict = reader->dict;
4394 }
4395 } else {
4396 if (reader->ctxt->dict == NULL)
4397 reader->ctxt->dict = xmlDictCreate();
4398 reader->dict = reader->ctxt->dict;
4399 }
4400 reader->ctxt->_private = reader;
4401 reader->ctxt->linenumbers = 1;
4402 reader->ctxt->dictNames = 1;
4403 /*
4404 * use the parser dictionnary to allocate all elements and attributes names
4405 */
4406 reader->ctxt->docdict = 1;
Daniel Veillard0df3bc32004-06-08 12:03:41 +00004407 reader->ctxt->parseMode = XML_PARSE_READER;
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004408
Daniel Veillard7899c5c2003-11-03 12:31:38 +00004409#ifdef LIBXML_XINCLUDE_ENABLED
4410 if (reader->xincctxt != NULL) {
4411 xmlXIncludeFreeContext(reader->xincctxt);
4412 reader->xincctxt = NULL;
4413 }
4414 if (options & XML_PARSE_XINCLUDE) {
4415 reader->xinclude = 1;
4416 reader->xinclude_name = xmlDictLookup(reader->dict, XINCLUDE_NODE, -1);
4417 options -= XML_PARSE_XINCLUDE;
4418 } else
4419 reader->xinclude = 0;
4420 reader->in_xinclude = 0;
4421#endif
Daniel Veillard1e906612003-12-05 14:57:46 +00004422#ifdef LIBXML_PATTERN_ENABLED
4423 if (reader->patternTab == NULL) {
4424 reader->patternNr = 0;
4425 reader->patternMax = 0;
4426 }
4427 while (reader->patternNr > 0) {
4428 reader->patternNr--;
4429 if (reader->patternTab[reader->patternNr] != NULL) {
4430 xmlFreePattern(reader->patternTab[reader->patternNr]);
4431 reader->patternTab[reader->patternNr] = NULL;
4432 }
4433 }
4434#endif
4435
Daniel Veillardc36965d2003-12-02 10:28:48 +00004436 if (options & XML_PARSE_DTDVALID)
4437 reader->validate = XML_TEXTREADER_VALIDATE_DTD;
4438
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004439 xmlCtxtUseOptions(reader->ctxt, options);
4440 if (encoding != NULL) {
4441 xmlCharEncodingHandlerPtr hdlr;
4442
4443 hdlr = xmlFindCharEncodingHandler(encoding);
4444 if (hdlr != NULL)
4445 xmlSwitchToEncoding(reader->ctxt, hdlr);
4446 }
4447 if ((URL != NULL) && (reader->ctxt->input != NULL) &&
4448 (reader->ctxt->input->filename == NULL))
4449 reader->ctxt->input->filename = (char *)
4450 xmlStrdup((const xmlChar *) URL);
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004451
4452 reader->doc = NULL;
4453
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004454 return (0);
4455}
4456
4457/**
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004458 * xmlReaderWalker:
4459 * @doc: a preparsed document
4460 *
4461 * Create an xmltextReader for a preparsed document.
4462 *
4463 * Returns the new reader or NULL in case of error.
4464 */
4465xmlTextReaderPtr
4466xmlReaderWalker(xmlDocPtr doc)
4467{
4468 xmlTextReaderPtr ret;
4469
4470 if (doc == NULL)
4471 return(NULL);
4472
4473 ret = xmlMalloc(sizeof(xmlTextReader));
4474 if (ret == NULL) {
4475 xmlGenericError(xmlGenericErrorContext,
4476 "xmlNewTextReader : malloc failed\n");
4477 return(NULL);
4478 }
4479 memset(ret, 0, sizeof(xmlTextReader));
4480 ret->entNr = 0;
4481 ret->input = NULL;
4482 ret->mode = XML_TEXTREADER_MODE_INITIAL;
4483 ret->node = NULL;
4484 ret->curnode = NULL;
4485 ret->base = 0;
4486 ret->cur = 0;
4487 ret->allocs = XML_TEXTREADER_CTXT;
4488 ret->doc = doc;
4489 ret->state = XML_TEXTREADER_START;
4490 ret->dict = xmlDictCreate();
4491 return(ret);
4492}
4493
4494/**
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004495 * xmlReaderForDoc:
4496 * @cur: a pointer to a zero terminated string
4497 * @URL: the base URL to use for the document
4498 * @encoding: the document encoding, or NULL
Daniel Veillard87ab1c12003-12-21 13:01:56 +00004499 * @options: a combination of xmlParserOption
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004500 *
4501 * Create an xmltextReader for an XML in-memory document.
Daniel Veillard87ab1c12003-12-21 13:01:56 +00004502 * The parsing flags @options are a combination of xmlParserOption.
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004503 *
4504 * Returns the new reader or NULL in case of error.
4505 */
4506xmlTextReaderPtr
4507xmlReaderForDoc(const xmlChar * cur, const char *URL, const char *encoding,
4508 int options)
4509{
4510 int len;
4511
4512 if (cur == NULL)
4513 return (NULL);
4514 len = xmlStrlen(cur);
4515
4516 return (xmlReaderForMemory
4517 ((const char *) cur, len, URL, encoding, options));
4518}
4519
4520/**
4521 * xmlReaderForFile:
4522 * @filename: a file or URL
4523 * @encoding: the document encoding, or NULL
Daniel Veillard87ab1c12003-12-21 13:01:56 +00004524 * @options: a combination of xmlParserOption
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004525 *
4526 * parse an XML file from the filesystem or the network.
Daniel Veillard87ab1c12003-12-21 13:01:56 +00004527 * The parsing flags @options are a combination of xmlParserOption.
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004528 *
4529 * Returns the new reader or NULL in case of error.
4530 */
4531xmlTextReaderPtr
4532xmlReaderForFile(const char *filename, const char *encoding, int options)
4533{
4534 xmlTextReaderPtr reader;
4535
4536 reader = xmlNewTextReaderFilename(filename);
4537 if (reader == NULL)
4538 return (NULL);
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004539 xmlTextReaderSetup(reader, NULL, NULL, encoding, options);
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004540 return (reader);
4541}
4542
4543/**
4544 * xmlReaderForMemory:
4545 * @buffer: a pointer to a char array
4546 * @size: the size of the array
4547 * @URL: the base URL to use for the document
4548 * @encoding: the document encoding, or NULL
Daniel Veillard87ab1c12003-12-21 13:01:56 +00004549 * @options: a combination of xmlParserOption
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004550 *
4551 * Create an xmltextReader for an XML in-memory document.
Daniel Veillard87ab1c12003-12-21 13:01:56 +00004552 * The parsing flags @options are a combination of xmlParserOption.
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004553 *
4554 * Returns the new reader or NULL in case of error.
4555 */
4556xmlTextReaderPtr
4557xmlReaderForMemory(const char *buffer, int size, const char *URL,
4558 const char *encoding, int options)
4559{
4560 xmlTextReaderPtr reader;
4561 xmlParserInputBufferPtr buf;
4562
Daniel Veillard21924522004-02-19 16:37:07 +00004563 buf = xmlParserInputBufferCreateStatic(buffer, size,
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004564 XML_CHAR_ENCODING_NONE);
4565 if (buf == NULL) {
4566 return (NULL);
4567 }
4568 reader = xmlNewTextReader(buf, URL);
4569 if (reader == NULL) {
4570 xmlFreeParserInputBuffer(buf);
4571 return (NULL);
4572 }
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004573 reader->allocs |= XML_TEXTREADER_INPUT;
4574 xmlTextReaderSetup(reader, NULL, URL, encoding, options);
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004575 return (reader);
4576}
4577
4578/**
4579 * xmlReaderForFd:
4580 * @fd: an open file descriptor
4581 * @URL: the base URL to use for the document
4582 * @encoding: the document encoding, or NULL
Daniel Veillard87ab1c12003-12-21 13:01:56 +00004583 * @options: a combination of xmlParserOption
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004584 *
4585 * Create an xmltextReader for an XML from a file descriptor.
Daniel Veillard87ab1c12003-12-21 13:01:56 +00004586 * The parsing flags @options are a combination of xmlParserOption.
Daniel Veillard4bc5f432003-12-22 18:13:12 +00004587 * NOTE that the file descriptor will not be closed when the
4588 * reader is closed or reset.
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004589 *
4590 * Returns the new reader or NULL in case of error.
4591 */
4592xmlTextReaderPtr
4593xmlReaderForFd(int fd, const char *URL, const char *encoding, int options)
4594{
4595 xmlTextReaderPtr reader;
4596 xmlParserInputBufferPtr input;
4597
4598 if (fd < 0)
4599 return (NULL);
4600
4601 input = xmlParserInputBufferCreateFd(fd, XML_CHAR_ENCODING_NONE);
4602 if (input == NULL)
4603 return (NULL);
Daniel Veillard4bc5f432003-12-22 18:13:12 +00004604 input->closecallback = NULL;
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004605 reader = xmlNewTextReader(input, URL);
4606 if (reader == NULL) {
4607 xmlFreeParserInputBuffer(input);
4608 return (NULL);
4609 }
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004610 reader->allocs |= XML_TEXTREADER_INPUT;
4611 xmlTextReaderSetup(reader, NULL, URL, encoding, options);
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004612 return (reader);
4613}
4614
4615/**
4616 * xmlReaderForIO:
4617 * @ioread: an I/O read function
4618 * @ioclose: an I/O close function
4619 * @ioctx: an I/O handler
4620 * @URL: the base URL to use for the document
4621 * @encoding: the document encoding, or NULL
Daniel Veillard87ab1c12003-12-21 13:01:56 +00004622 * @options: a combination of xmlParserOption
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004623 *
4624 * Create an xmltextReader for an XML document from I/O functions and source.
Daniel Veillard87ab1c12003-12-21 13:01:56 +00004625 * The parsing flags @options are a combination of xmlParserOption.
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004626 *
4627 * Returns the new reader or NULL in case of error.
4628 */
4629xmlTextReaderPtr
4630xmlReaderForIO(xmlInputReadCallback ioread, xmlInputCloseCallback ioclose,
4631 void *ioctx, const char *URL, const char *encoding,
4632 int options)
4633{
4634 xmlTextReaderPtr reader;
4635 xmlParserInputBufferPtr input;
4636
4637 if (ioread == NULL)
4638 return (NULL);
4639
4640 input = xmlParserInputBufferCreateIO(ioread, ioclose, ioctx,
4641 XML_CHAR_ENCODING_NONE);
4642 if (input == NULL)
4643 return (NULL);
4644 reader = xmlNewTextReader(input, URL);
4645 if (reader == NULL) {
4646 xmlFreeParserInputBuffer(input);
4647 return (NULL);
4648 }
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004649 reader->allocs |= XML_TEXTREADER_INPUT;
4650 xmlTextReaderSetup(reader, NULL, URL, encoding, options);
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004651 return (reader);
4652}
4653
4654/**
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004655 * xmlReaderNewWalker:
4656 * @reader: an XML reader
4657 * @doc: a preparsed document
4658 *
4659 * Setup an xmltextReader to parse a preparsed XML document.
4660 * This reuses the existing @reader xmlTextReader.
4661 *
4662 * Returns 0 in case of success and -1 in case of error
4663 */
4664int
4665xmlReaderNewWalker(xmlTextReaderPtr reader, xmlDocPtr doc)
4666{
4667 if (doc == NULL)
4668 return (-1);
4669 if (reader == NULL)
4670 return (-1);
4671
Daniel Veillarddd6d3002004-11-03 14:20:29 +00004672 if (reader->input != NULL) {
4673 xmlFreeParserInputBuffer(reader->input);
4674 }
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004675 if (reader->ctxt != NULL) {
4676 xmlCtxtReset(reader->ctxt);
4677 }
4678
4679 reader->entNr = 0;
4680 reader->input = NULL;
4681 reader->mode = XML_TEXTREADER_MODE_INITIAL;
4682 reader->node = NULL;
4683 reader->curnode = NULL;
4684 reader->base = 0;
4685 reader->cur = 0;
4686 reader->allocs = XML_TEXTREADER_CTXT;
4687 reader->doc = doc;
4688 reader->state = XML_TEXTREADER_START;
4689 if (reader->dict == NULL) {
4690 if ((reader->ctxt != NULL) && (reader->ctxt->dict != NULL))
4691 reader->dict = reader->ctxt->dict;
4692 else
4693 reader->dict = xmlDictCreate();
4694 }
4695 return(0);
4696}
4697
4698/**
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004699 * xmlReaderNewDoc:
4700 * @reader: an XML reader
4701 * @cur: a pointer to a zero terminated string
4702 * @URL: the base URL to use for the document
4703 * @encoding: the document encoding, or NULL
Daniel Veillard87ab1c12003-12-21 13:01:56 +00004704 * @options: a combination of xmlParserOption
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004705 *
4706 * Setup an xmltextReader to parse an XML in-memory document.
Daniel Veillard87ab1c12003-12-21 13:01:56 +00004707 * The parsing flags @options are a combination of xmlParserOption.
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004708 * This reuses the existing @reader xmlTextReader.
4709 *
4710 * Returns 0 in case of success and -1 in case of error
4711 */
4712int
4713xmlReaderNewDoc(xmlTextReaderPtr reader, const xmlChar * cur,
4714 const char *URL, const char *encoding, int options)
4715{
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004716
4717 int len;
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004718
4719 if (cur == NULL)
4720 return (-1);
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004721 if (reader == NULL)
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004722 return (-1);
4723
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004724 len = xmlStrlen(cur);
4725 return (xmlReaderNewMemory(reader, (const char *)cur, len,
4726 URL, encoding, options));
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004727}
4728
4729/**
4730 * xmlReaderNewFile:
4731 * @reader: an XML reader
4732 * @filename: a file or URL
4733 * @encoding: the document encoding, or NULL
Daniel Veillard87ab1c12003-12-21 13:01:56 +00004734 * @options: a combination of xmlParserOption
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004735 *
4736 * parse an XML file from the filesystem or the network.
Daniel Veillard87ab1c12003-12-21 13:01:56 +00004737 * The parsing flags @options are a combination of xmlParserOption.
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004738 * This reuses the existing @reader xmlTextReader.
4739 *
4740 * Returns 0 in case of success and -1 in case of error
4741 */
4742int
4743xmlReaderNewFile(xmlTextReaderPtr reader, const char *filename,
4744 const char *encoding, int options)
4745{
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004746 xmlParserInputBufferPtr input;
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004747
4748 if (filename == NULL)
4749 return (-1);
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004750 if (reader == NULL)
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004751 return (-1);
4752
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004753 input =
4754 xmlParserInputBufferCreateFilename(filename,
4755 XML_CHAR_ENCODING_NONE);
4756 if (input == NULL)
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004757 return (-1);
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004758 return (xmlTextReaderSetup(reader, input, filename, encoding, options));
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004759}
4760
4761/**
4762 * xmlReaderNewMemory:
4763 * @reader: an XML reader
4764 * @buffer: a pointer to a char array
4765 * @size: the size of the array
4766 * @URL: the base URL to use for the document
4767 * @encoding: the document encoding, or NULL
Daniel Veillard87ab1c12003-12-21 13:01:56 +00004768 * @options: a combination of xmlParserOption
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004769 *
4770 * Setup an xmltextReader to parse an XML in-memory document.
Daniel Veillard87ab1c12003-12-21 13:01:56 +00004771 * The parsing flags @options are a combination of xmlParserOption.
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004772 * This reuses the existing @reader xmlTextReader.
4773 *
4774 * Returns 0 in case of success and -1 in case of error
4775 */
4776int
4777xmlReaderNewMemory(xmlTextReaderPtr reader, const char *buffer, int size,
4778 const char *URL, const char *encoding, int options)
4779{
4780 xmlParserInputBufferPtr input;
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004781
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004782 if (reader == NULL)
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004783 return (-1);
4784 if (buffer == NULL)
4785 return (-1);
4786
Daniel Veillard21924522004-02-19 16:37:07 +00004787 input = xmlParserInputBufferCreateStatic(buffer, size,
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004788 XML_CHAR_ENCODING_NONE);
4789 if (input == NULL) {
4790 return (-1);
4791 }
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004792 return (xmlTextReaderSetup(reader, input, URL, encoding, options));
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004793}
4794
4795/**
4796 * xmlReaderNewFd:
4797 * @reader: an XML reader
4798 * @fd: an open file descriptor
4799 * @URL: the base URL to use for the document
4800 * @encoding: the document encoding, or NULL
Daniel Veillard87ab1c12003-12-21 13:01:56 +00004801 * @options: a combination of xmlParserOption
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004802 *
4803 * Setup an xmltextReader to parse an XML from a file descriptor.
Daniel Veillard4bc5f432003-12-22 18:13:12 +00004804 * NOTE that the file descriptor will not be closed when the
4805 * reader is closed or reset.
Daniel Veillard87ab1c12003-12-21 13:01:56 +00004806 * The parsing flags @options are a combination of xmlParserOption.
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004807 * This reuses the existing @reader xmlTextReader.
4808 *
4809 * Returns 0 in case of success and -1 in case of error
4810 */
4811int
4812xmlReaderNewFd(xmlTextReaderPtr reader, int fd,
4813 const char *URL, const char *encoding, int options)
4814{
4815 xmlParserInputBufferPtr input;
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004816
4817 if (fd < 0)
4818 return (-1);
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004819 if (reader == NULL)
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004820 return (-1);
4821
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004822 input = xmlParserInputBufferCreateFd(fd, XML_CHAR_ENCODING_NONE);
4823 if (input == NULL)
4824 return (-1);
Daniel Veillard4bc5f432003-12-22 18:13:12 +00004825 input->closecallback = NULL;
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004826 return (xmlTextReaderSetup(reader, input, URL, encoding, options));
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004827}
4828
4829/**
4830 * xmlReaderNewIO:
4831 * @reader: an XML reader
4832 * @ioread: an I/O read function
4833 * @ioclose: an I/O close function
4834 * @ioctx: an I/O handler
4835 * @URL: the base URL to use for the document
4836 * @encoding: the document encoding, or NULL
Daniel Veillard87ab1c12003-12-21 13:01:56 +00004837 * @options: a combination of xmlParserOption
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004838 *
4839 * Setup an xmltextReader to parse an XML document from I/O functions
4840 * and source.
Daniel Veillard87ab1c12003-12-21 13:01:56 +00004841 * The parsing flags @options are a combination of xmlParserOption.
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004842 * This reuses the existing @reader xmlTextReader.
4843 *
4844 * Returns 0 in case of success and -1 in case of error
4845 */
4846int
4847xmlReaderNewIO(xmlTextReaderPtr reader, xmlInputReadCallback ioread,
4848 xmlInputCloseCallback ioclose, void *ioctx,
4849 const char *URL, const char *encoding, int options)
4850{
4851 xmlParserInputBufferPtr input;
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004852
4853 if (ioread == NULL)
4854 return (-1);
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004855 if (reader == NULL)
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004856 return (-1);
4857
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004858 input = xmlParserInputBufferCreateIO(ioread, ioclose, ioctx,
4859 XML_CHAR_ENCODING_NONE);
4860 if (input == NULL)
4861 return (-1);
Daniel Veillard198c1bf2003-10-20 17:07:41 +00004862 return (xmlTextReaderSetup(reader, input, URL, encoding, options));
Daniel Veillardfc8dc352003-10-18 09:07:46 +00004863}
Daniel Veillard26f70262003-01-16 22:45:08 +00004864/************************************************************************
4865 * *
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00004866 * Utilities *
4867 * *
4868 ************************************************************************/
Daniel Veillard9f7eb0b2003-09-17 10:26:25 +00004869#ifdef NOT_USED_YET
/**
 * xmlBase64Decode:
 * @in:  the input buffer
 * @inlen:  the size of the input (in), the size read from it (out)
 * @to:  the output buffer
 * @tolen:  the size of the output (in), the size written to (out)
 *
 * Base64 decoder, reads from @in and save in @to
 * TODO: tell jody when this is actually exported
 *
 * Characters outside the Base64 alphabet are skipped.  On return @inlen
 * holds the number of input bytes consumed up to the last complete
 * group, so that a caller can resume from there.
 * A group is only written while strictly more than 3 bytes remain free
 * in @to.
 *
 * Returns 0 if a '=' padding character closed a partially filled group
 *         (that last group has been decoded),
 *         1 if the input was exhausted or a '=' was met on a group
 *         boundary,
 *         2 if there wasn't enough space on the output
 *         or -1 in case of error.
 */
static int
xmlBase64Decode(const unsigned char *in, unsigned long *inlen,
                unsigned char *to, unsigned long *tolen) {
    unsigned long incur;                /* current index in in[] */
    unsigned long inblk;                /* last block index in in[] */
    unsigned long outcur;               /* current index in out[] */
    unsigned long inmax;                /* size of in[] */
    unsigned long outmax;               /* size of out[] */
    unsigned char cur;                  /* the current value read from in[] */
    unsigned char intmp[4], outtmp[4];  /* temporary buffers for the convert */
    int nbintmp;                        /* number of byte in intmp[] */
    int is_ignore;                      /* cur should be ignored */
    int is_end = 0;                     /* the end of the base64 was found */
    int retval = 1;
    int i;

    if ((in == NULL) || (inlen == NULL) || (to == NULL) || (tolen == NULL))
        return(-1);

    incur = 0;
    inblk = 0;
    outcur = 0;
    inmax = *inlen;
    outmax = *tolen;
    nbintmp = 0;

    while (1) {
        if (incur >= inmax)
            break;
        cur = in[incur++];
        is_ignore = 0;
        if ((cur >= 'A') && (cur <= 'Z'))
            cur = cur - 'A';
        else if ((cur >= 'a') && (cur <= 'z'))
            cur = cur - 'a' + 26;
        else if ((cur >= '0') && (cur <= '9'))
            cur = cur - '0' + 52;
        else if (cur == '+')
            cur = 62;
        else if (cur == '/')
            cur = 63;
        else if (cur == '.')
            cur = 0;
        else if (cur == '=') /*no op , end of the base64 stream */
            is_end = 1;
        else {
            is_ignore = 1;
            /* junk between two groups counts as consumed input */
            if (nbintmp == 0)
                inblk = incur;
        }

        if (!is_ignore) {
            int nbouttmp = 3;
            int is_break = 0;

            if (is_end) {
                if (nbintmp == 0)
                    break;
                if ((nbintmp == 1) || (nbintmp == 2))
                    nbouttmp = 1;
                else
                    nbouttmp = 2;
                /*
                 * Clear the sextets that were never read for this group,
                 * otherwise stale or uninitialized values would leak into
                 * the decoded bytes.
                 */
                for (i = nbintmp; i < 3; i++)
                    intmp[i] = 0;
                nbintmp = 3;
                is_break = 1;
            }
            intmp[nbintmp++] = cur;
            /*
             * if intmp is full, push the 4byte sequence as a 3 byte
             * sequence out
             */
            if (nbintmp == 4) {
                nbintmp = 0;
                outtmp[0] = (intmp[0] << 2) | ((intmp[1] & 0x30) >> 4);
                outtmp[1] =
                    ((intmp[1] & 0x0F) << 4) | ((intmp[2] & 0x3C) >> 2);
                outtmp[2] = ((intmp[2] & 0x03) << 6) | (intmp[3] & 0x3F);
                if (outcur + 3 >= outmax) {
                    retval = 2;
                    break;
                }

                for (i = 0; i < nbouttmp; i++)
                    to[outcur++] = outtmp[i];
                inblk = incur;
            }

            if (is_break) {
                retval = 0;
                break;
            }
        }
    }

    *tolen = outcur;
    *inlen = inblk;
    return (retval);
}
4980
/*
 * Test routine for the xmlBase64Decode function.
 * Disabled by default; it decodes the same input three times: in one
 * go, with a small output window, and with a small input window.
 */
#if 0
int main(int argc, char **argv) {
    const char *input = " VW4 gcGV0 \n aXQgdGVzdCAuCg== ";
    char output[100];
    char output2[100];
    char output3[100];
    unsigned long inlen = strlen(input);
    unsigned long outlen = 100;
    int ret;
    unsigned long cons, tmp, tmp2, prod;

    /*
     * Direct
     */
    ret = xmlBase64Decode((const unsigned char *) input, &inlen,
                          (unsigned char *) output, &outlen);

    output[outlen] = 0;
    printf("ret: %d, inlen: %lu , outlen: %lu, output: '%s'\n",
           ret, inlen, outlen, output);

    /*
     * output chunking
     */
    cons = 0;
    prod = 0;
    while (cons < inlen) {
        tmp = 5;
        tmp2 = inlen - cons;

        printf("%lu %lu\n", cons, prod);
        ret = xmlBase64Decode((const unsigned char *) &input[cons], &tmp2,
                              (unsigned char *) &output2[prod], &tmp);
        cons += tmp2;
        prod += tmp;
        printf("%lu %lu\n", cons, prod);
    }
    /* terminate after what this pass actually produced */
    output2[prod] = 0;
    printf("ret: %d, cons: %lu , prod: %lu, output: '%s'\n",
           ret, cons, prod, output2);

    /*
     * input chunking
     */
    cons = 0;
    prod = 0;
    while (cons < inlen) {
        tmp = 100 - prod;
        tmp2 = inlen - cons;
        if (tmp2 > 5)
            tmp2 = 5;

        printf("%lu %lu\n", cons, prod);
        ret = xmlBase64Decode((const unsigned char *) &input[cons], &tmp2,
                              (unsigned char *) &output3[prod], &tmp);
        cons += tmp2;
        prod += tmp;
        printf("%lu %lu\n", cons, prod);
    }
    /* terminate after what this pass actually produced */
    output3[prod] = 0;
    printf("ret: %d, cons: %lu , prod: %lu, output: '%s'\n",
           ret, cons, prod, output3);
    return(0);

}
#endif
Daniel Veillard9f7eb0b2003-09-17 10:26:25 +00005044#endif /* NOT_USED_YET */
Daniel Veillard81273902003-09-30 00:43:48 +00005045#endif /* LIBXML_READER_ENABLED */