/*
 * xmlreader.c: implements the xmlTextReader streaming node API
 *
 * NOTE:
 *   XmlTextReader.Normalization Property won't be supported, since
 *   it makes the parser non compliant to the XML recommendation
 *
 * See Copyright for the status of this software.
 *
 * daniel@veillard.com
 */
12
/*
 * TODOs:
 *   - provide an API to expand part of the tree
 *   - provide an API to preserve part of the tree
 *   - Streaming XInclude support
 *   - validation against a provided DTD
 *   - XML Schemas validation
 *   - setting(s) for NoBlanks
 *   - performances and tuning ...
 */
Daniel Veillarde1ca5032002-12-09 14:13:43 +000023#define IN_LIBXML
24#include "libxml.h"
25
26#include <string.h> /* for memset() only ! */
Daniel Veillard26f70262003-01-16 22:45:08 +000027#include <stdarg.h>
Daniel Veillarde1ca5032002-12-09 14:13:43 +000028
29#ifdef HAVE_CTYPE_H
30#include <ctype.h>
31#endif
32#ifdef HAVE_STDLIB_H
33#include <stdlib.h>
34#endif
35
36#include <libxml/xmlmemory.h>
37#include <libxml/xmlIO.h>
38#include <libxml/xmlreader.h>
39
40/* #define DEBUG_CALLBACKS */
41/* #define DEBUG_READER */
42
/**
 * TODO:
 *
 * Macro flagging an unimplemented block: reports the source file and line
 * of the expansion through xmlGenericError().
 *
 * The expansion deliberately ends with its own semicolon: the call sites in
 * this file use a bare `TODO` statement without one.
 */
#define TODO                                                            \
    xmlGenericError(xmlGenericErrorContext,                             \
                    "Unimplemented block at %s:%d\n",                   \
                    __FILE__, __LINE__);
52
/*
 * DUMP_READER: dumps the state of the local variable `reader` through
 * xmlTextReaderDebug() when DEBUG_READER is defined, and expands to nothing
 * otherwise. The expansion carries its own semicolon, so it is used as a
 * bare statement.
 */
#ifdef DEBUG_READER
#define DUMP_READER xmlTextReaderDebug(reader);
#else
#define DUMP_READER
#endif
58
/************************************************************************
 *                                                                      *
 *      The parser: maps the Text Reader API on top of the existing     *
 *              parsing routines building a tree                        *
 *                                                                      *
 ************************************************************************/
65
/*
 * Bit flags naming the input buffer and the parser context.
 * NOTE(review): presumably stored in the `allocs` field of the reader to
 * record which of the two it owns -- the use is not visible here, confirm.
 */
#define XML_TEXTREADER_INPUT    1
#define XML_TEXTREADER_CTXT     2
68
/*
 * Read mode of the reader, kept in the `mode` field and reported by
 * xmlTextReaderReadState().
 */
typedef enum {
    XML_TEXTREADER_MODE_INITIAL = 0,
    XML_TEXTREADER_MODE_INTERACTIVE = 1,
    XML_TEXTREADER_MODE_ERROR = 2,
    XML_TEXTREADER_MODE_EOF = 3,
    XML_TEXTREADER_MODE_CLOSED = 4,
    XML_TEXTREADER_MODE_READING = 5
} xmlTextReaderMode;
77
/*
 * Traversal state of the reader, kept in the `state` field.
 * XML_TEXTREADER_NONE is the value xmlTextReaderPushData() installs while it
 * waits for a parser callback to change the state.
 */
typedef enum {
    XML_TEXTREADER_NONE = -1,
    XML_TEXTREADER_START = 0,
    XML_TEXTREADER_ELEMENT = 1,
    XML_TEXTREADER_END = 2,
    XML_TEXTREADER_EMPTY = 3,
    XML_TEXTREADER_BACKTRACK = 4,
    XML_TEXTREADER_DONE = 5
} xmlTextReaderState;
87
88struct _xmlTextReader {
89 int mode; /* the parsing mode */
90 int allocs; /* what structure were deallocated */
91 xmlTextReaderState state;
92 xmlParserCtxtPtr ctxt; /* the parser context */
93 xmlSAXHandlerPtr sax; /* the parser SAX callbacks */
94 xmlParserInputBufferPtr input; /* the input */
95 startElementSAXFunc startElement;/* initial SAX callbacks */
96 endElementSAXFunc endElement; /* idem */
Daniel Veillardea7751d2002-12-20 00:16:24 +000097 charactersSAXFunc characters;
98 cdataBlockSAXFunc cdataBlock;
Daniel Veillarde1ca5032002-12-09 14:13:43 +000099 unsigned int base; /* base of the segment in the input */
100 unsigned int cur; /* current position in the input */
101 xmlNodePtr node; /* current node */
Daniel Veillardda46d2d2002-12-15 23:36:49 +0000102 xmlNodePtr curnode;/* current attribute node */
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000103 int depth; /* depth of the current node */
Daniel Veillardbeb70bd2002-12-18 14:53:54 +0000104 xmlNodePtr faketext;/* fake xmlNs chld */
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000105
106 /* entity stack when traversing entities content */
107 xmlNodePtr ent; /* Current Entity Ref Node */
108 int entNr; /* Depth of the entities stack */
109 int entMax; /* Max depth of the entities stack */
110 xmlNodePtr *entTab; /* array of entities */
Daniel Veillard26f70262003-01-16 22:45:08 +0000111
112 /* error handling */
113 xmlTextReaderErrorFunc errorFunc; /* callback function */
114 void *errorFuncArg; /* callback function user argument */
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000115};
116
/*
 * Sentinel whose address is stored in a node's _private field by
 * xmlTextReaderStartElement() to mark an element written as <a/>; only the
 * pointer value is compared, the text itself is never read.
 */
static const char *xmlTextReaderIsEmpty = "This element is empty";
118
#ifdef DEBUG_READER
/**
 * xmlTextReaderDebug:
 * @reader:  the xmlTextReaderPtr to dump, may be NULL
 *
 * Debugging helper, only compiled when DEBUG_READER is defined. Prints the
 * reader state, depth, current node name, input positions and, when
 * LIBXML_DEBUG_ENABLED is set, the pending input on stderr.
 */
static void
xmlTextReaderDebug(xmlTextReaderPtr reader) {
    if ((reader == NULL) || (reader->ctxt == NULL)) {
        fprintf(stderr, "xmlTextReader NULL\n");
        return;
    }
    fprintf(stderr, "xmlTextReader: state %d depth %d ",
            (int) reader->state, reader->depth);
    if (reader->node == NULL) {
        fprintf(stderr, "node = NULL\n");
    } else {
        fprintf(stderr, "node %s\n", (const char *) reader->node->name);
    }
    /* base and cur are unsigned int, hence %u */
    fprintf(stderr, " input: base %u, cur %u, depth %d: ",
            reader->base, reader->cur, reader->ctxt->nodeNr);
    if ((reader->input == NULL) || (reader->input->buffer == NULL)) {
        fprintf(stderr, "buffer is NULL\n");
    } else {
#ifdef LIBXML_DEBUG_ENABLED
        xmlDebugDumpString(stderr,
                &reader->input->buffer->content[reader->cur]);
#endif
        fprintf(stderr, "\n");
    }
}
#endif
146
147/**
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000148 * xmlTextReaderEntPush:
149 * @reader: the xmlTextReaderPtr used
150 * @value: the entity reference node
151 *
152 * Pushes a new entity reference node on top of the entities stack
153 *
154 * Returns 0 in case of error, the index in the stack otherwise
155 */
156static int
157xmlTextReaderEntPush(xmlTextReaderPtr reader, xmlNodePtr value)
158{
159 if (reader->entMax <= 0) {
160 reader->entMax = 10;
161 reader->entTab = (xmlNodePtr *) xmlMalloc(reader->entMax *
162 sizeof(reader->entTab[0]));
163 if (reader->entTab == NULL) {
164 xmlGenericError(xmlGenericErrorContext, "xmlMalloc failed !\n");
165 return (0);
166 }
167 }
168 if (reader->entNr >= reader->entMax) {
169 reader->entMax *= 2;
170 reader->entTab =
171 (xmlNodePtr *) xmlRealloc(reader->entTab,
172 reader->entMax *
173 sizeof(reader->entTab[0]));
174 if (reader->entTab == NULL) {
175 xmlGenericError(xmlGenericErrorContext, "xmlRealloc failed !\n");
176 return (0);
177 }
178 }
179 reader->entTab[reader->entNr] = value;
180 reader->ent = value;
181 return (reader->entNr++);
182}
183
184/**
185 * xmlTextReaderEntPop:
186 * @reader: the xmlTextReaderPtr used
187 *
188 * Pops the top element entity from the entities stack
189 *
190 * Returns the entity just removed
191 */
192static xmlNodePtr
193xmlTextReaderEntPop(xmlTextReaderPtr reader)
194{
195 xmlNodePtr ret;
196
197 if (reader->entNr <= 0)
198 return (0);
199 reader->entNr--;
200 if (reader->entNr > 0)
201 reader->ent = reader->entTab[reader->entNr - 1];
202 else
203 reader->ent = NULL;
204 ret = reader->entTab[reader->entNr];
205 reader->entTab[reader->entNr] = 0;
206 return (ret);
207}
208
209/**
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000210 * xmlTextReaderStartElement:
211 * @ctx: the user data (XML parser context)
212 * @fullname: The element name, including namespace prefix
213 * @atts: An array of name/value attributes pairs, NULL terminated
214 *
215 * called when an opening tag has been processed.
216 */
217static void
218xmlTextReaderStartElement(void *ctx, const xmlChar *fullname,
219 const xmlChar **atts) {
220 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
Daniel Veillardd5896142002-12-31 14:45:26 +0000221 xmlParserCtxtPtr origctxt;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000222 xmlTextReaderPtr reader = ctxt->_private;
223
224#ifdef DEBUG_CALLBACKS
225 printf("xmlTextReaderStartElement(%s)\n", fullname);
226#endif
Daniel Veillardea7751d2002-12-20 00:16:24 +0000227 if ((reader != NULL) && (reader->startElement != NULL)) {
Daniel Veillardd5896142002-12-31 14:45:26 +0000228 /*
229 * when processing an entity, the context may have been changed
230 */
231 origctxt = reader->ctxt;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000232 reader->startElement(ctx, fullname, atts);
Daniel Veillard067bae52003-01-05 01:27:54 +0000233 if ((ctxt->node != NULL) && (ctxt->input != NULL) &&
234 (ctxt->input->cur != NULL) && (ctxt->input->cur[0] == '/') &&
235 (ctxt->input->cur[1] == '>'))
236 ctxt->node->_private = (void *) xmlTextReaderIsEmpty;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000237 }
Daniel Veillard9e395c22003-01-01 14:50:44 +0000238 if (reader != NULL)
239 reader->state = XML_TEXTREADER_ELEMENT;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000240}
241
242/**
243 * xmlTextReaderEndElement:
244 * @ctx: the user data (XML parser context)
245 * @fullname: The element name, including namespace prefix
246 *
247 * called when an ending tag has been processed.
248 */
249static void
250xmlTextReaderEndElement(void *ctx, const xmlChar *fullname) {
251 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
Daniel Veillardd5896142002-12-31 14:45:26 +0000252 xmlParserCtxtPtr origctxt;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000253 xmlTextReaderPtr reader = ctxt->_private;
254
255#ifdef DEBUG_CALLBACKS
256 printf("xmlTextReaderEndElement(%s)\n", fullname);
257#endif
Daniel Veillardea7751d2002-12-20 00:16:24 +0000258 if ((reader != NULL) && (reader->endElement != NULL)) {
Daniel Veillardd5896142002-12-31 14:45:26 +0000259 /*
260 * when processing an entity, the context may have been changed
261 */
262 origctxt = reader->ctxt;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000263
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000264 reader->endElement(ctx, fullname);
Daniel Veillardea7751d2002-12-20 00:16:24 +0000265 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000266}
267
268/**
Daniel Veillardea7751d2002-12-20 00:16:24 +0000269 * xmlTextReaderCharacters:
270 * @ctx: the user data (XML parser context)
271 * @ch: a xmlChar string
272 * @len: the number of xmlChar
273 *
274 * receiving some chars from the parser.
275 */
276static void
277xmlTextReaderCharacters(void *ctx, const xmlChar *ch, int len)
278{
279 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
Daniel Veillardd5896142002-12-31 14:45:26 +0000280 xmlParserCtxtPtr origctxt;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000281 xmlTextReaderPtr reader = ctxt->_private;
282
283#ifdef DEBUG_CALLBACKS
284 printf("xmlTextReaderCharacters()\n");
285#endif
286 if ((reader != NULL) && (reader->characters != NULL)) {
287 reader->characters(ctx, ch, len);
Daniel Veillardd5896142002-12-31 14:45:26 +0000288 /*
289 * when processing an entity, the context may have been changed
290 */
291 origctxt = reader->ctxt;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000292 }
293}
294
295/**
296 * xmlTextReaderCDataBlock:
297 * @ctx: the user data (XML parser context)
298 * @value: The pcdata content
299 * @len: the block length
300 *
301 * called when a pcdata block has been parsed
302 */
303static void
304xmlTextReaderCDataBlock(void *ctx, const xmlChar *ch, int len)
305{
306 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
307 xmlTextReaderPtr reader = ctxt->_private;
308
309#ifdef DEBUG_CALLBACKS
310 printf("xmlTextReaderCDataBlock()\n");
311#endif
312 if ((reader != NULL) && (reader->cdataBlock != NULL)) {
313 reader->cdataBlock(ctx, ch, len);
Daniel Veillardea7751d2002-12-20 00:16:24 +0000314 }
315}
316
317/**
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000318 * xmlTextReaderPushData:
319 * @reader: the xmlTextReaderPtr used
320 *
321 * Push data down the progressive parser until a significant callback
322 * got raised.
323 *
324 * Returns -1 in case of failure, 0 otherwise
325 */
326static int
327xmlTextReaderPushData(xmlTextReaderPtr reader) {
328 unsigned int cur = reader->cur;
329 xmlBufferPtr inbuf;
330 int val;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000331 int oldstate;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000332
333 if ((reader->input == NULL) || (reader->input->buffer == NULL))
334 return(-1);
335
Daniel Veillardea7751d2002-12-20 00:16:24 +0000336 oldstate = reader->state;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000337 reader->state = XML_TEXTREADER_NONE;
338 inbuf = reader->input->buffer;
339 while (reader->state == XML_TEXTREADER_NONE) {
340 if (cur >= inbuf->use) {
341 /*
342 * Refill the buffer unless we are at the end of the stream
343 */
344 if (reader->mode != XML_TEXTREADER_MODE_EOF) {
345 val = xmlParserInputBufferRead(reader->input, 4096);
346 if (val <= 0) {
347 reader->mode = XML_TEXTREADER_MODE_EOF;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000348 reader->state = oldstate;
Daniel Veillardaaa105b2002-12-30 11:42:17 +0000349 if ((oldstate != XML_TEXTREADER_START) ||
350 (reader->ctxt->myDoc != NULL))
351 return(val);
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000352 }
353 } else
354 break;
355 }
Daniel Veillard067bae52003-01-05 01:27:54 +0000356 /*
357 * parse by block of 512 bytes
358 */
359 if ((cur >= reader->cur + 512) || (cur >= inbuf->use)) {
360 if (cur < inbuf->use)
361 cur = cur + 1;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000362 val = xmlParseChunk(reader->ctxt,
363 (const char *) &inbuf->content[reader->cur],
364 cur - reader->cur, 0);
365 if (val != 0)
366 return(-1);
367 reader->cur = cur;
368 break;
369 } else {
370 cur = cur + 1;
371
372 /*
373 * One may have to force a flush at some point when parsing really
374 * large CDATA sections
375 */
376 if ((cur - reader->cur > 4096) && (reader->base == 0) &&
Daniel Veillard67df8092002-12-16 22:04:11 +0000377 (reader->mode == XML_TEXTREADER_MODE_INTERACTIVE)) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000378 cur = cur + 1;
379 val = xmlParseChunk(reader->ctxt,
380 (const char *) &inbuf->content[reader->cur],
381 cur - reader->cur, 0);
382 if (val != 0)
383 return(-1);
384 reader->cur = cur;
385 }
386 }
387 }
388 /*
389 * Discard the consumed input when needed and possible
390 */
Daniel Veillard67df8092002-12-16 22:04:11 +0000391 if (reader->mode == XML_TEXTREADER_MODE_INTERACTIVE) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000392 if ((reader->cur >= 4096) && (reader->base == 0)) {
393 val = xmlBufferShrink(inbuf, cur);
394 if (val >= 0) {
395 reader->cur -= val;
396 }
397 }
398 }
399
400 /*
401 * At the end of the stream signal that the work is done to the Push
402 * parser.
403 */
Daniel Veillardea7751d2002-12-20 00:16:24 +0000404 if (reader->mode == XML_TEXTREADER_MODE_EOF) {
405 if (reader->mode != XML_TEXTREADER_DONE) {
406 val = xmlParseChunk(reader->ctxt,
Daniel Veillard067bae52003-01-05 01:27:54 +0000407 (const char *) &inbuf->content[reader->cur],
408 cur - reader->cur, 1);
409 reader->cur = cur;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000410 reader->mode = XML_TEXTREADER_DONE;
411 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000412 }
Daniel Veillardea7751d2002-12-20 00:16:24 +0000413 reader->state = oldstate;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000414 return(0);
415}
416
417/**
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000418 * xmlTextReaderValidatePush:
419 * @reader: the xmlTextReaderPtr used
420 *
421 * Push the current node for validation
422 */
423static void
424xmlTextReaderValidatePush(xmlTextReaderPtr reader) {
Daniel Veillard0e298ad2003-02-04 16:14:33 +0000425#ifdef LIBXML_REGEXP_ENABLED
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000426 xmlNodePtr node = reader->node;
427
428 if ((node->ns == NULL) || (node->ns->prefix == NULL)) {
429 reader->ctxt->valid &= xmlValidatePushElement(&reader->ctxt->vctxt,
430 reader->ctxt->myDoc, node, node->name);
431 } else {
432 xmlChar *qname;
433
434 qname = xmlStrdup(node->ns->prefix);
435 qname = xmlStrcat(qname, BAD_CAST ":");
436 qname = xmlStrcat(qname, node->name);
437 reader->ctxt->valid &= xmlValidatePushElement(&reader->ctxt->vctxt,
438 reader->ctxt->myDoc, node, qname);
439 if (qname != NULL)
440 xmlFree(qname);
441 }
Daniel Veillard0e298ad2003-02-04 16:14:33 +0000442#endif /* LIBXML_REGEXP_ENABLED */
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000443}
444/**
445 * xmlTextReaderValidatePop:
446 * @reader: the xmlTextReaderPtr used
447 *
448 * Pop the current node from validation
449 */
450static void
451xmlTextReaderValidatePop(xmlTextReaderPtr reader) {
Daniel Veillard0e298ad2003-02-04 16:14:33 +0000452#ifdef LIBXML_REGEXP_ENABLED
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000453 xmlNodePtr node = reader->node;
454
455 if ((node->ns == NULL) || (node->ns->prefix == NULL)) {
456 reader->ctxt->valid &= xmlValidatePopElement(&reader->ctxt->vctxt,
457 reader->ctxt->myDoc, node, node->name);
458 } else {
459 xmlChar *qname;
460
461 qname = xmlStrdup(node->ns->prefix);
462 qname = xmlStrcat(qname, BAD_CAST ":");
463 qname = xmlStrcat(qname, node->name);
464 reader->ctxt->valid &= xmlValidatePopElement(&reader->ctxt->vctxt,
465 reader->ctxt->myDoc, node, qname);
466 if (qname != NULL)
467 xmlFree(qname);
468 }
Daniel Veillard0e298ad2003-02-04 16:14:33 +0000469#endif /* LIBXML_REGEXP_ENABLED */
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000470}
Daniel Veillarda80ff6e2003-01-03 12:52:08 +0000471/**
472 * xmlTextReaderValidateEntity:
473 * @reader: the xmlTextReaderPtr used
474 *
475 * Handle the validation when an entity reference is encountered and
476 * entity substitution is not activated. As a result the parser interface
477 * must walk through the entity and do the validation calls
478 */
479static void
480xmlTextReaderValidateEntity(xmlTextReaderPtr reader) {
Daniel Veillard0e298ad2003-02-04 16:14:33 +0000481#ifdef LIBXML_REGEXP_ENABLED
Daniel Veillarda80ff6e2003-01-03 12:52:08 +0000482 xmlNodePtr oldnode = reader->node;
483 xmlNodePtr node = reader->node;
484 xmlParserCtxtPtr ctxt = reader->ctxt;
485
486 do {
487 if (node->type == XML_ENTITY_REF_NODE) {
488 /*
489 * Case where the underlying tree is not availble, lookup the entity
490 * and walk it.
491 */
492 if ((node->children == NULL) && (ctxt->sax != NULL) &&
493 (ctxt->sax->getEntity != NULL)) {
494 node->children = (xmlNodePtr)
495 ctxt->sax->getEntity(ctxt, node->name);
496 }
497
498 if ((node->children != NULL) &&
499 (node->children->type == XML_ENTITY_DECL) &&
500 (node->children->children != NULL)) {
501 xmlTextReaderEntPush(reader, node);
502 node = node->children->children;
503 continue;
504 } else {
505 /*
506 * The error has probably be raised already.
507 */
508 if (node == oldnode)
509 break;
510 node = node->next;
511 }
512 } else if (node->type == XML_ELEMENT_NODE) {
513 reader->node = node;
514 xmlTextReaderValidatePush(reader);
515 } else if ((node->type == XML_TEXT_NODE) ||
516 (node->type == XML_CDATA_SECTION_NODE)) {
517 ctxt->valid &= xmlValidatePushCData(&ctxt->vctxt,
518 node->content, xmlStrlen(node->content));
519 }
520
521 /*
522 * go to next node
523 */
524 if (node->children != NULL) {
525 node = node->children;
526 continue;
527 }
528 if (node->next != NULL) {
529 node = node->next;
530 continue;
531 }
532 do {
533 node = node->parent;
534 if (node->type == XML_ELEMENT_NODE) {
535 reader->node = node;
536 xmlTextReaderValidatePop(reader);
537 }
538 if ((node->type == XML_ENTITY_DECL) &&
539 (reader->ent != NULL) && (reader->ent->children == node)) {
540 node = xmlTextReaderEntPop(reader);
541 }
542 if (node == oldnode)
543 break;
544 if (node->next != NULL) {
545 node = node->next;
546 break;
547 }
548 } while ((node != NULL) && (node != oldnode));
549 } while ((node != NULL) && (node != oldnode));
550 reader->node = oldnode;
Daniel Veillard0e298ad2003-02-04 16:14:33 +0000551#endif /* LIBXML_REGEXP_ENABLED */
Daniel Veillarda80ff6e2003-01-03 12:52:08 +0000552}
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000553
554
555/**
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000556 * xmlTextReaderRead:
557 * @reader: the xmlTextReaderPtr used
558 *
559 * Moves the position of the current instance to the next node in
560 * the stream, exposing its properties.
561 *
562 * Returns 1 if the node was read successfully, 0 if there is no more
563 * nodes to read, or -1 in case of error
564 */
565int
566xmlTextReaderRead(xmlTextReaderPtr reader) {
Daniel Veillard067bae52003-01-05 01:27:54 +0000567 int val, olddepth = 0;
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000568 xmlTextReaderState oldstate = 0;
569 xmlNodePtr oldnode = NULL;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000570
571 if ((reader == NULL) || (reader->ctxt == NULL))
572 return(-1);
573 if (reader->ctxt->wellFormed != 1)
574 return(-1);
575
576#ifdef DEBUG_READER
577 fprintf(stderr, "\nREAD ");
578 DUMP_READER
579#endif
Daniel Veillard29b3e282002-12-29 11:14:41 +0000580 reader->curnode = NULL;
Daniel Veillard67df8092002-12-16 22:04:11 +0000581 if (reader->mode == XML_TEXTREADER_MODE_INITIAL) {
582 reader->mode = XML_TEXTREADER_MODE_INTERACTIVE;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000583 /*
584 * Initial state
585 */
586 do {
587 val = xmlTextReaderPushData(reader);
588 if (val < 0)
589 return(-1);
590 } while ((reader->ctxt->node == NULL) &&
Daniel Veillard067bae52003-01-05 01:27:54 +0000591 ((reader->mode != XML_TEXTREADER_MODE_EOF) &&
592 (reader->mode != XML_TEXTREADER_DONE)));
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000593 if (reader->ctxt->node == NULL) {
Daniel Veillarddab8ea92003-01-02 14:16:45 +0000594 if (reader->ctxt->myDoc != NULL) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000595 reader->node = reader->ctxt->myDoc->children;
Daniel Veillarddab8ea92003-01-02 14:16:45 +0000596 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000597 if (reader->node == NULL)
598 return(-1);
Daniel Veillarddab8ea92003-01-02 14:16:45 +0000599 reader->state = XML_TEXTREADER_ELEMENT;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000600 } else {
Daniel Veillard4d8db8a2002-12-30 18:40:42 +0000601 reader->node = reader->ctxt->nodeTab[0];
Daniel Veillarde59494f2003-01-04 16:35:29 +0000602 reader->state = XML_TEXTREADER_ELEMENT;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000603 }
Daniel Veillard4d8db8a2002-12-30 18:40:42 +0000604 reader->depth = 0;
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000605 goto node_found;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000606 }
607 oldstate = reader->state;
608 olddepth = reader->ctxt->nodeNr;
609 oldnode = reader->node;
Daniel Veillarddf512f42002-12-23 15:56:21 +0000610
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000611get_next_node:
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000612 /*
613 * If we are not backtracking on ancestors or examined nodes,
614 * that the parser didn't finished or that we arent at the end
615 * of stream, continue processing.
616 */
Daniel Veillardea7751d2002-12-20 00:16:24 +0000617 while (((oldstate == XML_TEXTREADER_BACKTRACK) ||
618 (reader->node->children == NULL) ||
619 (reader->node->type == XML_ENTITY_REF_NODE) ||
Daniel Veillard4dbe77a2003-01-14 00:17:42 +0000620 (reader->node->type == XML_DTD_NODE) ||
621 (reader->node->type == XML_DOCUMENT_NODE) ||
622 (reader->node->type == XML_HTML_DOCUMENT_NODE)) &&
Daniel Veillardea7751d2002-12-20 00:16:24 +0000623 (reader->node->next == NULL) &&
Daniel Veillard4dbe77a2003-01-14 00:17:42 +0000624 ((reader->ctxt->node == NULL) ||
625 (reader->ctxt->node == reader->node) ||
626 (reader->ctxt->node == reader->node->parent)) &&
Daniel Veillardea7751d2002-12-20 00:16:24 +0000627 (reader->ctxt->nodeNr == olddepth) &&
628 (reader->ctxt->instate != XML_PARSER_EOF)) {
629 val = xmlTextReaderPushData(reader);
630 if (val < 0)
631 return(-1);
632 if (reader->node == NULL)
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000633 goto node_end;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000634 }
Daniel Veillard120e8eb2003-03-22 01:00:34 +0000635 /*
636 * If we are in the middle of a piece of CDATA make sure it's finished
637 * Maybe calling a function checking that a non-character() callback was
638 * received would be cleaner for the loop exit.
639 */
640 if ((oldstate == XML_TEXTREADER_ELEMENT) &&
641 (reader->ctxt->instate == XML_PARSER_CDATA_SECTION)) {
642 while ((reader->ctxt->instate == XML_PARSER_CDATA_SECTION) &&
643 (((reader->node->content == NULL) &&
644 (reader->node->next != NULL) &&
645 (reader->node->next->type == XML_CDATA_SECTION_NODE) &&
646 (reader->node->next->next == NULL) &&
647 (reader->node->parent->next == NULL)) ||
648 ((reader->node->children != NULL) &&
649 (reader->node->children->type == XML_CDATA_SECTION_NODE) &&
650 (reader->node->children->next == NULL) &&
651 (reader->node->children->next == NULL)))) {
652 val = xmlTextReaderPushData(reader);
653 if (val < 0)
654 return(-1);
655 }
656 }
657 if ((oldstate == XML_TEXTREADER_ELEMENT) &&
658 (reader->ctxt->instate == XML_PARSER_CONTENT)) {
659 while ((reader->ctxt->instate == XML_PARSER_CONTENT) &&
660 (((reader->node->content == NULL) &&
661 (reader->node->next != NULL) &&
662 (reader->node->next->type == XML_TEXT_NODE) &&
663 (reader->node->next->next == NULL) &&
664 (reader->node->parent->next == NULL)) ||
665 ((reader->node->children != NULL) &&
666 (reader->node->children->type == XML_TEXT_NODE) &&
667 (reader->node->children->next == NULL) &&
668 (reader->node->children->next == NULL)))) {
669 val = xmlTextReaderPushData(reader);
670 if (val < 0)
671 return(-1);
672 }
673 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000674 if (oldstate != XML_TEXTREADER_BACKTRACK) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000675 if ((reader->node->children != NULL) &&
676 (reader->node->type != XML_ENTITY_REF_NODE) &&
677 (reader->node->type != XML_DTD_NODE)) {
678 reader->node = reader->node->children;
679 reader->depth++;
Daniel Veillarddf512f42002-12-23 15:56:21 +0000680 reader->state = XML_TEXTREADER_ELEMENT;
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000681 goto node_found;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000682 }
683 }
684 if (reader->node->next != NULL) {
685 if ((oldstate == XML_TEXTREADER_ELEMENT) &&
Daniel Veillarddf512f42002-12-23 15:56:21 +0000686 (reader->node->type == XML_ELEMENT_NODE) &&
Daniel Veillard067bae52003-01-05 01:27:54 +0000687 (reader->node->children == NULL) &&
688 (reader->node->_private != (void *)xmlTextReaderIsEmpty)) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000689 reader->state = XML_TEXTREADER_END;
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000690 goto node_found;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000691 }
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000692 if ((reader->ctxt->validate) &&
693 (reader->node->type == XML_ELEMENT_NODE))
694 xmlTextReaderValidatePop(reader);
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000695 reader->node = reader->node->next;
696 reader->state = XML_TEXTREADER_ELEMENT;
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000697
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000698 /*
699 * Cleanup of the old node
700 */
Daniel Veillard4dbe77a2003-01-14 00:17:42 +0000701 if ((reader->node->prev != NULL) &&
702 (reader->node->prev->type != XML_DTD_NODE)) {
703 xmlNodePtr tmp = reader->node->prev;
704 xmlUnlinkNode(tmp);
705 xmlFreeNode(tmp);
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000706 }
707
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000708 goto node_found;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000709 }
Daniel Veillardea7751d2002-12-20 00:16:24 +0000710 if ((oldstate == XML_TEXTREADER_ELEMENT) &&
Daniel Veillard571b8892002-12-30 12:37:59 +0000711 (reader->node->type == XML_ELEMENT_NODE) &&
Daniel Veillard067bae52003-01-05 01:27:54 +0000712 (reader->node->children == NULL) &&
713 (reader->node->_private != (void *)xmlTextReaderIsEmpty)) {
Daniel Veillardea7751d2002-12-20 00:16:24 +0000714 reader->state = XML_TEXTREADER_END;
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000715 goto node_found;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000716 }
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000717 if ((reader->ctxt->validate) && (reader->node->type == XML_ELEMENT_NODE))
718 xmlTextReaderValidatePop(reader);
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000719 reader->node = reader->node->parent;
720 if ((reader->node == NULL) ||
721 (reader->node->type == XML_DOCUMENT_NODE) ||
722#ifdef LIBXML_DOCB_ENABLED
723 (reader->node->type == XML_DOCB_DOCUMENT_NODE) ||
724#endif
725 (reader->node->type == XML_HTML_DOCUMENT_NODE)) {
Daniel Veillardea7751d2002-12-20 00:16:24 +0000726 if (reader->mode != XML_TEXTREADER_DONE) {
727 val = xmlParseChunk(reader->ctxt, "", 0, 1);
728 reader->mode = XML_TEXTREADER_DONE;
729 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000730 reader->node = NULL;
Daniel Veillard4d8db8a2002-12-30 18:40:42 +0000731 reader->depth = -1;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000732
733 /*
734 * Cleanup of the old node
735 */
736 if (oldnode->type != XML_DTD_NODE) {
737 xmlUnlinkNode(oldnode);
738 xmlFreeNode(oldnode);
739 }
740
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000741 goto node_end;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000742 }
743 reader->depth--;
744 reader->state = XML_TEXTREADER_BACKTRACK;
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000745
746node_found:
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000747 DUMP_READER
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000748
749 /*
Daniel Veillarda80ff6e2003-01-03 12:52:08 +0000750 * Handle entities enter and exit when in entity replacement mode
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000751 */
752 if ((reader->node != NULL) &&
753 (reader->node->type == XML_ENTITY_REF_NODE) &&
754 (reader->ctxt != NULL) && (reader->ctxt->replaceEntities == 1)) {
755 /*
756 * Case where the underlying tree is not availble, lookup the entity
757 * and walk it.
758 */
759 if ((reader->node->children == NULL) && (reader->ctxt->sax != NULL) &&
760 (reader->ctxt->sax->getEntity != NULL)) {
761 reader->node->children = (xmlNodePtr)
762 reader->ctxt->sax->getEntity(reader->ctxt, reader->node->name);
763 }
764
765 if ((reader->node->children != NULL) &&
766 (reader->node->children->type == XML_ENTITY_DECL) &&
767 (reader->node->children->children != NULL)) {
768 xmlTextReaderEntPush(reader, reader->node);
769 reader->node = reader->node->children->children;
770 }
Daniel Veillarda80ff6e2003-01-03 12:52:08 +0000771 } else if ((reader->node != NULL) &&
772 (reader->node->type == XML_ENTITY_REF_NODE) &&
773 (reader->ctxt != NULL) && (reader->ctxt->validate == 1)) {
774 xmlTextReaderValidateEntity(reader);
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000775 }
776 if ((reader->node != NULL) &&
777 (reader->node->type == XML_ENTITY_DECL) &&
778 (reader->ent != NULL) && (reader->ent->children == reader->node)) {
779 reader->node = xmlTextReaderEntPop(reader);
780 reader->depth++;
781 goto get_next_node;
782 }
Daniel Veillard0e298ad2003-02-04 16:14:33 +0000783#ifdef LIBXML_REGEXP_ENABLED
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000784 if ((reader->ctxt->validate) && (reader->node != NULL)) {
785 xmlNodePtr node = reader->node;
786 xmlParserCtxtPtr ctxt = reader->ctxt;
787
788 if ((node->type == XML_ELEMENT_NODE) &&
789 ((reader->state != XML_TEXTREADER_END) &&
790 (reader->state != XML_TEXTREADER_BACKTRACK))) {
791 xmlTextReaderValidatePush(reader);
792 } else if ((node->type == XML_TEXT_NODE) ||
793 (node->type == XML_CDATA_SECTION_NODE)) {
794 ctxt->valid &= xmlValidatePushCData(&ctxt->vctxt,
795 node->content, xmlStrlen(node->content));
796 }
797 }
Daniel Veillard0e298ad2003-02-04 16:14:33 +0000798#endif /* LIBXML_REGEXP_ENABLED */
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000799 return(1);
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000800node_end:
801 return(0);
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000802}
803
Daniel Veillard67df8092002-12-16 22:04:11 +0000804/**
805 * xmlTextReaderReadState:
806 * @reader: the xmlTextReaderPtr used
807 *
808 * Gets the read state of the reader.
809 *
810 * Returns the state value, or -1 in case of error
811 */
812int
813xmlTextReaderReadState(xmlTextReaderPtr reader) {
814 if (reader == NULL)
815 return(-1);
816 return(reader->mode);
817}
818
819/**
820 * xmlTextReaderReadInnerXml:
821 * @reader: the xmlTextReaderPtr used
822 *
823 * Reads the contents of the current node, including child nodes and markup.
824 *
825 * Returns a string containing the XML content, or NULL if the current node
826 * is neither an element nor attribute, or has no child nodes. The
827 * string must be deallocated by the caller.
828 */
829xmlChar *
830xmlTextReaderReadInnerXml(xmlTextReaderPtr reader) {
831 TODO
832 return(NULL);
833}
834
835/**
836 * xmlTextReaderReadOuterXml:
837 * @reader: the xmlTextReaderPtr used
838 *
839 * Reads the contents of the current node, including child nodes and markup.
840 *
841 * Returns a string containing the XML content, or NULL if the current node
842 * is neither an element nor attribute, or has no child nodes. The
843 * string must be deallocated by the caller.
844 */
845xmlChar *
846xmlTextReaderReadOuterXml(xmlTextReaderPtr reader) {
847 TODO
848 return(NULL);
849}
850
851/**
852 * xmlTextReaderReadString:
853 * @reader: the xmlTextReaderPtr used
854 *
855 * Reads the contents of an element or a text node as a string.
856 *
857 * Returns a string containing the contents of the Element or Text node,
858 * or NULL if the reader is positioned on any other type of node.
859 * The string must be deallocated by the caller.
860 */
861xmlChar *
862xmlTextReaderReadString(xmlTextReaderPtr reader) {
863 TODO
864 return(NULL);
865}
866
Daniel Veillardbeb70bd2002-12-18 14:53:54 +0000867/**
868 * xmlTextReaderReadBase64:
869 * @reader: the xmlTextReaderPtr used
870 * @array: a byte array to store the content.
871 * @offset: the zero-based index into array where the method should
872 * begin to write.
873 * @len: the number of bytes to write.
874 *
875 * Reads and decodes the Base64 encoded contents of an element and
876 * stores the result in a byte buffer.
877 *
878 * Returns the number of bytes written to array, or zero if the current
879 * instance is not positioned on an element or -1 in case of error.
880 */
881int
882xmlTextReaderReadBase64(xmlTextReaderPtr reader, unsigned char *array,
883 int offset, int len) {
884 if ((reader == NULL) || (reader->ctxt == NULL))
885 return(-1);
886 if (reader->ctxt->wellFormed != 1)
887 return(-1);
888
889 if ((reader->node == NULL) || (reader->node->type == XML_ELEMENT_NODE))
890 return(0);
891 TODO
892 return(0);
893}
894
895/**
896 * xmlTextReaderReadBinHex:
897 * @reader: the xmlTextReaderPtr used
898 * @array: a byte array to store the content.
899 * @offset: the zero-based index into array where the method should
900 * begin to write.
901 * @len: the number of bytes to write.
902 *
903 * Reads and decodes the BinHex encoded contents of an element and
904 * stores the result in a byte buffer.
905 *
906 * Returns the number of bytes written to array, or zero if the current
907 * instance is not positioned on an element or -1 in case of error.
908 */
909int
910xmlTextReaderReadBinHex(xmlTextReaderPtr reader, unsigned char *array,
911 int offset, int len) {
912 if ((reader == NULL) || (reader->ctxt == NULL))
913 return(-1);
914 if (reader->ctxt->wellFormed != 1)
915 return(-1);
916
917 if ((reader->node == NULL) || (reader->node->type == XML_ELEMENT_NODE))
918 return(0);
919 TODO
920 return(0);
921}
922
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000923/************************************************************************
924 * *
925 * Constructor and destructors *
926 * *
927 ************************************************************************/
928/**
929 * xmlNewTextReader:
930 * @input: the xmlParserInputBufferPtr used to read data
Daniel Veillardea7751d2002-12-20 00:16:24 +0000931 * @URI: the URI information for the source if available
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000932 *
933 * Create an xmlTextReader structure fed with @input
934 *
935 * Returns the new xmlTextReaderPtr or NULL in case of error
936 */
937xmlTextReaderPtr
Daniel Veillardea7751d2002-12-20 00:16:24 +0000938xmlNewTextReader(xmlParserInputBufferPtr input, const char *URI) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000939 xmlTextReaderPtr ret;
940 int val;
941
942 if (input == NULL)
943 return(NULL);
944 ret = xmlMalloc(sizeof(xmlTextReader));
945 if (ret == NULL) {
946 xmlGenericError(xmlGenericErrorContext,
947 "xmlNewTextReader : malloc failed\n");
948 return(NULL);
949 }
950 memset(ret, 0, sizeof(xmlTextReader));
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000951 ret->entTab = NULL;
952 ret->entMax = 0;
953 ret->entNr = 0;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000954 ret->input = input;
955 ret->sax = (xmlSAXHandler *) xmlMalloc(sizeof(xmlSAXHandler));
956 if (ret->sax == NULL) {
957 xmlFree(ret);
958 xmlGenericError(xmlGenericErrorContext,
959 "xmlNewTextReader : malloc failed\n");
960 return(NULL);
961 }
962 memcpy(ret->sax, &xmlDefaultSAXHandler, sizeof(xmlSAXHandler));
963 ret->startElement = ret->sax->startElement;
964 ret->sax->startElement = xmlTextReaderStartElement;
965 ret->endElement = ret->sax->endElement;
966 ret->sax->endElement = xmlTextReaderEndElement;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000967 ret->characters = ret->sax->characters;
968 ret->sax->characters = xmlTextReaderCharacters;
969 ret->cdataBlock = ret->sax->cdataBlock;
970 ret->sax->cdataBlock = xmlTextReaderCDataBlock;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000971
Daniel Veillard67df8092002-12-16 22:04:11 +0000972 ret->mode = XML_TEXTREADER_MODE_INITIAL;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000973 ret->node = NULL;
Daniel Veillardda46d2d2002-12-15 23:36:49 +0000974 ret->curnode = NULL;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000975 val = xmlParserInputBufferRead(input, 4);
976 if (val >= 4) {
977 ret->ctxt = xmlCreatePushParserCtxt(ret->sax, NULL,
Daniel Veillardea7751d2002-12-20 00:16:24 +0000978 (const char *) ret->input->buffer->content, 4, URI);
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000979 ret->base = 0;
980 ret->cur = 4;
981 } else {
Daniel Veillardea7751d2002-12-20 00:16:24 +0000982 ret->ctxt = xmlCreatePushParserCtxt(ret->sax, NULL, NULL, 0, URI);
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000983 ret->base = 0;
984 ret->cur = 0;
985 }
986 ret->ctxt->_private = ret;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000987 ret->ctxt->linenumbers = 1;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000988 ret->allocs = XML_TEXTREADER_CTXT;
989 return(ret);
990
991}
992
993/**
994 * xmlNewTextReaderFilename:
995 * @URI: the URI of the resource to process
996 *
997 * Create an xmlTextReader structure fed with the resource at @URI
998 *
999 * Returns the new xmlTextReaderPtr or NULL in case of error
1000 */
1001xmlTextReaderPtr
1002xmlNewTextReaderFilename(const char *URI) {
1003 xmlParserInputBufferPtr input;
1004 xmlTextReaderPtr ret;
Daniel Veillardea7751d2002-12-20 00:16:24 +00001005 char *directory = NULL;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001006
1007 input = xmlParserInputBufferCreateFilename(URI, XML_CHAR_ENCODING_NONE);
1008 if (input == NULL)
1009 return(NULL);
Daniel Veillardea7751d2002-12-20 00:16:24 +00001010 ret = xmlNewTextReader(input, URI);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001011 if (ret == NULL) {
1012 xmlFreeParserInputBuffer(input);
1013 return(NULL);
1014 }
1015 ret->allocs |= XML_TEXTREADER_INPUT;
Daniel Veillardea7751d2002-12-20 00:16:24 +00001016 if (ret->ctxt->directory == NULL)
1017 directory = xmlParserGetDirectory(URI);
1018 if ((ret->ctxt->directory == NULL) && (directory != NULL))
1019 ret->ctxt->directory = (char *) xmlStrdup((xmlChar *) directory);
1020 if (directory != NULL)
1021 xmlFree(directory);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001022 return(ret);
1023}
1024
1025/**
1026 * xmlFreeTextReader:
1027 * @reader: the xmlTextReaderPtr
1028 *
1029 * Deallocate all the resources associated to the reader
1030 */
1031void
1032xmlFreeTextReader(xmlTextReaderPtr reader) {
1033 if (reader == NULL)
1034 return;
1035 if (reader->ctxt != NULL) {
1036 if (reader->ctxt->myDoc != NULL) {
1037 xmlFreeDoc(reader->ctxt->myDoc);
1038 reader->ctxt->myDoc = NULL;
1039 }
Daniel Veillard336fc7d2002-12-27 19:37:04 +00001040 if ((reader->ctxt->vctxt.vstateTab != NULL) &&
1041 (reader->ctxt->vctxt.vstateMax > 0)){
1042 xmlFree(reader->ctxt->vctxt.vstateTab);
1043 reader->ctxt->vctxt.vstateTab = 0;
1044 reader->ctxt->vctxt.vstateMax = 0;
1045 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001046 if (reader->allocs & XML_TEXTREADER_CTXT)
1047 xmlFreeParserCtxt(reader->ctxt);
1048 }
1049 if (reader->sax != NULL)
1050 xmlFree(reader->sax);
1051 if ((reader->input != NULL) && (reader->allocs & XML_TEXTREADER_INPUT))
1052 xmlFreeParserInputBuffer(reader->input);
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00001053 if (reader->faketext != NULL) {
1054 xmlFreeNode(reader->faketext);
1055 }
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001056 if (reader->entTab != NULL)
1057 xmlFree(reader->entTab);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001058 xmlFree(reader);
1059}
1060
1061/************************************************************************
1062 * *
Daniel Veillard0eb38c72002-12-14 23:00:35 +00001063 * Methods for XmlTextReader *
1064 * *
1065 ************************************************************************/
1066/**
1067 * xmlTextReaderClose:
1068 * @reader: the xmlTextReaderPtr used
1069 *
1070 * This method releases any resources allocated by the current instance
1071 * changes the state to Closed and close any underlying input.
1072 *
1073 * Returns 0 or -1 in case of error
1074 */
1075int
1076xmlTextReaderClose(xmlTextReaderPtr reader) {
1077 if (reader == NULL)
1078 return(-1);
1079 reader->node = NULL;
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001080 reader->curnode = NULL;
Daniel Veillard0eb38c72002-12-14 23:00:35 +00001081 reader->mode = XML_TEXTREADER_MODE_CLOSED;
1082 if (reader->ctxt != NULL) {
1083 if (reader->ctxt->myDoc != NULL) {
1084 xmlFreeDoc(reader->ctxt->myDoc);
1085 reader->ctxt->myDoc = NULL;
1086 }
1087 if (reader->allocs & XML_TEXTREADER_CTXT) {
1088 xmlFreeParserCtxt(reader->ctxt);
1089 reader->allocs -= XML_TEXTREADER_CTXT;
1090 }
1091 }
1092 if (reader->sax != NULL) {
1093 xmlFree(reader->sax);
1094 reader->sax = NULL;
1095 }
1096 if ((reader->input != NULL) && (reader->allocs & XML_TEXTREADER_INPUT)) {
1097 xmlFreeParserInputBuffer(reader->input);
1098 reader->allocs -= XML_TEXTREADER_INPUT;
1099 }
1100 return(0);
1101}
1102
1103/**
1104 * xmlTextReaderGetAttributeNo:
1105 * @reader: the xmlTextReaderPtr used
1106 * @no: the zero-based index of the attribute relative to the containing element
1107 *
1108 * Provides the value of the attribute with the specified index relative
1109 * to the containing element.
1110 *
1111 * Returns a string containing the value of the specified attribute, or NULL
1112 * in case of error. The string must be deallocated by the caller.
1113 */
1114xmlChar *
1115xmlTextReaderGetAttributeNo(xmlTextReaderPtr reader, int no) {
1116 xmlChar *ret;
1117 int i;
1118 xmlAttrPtr cur;
1119 xmlNsPtr ns;
1120
1121 if (reader == NULL)
1122 return(NULL);
1123 if (reader->node == NULL)
1124 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001125 if (reader->curnode != NULL)
1126 return(NULL);
Daniel Veillard0eb38c72002-12-14 23:00:35 +00001127 /* TODO: handle the xmlDecl */
1128 if (reader->node->type != XML_ELEMENT_NODE)
1129 return(NULL);
1130
1131 ns = reader->node->nsDef;
1132 for (i = 0;(i < no) && (ns != NULL);i++) {
1133 ns = ns->next;
1134 }
1135 if (ns != NULL)
1136 return(xmlStrdup(ns->href));
1137
1138 cur = reader->node->properties;
1139 if (cur == NULL)
1140 return(NULL);
1141 for (;i < no;i++) {
1142 cur = cur->next;
1143 if (cur == NULL)
1144 return(NULL);
1145 }
1146 /* TODO walk the DTD if present */
1147
1148 ret = xmlNodeListGetString(reader->node->doc, cur->children, 1);
1149 if (ret == NULL) return(xmlStrdup((xmlChar *)""));
1150 return(ret);
1151}
1152
1153/**
1154 * xmlTextReaderGetAttribute:
1155 * @reader: the xmlTextReaderPtr used
1156 * @name: the qualified name of the attribute.
1157 *
1158 * Provides the value of the attribute with the specified qualified name.
1159 *
1160 * Returns a string containing the value of the specified attribute, or NULL
1161 * in case of error. The string must be deallocated by the caller.
1162 */
1163xmlChar *
1164xmlTextReaderGetAttribute(xmlTextReaderPtr reader, const xmlChar *name) {
1165 xmlChar *prefix = NULL;
1166 xmlChar *localname;
1167 xmlNsPtr ns;
1168 xmlChar *ret = NULL;
1169
1170 if ((reader == NULL) || (name == NULL))
1171 return(NULL);
1172 if (reader->node == NULL)
1173 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001174 if (reader->curnode != NULL)
1175 return(NULL);
Daniel Veillard0eb38c72002-12-14 23:00:35 +00001176
1177 /* TODO: handle the xmlDecl */
1178 if (reader->node->type != XML_ELEMENT_NODE)
1179 return(NULL);
1180
1181 localname = xmlSplitQName2(name, &prefix);
1182 if (localname == NULL)
1183 return(xmlGetProp(reader->node, name));
1184
1185 ns = xmlSearchNs(reader->node->doc, reader->node, prefix);
1186 if (ns != NULL)
1187 ret = xmlGetNsProp(reader->node, localname, ns->href);
1188
1189 if (localname != NULL)
1190 xmlFree(localname);
1191 if (prefix != NULL)
1192 xmlFree(prefix);
1193 return(ret);
1194}
1195
1196
1197/**
1198 * xmlTextReaderGetAttributeNs:
1199 * @reader: the xmlTextReaderPtr used
1200 * @localName: the local name of the attribute.
1201 * @namespaceURI: the namespace URI of the attribute.
1202 *
1203 * Provides the value of the specified attribute
1204 *
1205 * Returns a string containing the value of the specified attribute, or NULL
1206 * in case of error. The string must be deallocated by the caller.
1207 */
1208xmlChar *
1209xmlTextReaderGetAttributeNs(xmlTextReaderPtr reader, const xmlChar *localName,
1210 const xmlChar *namespaceURI) {
1211 if ((reader == NULL) || (localName == NULL))
1212 return(NULL);
1213 if (reader->node == NULL)
1214 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001215 if (reader->curnode != NULL)
1216 return(NULL);
Daniel Veillard0eb38c72002-12-14 23:00:35 +00001217
1218 /* TODO: handle the xmlDecl */
1219 if (reader->node->type != XML_ELEMENT_NODE)
1220 return(NULL);
1221
1222 return(xmlGetNsProp(reader->node, localName, namespaceURI));
1223}
1224
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001225/**
1226 * xmlTextReaderGetRemainder:
1227 * @reader: the xmlTextReaderPtr used
1228 *
1229 * Method to get the remainder of the buffered XML. this method stops the
1230 * parser, set its state to End Of File and return the input stream with
1231 * what is left that the parser did not use.
1232 *
1233 * Returns the xmlParserInputBufferPtr attached to the XML or NULL
1234 * in case of error.
1235 */
1236xmlParserInputBufferPtr
1237xmlTextReaderGetRemainder(xmlTextReaderPtr reader) {
1238 xmlParserInputBufferPtr ret = NULL;
1239
1240 if (reader == NULL)
1241 return(NULL);
1242 if (reader->node == NULL)
1243 return(NULL);
1244
1245 reader->node = NULL;
1246 reader->curnode = NULL;
1247 reader->mode = XML_TEXTREADER_MODE_EOF;
1248 if (reader->ctxt != NULL) {
1249 if (reader->ctxt->myDoc != NULL) {
1250 xmlFreeDoc(reader->ctxt->myDoc);
1251 reader->ctxt->myDoc = NULL;
1252 }
1253 if (reader->allocs & XML_TEXTREADER_CTXT) {
1254 xmlFreeParserCtxt(reader->ctxt);
1255 reader->allocs -= XML_TEXTREADER_CTXT;
1256 }
1257 }
1258 if (reader->sax != NULL) {
1259 xmlFree(reader->sax);
1260 reader->sax = NULL;
1261 }
1262 if (reader->allocs & XML_TEXTREADER_INPUT) {
1263 ret = reader->input;
1264 reader->allocs -= XML_TEXTREADER_INPUT;
1265 } else {
1266 /*
1267 * Hum, one may need to duplicate the data structure because
1268 * without reference counting the input may be freed twice:
1269 * - by the layer which allocated it.
1270 * - by the layer to which would have been returned to.
1271 */
1272 TODO
1273 return(NULL);
1274 }
1275 return(ret);
1276}
1277
1278/**
1279 * xmlTextReaderLookupNamespace:
1280 * @reader: the xmlTextReaderPtr used
1281 * @prefix: the prefix whose namespace URI is to be resolved. To return
1282 * the default namespace, specify NULL
1283 *
1284 * Resolves a namespace prefix in the scope of the current element.
1285 *
1286 * Returns a string containing the namespace URI to which the prefix maps
1287 * or NULL in case of error. The string must be deallocated by the caller.
1288 */
1289xmlChar *
1290xmlTextReaderLookupNamespace(xmlTextReaderPtr reader, const xmlChar *prefix) {
1291 xmlNsPtr ns;
1292
1293 if (reader == NULL)
1294 return(NULL);
1295 if (reader->node == NULL)
1296 return(NULL);
1297
1298 ns = xmlSearchNs(reader->node->doc, reader->node, prefix);
1299 if (ns == NULL)
1300 return(NULL);
1301 return(xmlStrdup(ns->href));
1302}
1303
1304/**
1305 * xmlTextReaderMoveToAttributeNo:
1306 * @reader: the xmlTextReaderPtr used
1307 * @no: the zero-based index of the attribute relative to the containing
1308 * element.
1309 *
1310 * Moves the position of the current instance to the attribute with
1311 * the specified index relative to the containing element.
1312 *
1313 * Returns 1 in case of success, -1 in case of error, 0 if not found
1314 */
1315int
1316xmlTextReaderMoveToAttributeNo(xmlTextReaderPtr reader, int no) {
1317 int i;
1318 xmlAttrPtr cur;
1319 xmlNsPtr ns;
1320
1321 if (reader == NULL)
1322 return(-1);
1323 if (reader->node == NULL)
1324 return(-1);
1325 /* TODO: handle the xmlDecl */
1326 if (reader->node->type != XML_ELEMENT_NODE)
1327 return(-1);
1328
1329 reader->curnode = NULL;
1330
1331 ns = reader->node->nsDef;
1332 for (i = 0;(i < no) && (ns != NULL);i++) {
1333 ns = ns->next;
1334 }
1335 if (ns != NULL) {
1336 reader->curnode = (xmlNodePtr) ns;
1337 return(1);
1338 }
1339
1340 cur = reader->node->properties;
1341 if (cur == NULL)
1342 return(0);
1343 for (;i < no;i++) {
1344 cur = cur->next;
1345 if (cur == NULL)
1346 return(0);
1347 }
1348 /* TODO walk the DTD if present */
1349
1350 reader->curnode = (xmlNodePtr) cur;
1351 return(1);
1352}
1353
1354/**
1355 * xmlTextReaderMoveToAttribute:
1356 * @reader: the xmlTextReaderPtr used
1357 * @name: the qualified name of the attribute.
1358 *
1359 * Moves the position of the current instance to the attribute with
1360 * the specified qualified name.
1361 *
1362 * Returns 1 in case of success, -1 in case of error, 0 if not found
1363 */
1364int
1365xmlTextReaderMoveToAttribute(xmlTextReaderPtr reader, const xmlChar *name) {
1366 xmlChar *prefix = NULL;
1367 xmlChar *localname;
1368 xmlNsPtr ns;
1369 xmlAttrPtr prop;
1370
1371 if ((reader == NULL) || (name == NULL))
1372 return(-1);
1373 if (reader->node == NULL)
1374 return(-1);
1375
1376 /* TODO: handle the xmlDecl */
1377 if (reader->node->type != XML_ELEMENT_NODE)
1378 return(0);
1379
1380 localname = xmlSplitQName2(name, &prefix);
1381 if (localname == NULL) {
1382 /*
1383 * Namespace default decl
1384 */
1385 if (xmlStrEqual(name, BAD_CAST "xmlns")) {
1386 ns = reader->node->nsDef;
1387 while (ns != NULL) {
1388 if (ns->prefix == NULL) {
1389 reader->curnode = (xmlNodePtr) ns;
1390 return(1);
1391 }
1392 ns = ns->next;
1393 }
1394 return(0);
1395 }
1396
1397 prop = reader->node->properties;
1398 while (prop != NULL) {
1399 /*
1400 * One need to have
1401 * - same attribute names
1402 * - and the attribute carrying that namespace
1403 */
1404 if ((xmlStrEqual(prop->name, name)) &&
1405 ((prop->ns == NULL) || (prop->ns->prefix == NULL))) {
1406 reader->curnode = (xmlNodePtr) prop;
1407 return(1);
1408 }
1409 prop = prop->next;
1410 }
1411 return(0);
1412 }
1413
1414 /*
1415 * Namespace default decl
1416 */
1417 if (xmlStrEqual(prefix, BAD_CAST "xmlns")) {
1418 ns = reader->node->nsDef;
1419 while (ns != NULL) {
1420 if ((ns->prefix != NULL) && (xmlStrEqual(ns->prefix, localname))) {
1421 reader->curnode = (xmlNodePtr) ns;
1422 goto found;
1423 }
1424 ns = ns->next;
1425 }
1426 goto not_found;
1427 }
1428 prop = reader->node->properties;
1429 while (prop != NULL) {
1430 /*
1431 * One need to have
1432 * - same attribute names
1433 * - and the attribute carrying that namespace
1434 */
1435 if ((xmlStrEqual(prop->name, localname)) &&
1436 (prop->ns != NULL) && (xmlStrEqual(prop->ns->prefix, prefix))) {
1437 reader->curnode = (xmlNodePtr) prop;
1438 goto found;
1439 }
1440 prop = prop->next;
1441 }
1442not_found:
1443 if (localname != NULL)
1444 xmlFree(localname);
1445 if (prefix != NULL)
1446 xmlFree(prefix);
1447 return(0);
1448
1449found:
1450 if (localname != NULL)
1451 xmlFree(localname);
1452 if (prefix != NULL)
1453 xmlFree(prefix);
1454 return(1);
1455}
1456
1457/**
1458 * xmlTextReaderMoveToAttributeNs:
1459 * @reader: the xmlTextReaderPtr used
1460 * @localName: the local name of the attribute.
1461 * @namespaceURI: the namespace URI of the attribute.
1462 *
1463 * Moves the position of the current instance to the attribute with the
1464 * specified local name and namespace URI.
1465 *
1466 * Returns 1 in case of success, -1 in case of error, 0 if not found
1467 */
1468int
1469xmlTextReaderMoveToAttributeNs(xmlTextReaderPtr reader,
1470 const xmlChar *localName, const xmlChar *namespaceURI) {
1471 xmlAttrPtr prop;
1472 xmlNodePtr node;
1473
1474 if ((reader == NULL) || (localName == NULL) || (namespaceURI == NULL))
1475 return(-1);
1476 if (reader->node == NULL)
1477 return(-1);
1478 if (reader->node->type != XML_ELEMENT_NODE)
1479 return(0);
1480 node = reader->node;
1481
1482 /*
1483 * A priori reading http://www.w3.org/TR/REC-xml-names/ there is no
1484 * namespace name associated to "xmlns"
1485 */
1486 prop = node->properties;
1487 while (prop != NULL) {
1488 /*
1489 * One need to have
1490 * - same attribute names
1491 * - and the attribute carrying that namespace
1492 */
1493 if (xmlStrEqual(prop->name, localName) &&
1494 ((prop->ns != NULL) &&
1495 (xmlStrEqual(prop->ns->href, namespaceURI)))) {
1496 reader->curnode = (xmlNodePtr) prop;
1497 return(1);
1498 }
1499 prop = prop->next;
1500 }
1501 return(0);
1502}
1503
1504/**
1505 * xmlTextReaderMoveToFirstAttribute:
1506 * @reader: the xmlTextReaderPtr used
1507 *
1508 * Moves the position of the current instance to the first attribute
1509 * associated with the current node.
1510 *
1511 * Returns 1 in case of success, -1 in case of error, 0 if not found
1512 */
1513int
1514xmlTextReaderMoveToFirstAttribute(xmlTextReaderPtr reader) {
1515 if (reader == NULL)
1516 return(-1);
1517 if (reader->node == NULL)
1518 return(-1);
1519 if (reader->node->type != XML_ELEMENT_NODE)
1520 return(0);
1521
1522 if (reader->node->nsDef != NULL) {
1523 reader->curnode = (xmlNodePtr) reader->node->nsDef;
1524 return(1);
1525 }
1526 if (reader->node->properties != NULL) {
1527 reader->curnode = (xmlNodePtr) reader->node->properties;
1528 return(1);
1529 }
1530 return(0);
1531}
1532
1533/**
1534 * xmlTextReaderMoveToNextAttribute:
1535 * @reader: the xmlTextReaderPtr used
1536 *
1537 * Moves the position of the current instance to the next attribute
1538 * associated with the current node.
1539 *
1540 * Returns 1 in case of success, -1 in case of error, 0 if not found
1541 */
1542int
1543xmlTextReaderMoveToNextAttribute(xmlTextReaderPtr reader) {
1544 if (reader == NULL)
1545 return(-1);
1546 if (reader->node == NULL)
1547 return(-1);
1548 if (reader->node->type != XML_ELEMENT_NODE)
1549 return(0);
1550 if (reader->curnode == NULL)
1551 return(xmlTextReaderMoveToFirstAttribute(reader));
1552
1553 if (reader->curnode->type == XML_NAMESPACE_DECL) {
1554 xmlNsPtr ns = (xmlNsPtr) reader->curnode;
1555 if (ns->next != NULL) {
1556 reader->curnode = (xmlNodePtr) ns->next;
1557 return(1);
1558 }
1559 if (reader->node->properties != NULL) {
1560 reader->curnode = (xmlNodePtr) reader->node->properties;
1561 return(1);
1562 }
1563 return(0);
1564 } else if ((reader->curnode->type == XML_ATTRIBUTE_NODE) &&
1565 (reader->curnode->next != NULL)) {
1566 reader->curnode = reader->curnode->next;
1567 return(1);
1568 }
1569 return(0);
1570}
1571
1572/**
1573 * xmlTextReaderMoveToElement:
1574 * @reader: the xmlTextReaderPtr used
1575 *
1576 * Moves the position of the current instance to the node that
1577 * contains the current Attribute node.
1578 *
1579 * Returns 1 in case of success, -1 in case of error, 0 if not moved
1580 */
1581int
1582xmlTextReaderMoveToElement(xmlTextReaderPtr reader) {
1583 if (reader == NULL)
1584 return(-1);
1585 if (reader->node == NULL)
1586 return(-1);
1587 if (reader->node->type != XML_ELEMENT_NODE)
1588 return(0);
1589 if (reader->curnode != NULL) {
1590 reader->curnode = NULL;
1591 return(1);
1592 }
1593 return(0);
1594}
1595
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00001596/**
1597 * xmlTextReaderReadAttributeValue:
1598 * @reader: the xmlTextReaderPtr used
1599 *
1600 * Parses an attribute value into one or more Text and EntityReference nodes.
1601 *
1602 * Returns 1 in case of success, 0 if the reader was not positionned on an
1603 * ttribute node or all the attribute values have been read, or -1
1604 * in case of error.
1605 */
1606int
1607xmlTextReaderReadAttributeValue(xmlTextReaderPtr reader) {
1608 if (reader == NULL)
1609 return(-1);
1610 if (reader->node == NULL)
1611 return(-1);
1612 if (reader->curnode == NULL)
1613 return(0);
1614 if (reader->curnode->type == XML_ATTRIBUTE_NODE) {
1615 if (reader->curnode->children == NULL)
1616 return(0);
1617 reader->curnode = reader->curnode->children;
1618 } else if (reader->curnode->type == XML_NAMESPACE_DECL) {
1619 xmlNsPtr ns = (xmlNsPtr) reader->curnode;
1620
1621 if (reader->faketext == NULL) {
1622 reader->faketext = xmlNewDocText(reader->node->doc,
1623 ns->href);
1624 } else {
1625 if (reader->faketext->content != NULL)
1626 xmlFree(reader->faketext->content);
1627 reader->faketext->content = xmlStrdup(ns->href);
1628 }
1629 reader->curnode = reader->faketext;
1630 } else {
1631 if (reader->curnode->next == NULL)
1632 return(0);
1633 reader->curnode = reader->curnode->next;
1634 }
1635 return(1);
1636}
1637
Daniel Veillard0eb38c72002-12-14 23:00:35 +00001638/************************************************************************
1639 * *
 *		Access API to the current node				*
1641 * *
1642 ************************************************************************/
1643/**
1644 * xmlTextReaderAttributeCount:
1645 * @reader: the xmlTextReaderPtr used
1646 *
Daniel Veillarda9b66d02002-12-11 14:23:49 +00001647 * Provides the number of attributes of the current node
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001648 *
1649 * Returns 0 i no attributes, -1 in case of error or the attribute count
1650 */
1651int
1652xmlTextReaderAttributeCount(xmlTextReaderPtr reader) {
1653 int ret;
1654 xmlAttrPtr attr;
Daniel Veillard67df8092002-12-16 22:04:11 +00001655 xmlNsPtr ns;
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001656 xmlNodePtr node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001657
1658 if (reader == NULL)
1659 return(-1);
1660 if (reader->node == NULL)
1661 return(0);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001662
1663 if (reader->curnode != NULL)
1664 node = reader->curnode;
1665 else
1666 node = reader->node;
1667
1668 if (node->type != XML_ELEMENT_NODE)
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001669 return(0);
1670 if ((reader->state == XML_TEXTREADER_END) ||
1671 (reader->state == XML_TEXTREADER_BACKTRACK))
1672 return(0);
1673 ret = 0;
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001674 attr = node->properties;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001675 while (attr != NULL) {
1676 ret++;
1677 attr = attr->next;
1678 }
Daniel Veillard67df8092002-12-16 22:04:11 +00001679 ns = node->nsDef;
1680 while (ns != NULL) {
1681 ret++;
1682 ns = ns->next;
1683 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001684 return(ret);
1685}
1686
1687/**
1688 * xmlTextReaderNodeType:
1689 * @reader: the xmlTextReaderPtr used
1690 *
1691 * Get the node type of the current node
1692 * Reference:
1693 * http://dotgnu.org/pnetlib-doc/System/Xml/XmlNodeType.html
1694 *
1695 * Returns the xmlNodeType of the current node or -1 in case of error
1696 */
1697int
1698xmlTextReaderNodeType(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001699 xmlNodePtr node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001700 if (reader == NULL)
1701 return(-1);
1702 if (reader->node == NULL)
1703 return(0);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001704 if (reader->curnode != NULL)
1705 node = reader->curnode;
1706 else
1707 node = reader->node;
1708 switch (node->type) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001709 case XML_ELEMENT_NODE:
1710 if ((reader->state == XML_TEXTREADER_END) ||
1711 (reader->state == XML_TEXTREADER_BACKTRACK))
1712 return(15);
1713 return(1);
Daniel Veillardecaba492002-12-30 10:55:29 +00001714 case XML_NAMESPACE_DECL:
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001715 case XML_ATTRIBUTE_NODE:
1716 return(2);
1717 case XML_TEXT_NODE:
1718 return(3); /* TODO: SignificantWhitespace == 14 Whitespace == 13 */
1719 case XML_CDATA_SECTION_NODE:
1720 return(4);
1721 case XML_ENTITY_REF_NODE:
1722 return(5);
1723 case XML_ENTITY_NODE:
1724 return(6);
1725 case XML_PI_NODE:
1726 return(7);
1727 case XML_COMMENT_NODE:
1728 return(8);
1729 case XML_DOCUMENT_NODE:
1730 case XML_HTML_DOCUMENT_NODE:
1731#ifdef LIBXML_DOCB_ENABLED
1732 case XML_DOCB_DOCUMENT_NODE:
1733#endif
1734 return(9);
1735 case XML_DOCUMENT_FRAG_NODE:
1736 return(11);
1737 case XML_NOTATION_NODE:
1738 return(12);
1739 case XML_DOCUMENT_TYPE_NODE:
1740 case XML_DTD_NODE:
1741 return(10);
1742
1743 case XML_ELEMENT_DECL:
1744 case XML_ATTRIBUTE_DECL:
1745 case XML_ENTITY_DECL:
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001746 case XML_XINCLUDE_START:
1747 case XML_XINCLUDE_END:
1748 return(0);
1749 }
1750 return(-1);
1751}
1752
1753/**
Daniel Veillard01c13b52002-12-10 15:19:08 +00001754 * xmlTextReaderIsEmptyElement:
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001755 * @reader: the xmlTextReaderPtr used
1756 *
1757 * Check if the current node is empty
1758 *
1759 * Returns 1 if empty, 0 if not and -1 in case of error
1760 */
1761int
1762xmlTextReaderIsEmptyElement(xmlTextReaderPtr reader) {
1763 if ((reader == NULL) || (reader->node == NULL))
1764 return(-1);
Daniel Veillarddf512f42002-12-23 15:56:21 +00001765 if (reader->node->type != XML_ELEMENT_NODE)
1766 return(0);
Daniel Veillarde3c036e2003-01-01 15:11:05 +00001767 if (reader->curnode != NULL)
1768 return(0);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001769 if (reader->node->children != NULL)
1770 return(0);
Daniel Veillarddab8ea92003-01-02 14:16:45 +00001771 if (reader->state == XML_TEXTREADER_END)
1772 return(0);
Daniel Veillard067bae52003-01-05 01:27:54 +00001773 return(reader->node->_private == (void *)xmlTextReaderIsEmpty);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001774}
1775
1776/**
1777 * xmlTextReaderLocalName:
1778 * @reader: the xmlTextReaderPtr used
1779 *
1780 * The local name of the node.
1781 *
1782 * Returns the local name or NULL if not available
1783 */
1784xmlChar *
1785xmlTextReaderLocalName(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001786 xmlNodePtr node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001787 if ((reader == NULL) || (reader->node == NULL))
1788 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001789 if (reader->curnode != NULL)
1790 node = reader->curnode;
1791 else
1792 node = reader->node;
1793 if (node->type == XML_NAMESPACE_DECL) {
1794 xmlNsPtr ns = (xmlNsPtr) node;
1795 if (ns->prefix == NULL)
1796 return(xmlStrdup(BAD_CAST "xmlns"));
1797 else
1798 return(xmlStrdup(ns->prefix));
1799 }
1800 if ((node->type != XML_ELEMENT_NODE) &&
1801 (node->type != XML_ATTRIBUTE_NODE))
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00001802 return(xmlTextReaderName(reader));
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001803 return(xmlStrdup(node->name));
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001804}
1805
1806/**
1807 * xmlTextReaderName:
1808 * @reader: the xmlTextReaderPtr used
1809 *
1810 * The qualified name of the node, equal to Prefix :LocalName.
1811 *
1812 * Returns the local name or NULL if not available
1813 */
1814xmlChar *
1815xmlTextReaderName(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001816 xmlNodePtr node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001817 xmlChar *ret;
1818
1819 if ((reader == NULL) || (reader->node == NULL))
1820 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001821 if (reader->curnode != NULL)
1822 node = reader->curnode;
1823 else
1824 node = reader->node;
1825 switch (node->type) {
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00001826 case XML_ELEMENT_NODE:
1827 case XML_ATTRIBUTE_NODE:
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001828 if ((node->ns == NULL) ||
1829 (node->ns->prefix == NULL))
1830 return(xmlStrdup(node->name));
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00001831
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001832 ret = xmlStrdup(node->ns->prefix);
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00001833 ret = xmlStrcat(ret, BAD_CAST ":");
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001834 ret = xmlStrcat(ret, node->name);
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00001835 return(ret);
1836 case XML_TEXT_NODE:
1837 return(xmlStrdup(BAD_CAST "#text"));
1838 case XML_CDATA_SECTION_NODE:
1839 return(xmlStrdup(BAD_CAST "#cdata-section"));
1840 case XML_ENTITY_NODE:
1841 case XML_ENTITY_REF_NODE:
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001842 return(xmlStrdup(node->name));
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00001843 case XML_PI_NODE:
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001844 return(xmlStrdup(node->name));
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00001845 case XML_COMMENT_NODE:
1846 return(xmlStrdup(BAD_CAST "#comment"));
1847 case XML_DOCUMENT_NODE:
1848 case XML_HTML_DOCUMENT_NODE:
1849#ifdef LIBXML_DOCB_ENABLED
1850 case XML_DOCB_DOCUMENT_NODE:
1851#endif
1852 return(xmlStrdup(BAD_CAST "#document"));
1853 case XML_DOCUMENT_FRAG_NODE:
1854 return(xmlStrdup(BAD_CAST "#document-fragment"));
1855 case XML_NOTATION_NODE:
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001856 return(xmlStrdup(node->name));
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00001857 case XML_DOCUMENT_TYPE_NODE:
1858 case XML_DTD_NODE:
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001859 return(xmlStrdup(node->name));
1860 case XML_NAMESPACE_DECL: {
1861 xmlNsPtr ns = (xmlNsPtr) node;
1862
1863 ret = xmlStrdup(BAD_CAST "xmlns");
1864 if (ns->prefix == NULL)
1865 return(ret);
1866 ret = xmlStrcat(ret, BAD_CAST ":");
1867 ret = xmlStrcat(ret, ns->prefix);
1868 return(ret);
1869 }
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00001870
1871 case XML_ELEMENT_DECL:
1872 case XML_ATTRIBUTE_DECL:
1873 case XML_ENTITY_DECL:
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00001874 case XML_XINCLUDE_START:
1875 case XML_XINCLUDE_END:
1876 return(NULL);
1877 }
1878 return(NULL);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001879}
1880
1881/**
1882 * xmlTextReaderPrefix:
1883 * @reader: the xmlTextReaderPtr used
1884 *
1885 * A shorthand reference to the namespace associated with the node.
1886 *
1887 * Returns the prefix or NULL if not available
1888 */
1889xmlChar *
1890xmlTextReaderPrefix(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001891 xmlNodePtr node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001892 if ((reader == NULL) || (reader->node == NULL))
1893 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001894 if (reader->curnode != NULL)
1895 node = reader->curnode;
1896 else
1897 node = reader->node;
1898 if (node->type == XML_NAMESPACE_DECL) {
1899 xmlNsPtr ns = (xmlNsPtr) node;
1900 if (ns->prefix == NULL)
1901 return(NULL);
1902 return(xmlStrdup(BAD_CAST "xmlns"));
1903 }
1904 if ((node->type != XML_ELEMENT_NODE) &&
1905 (node->type != XML_ATTRIBUTE_NODE))
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001906 return(NULL);
Daniel Veillard952379b2003-03-17 15:37:12 +00001907 if ((node->ns != NULL) && (node->ns->prefix != NULL))
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001908 return(xmlStrdup(node->ns->prefix));
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001909 return(NULL);
1910}
1911
1912/**
1913 * xmlTextReaderNamespaceUri:
1914 * @reader: the xmlTextReaderPtr used
1915 *
1916 * The URI defining the namespace associated with the node.
1917 *
1918 * Returns the namespace URI or NULL if not available
1919 */
1920xmlChar *
1921xmlTextReaderNamespaceUri(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001922 xmlNodePtr node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001923 if ((reader == NULL) || (reader->node == NULL))
1924 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001925 if (reader->curnode != NULL)
1926 node = reader->curnode;
1927 else
1928 node = reader->node;
Daniel Veillardecaba492002-12-30 10:55:29 +00001929 if (node->type == XML_NAMESPACE_DECL)
1930 return(xmlStrdup(BAD_CAST "http://www.w3.org/2000/xmlns/"));
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001931 if ((node->type != XML_ELEMENT_NODE) &&
1932 (node->type != XML_ATTRIBUTE_NODE))
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001933 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001934 if (node->ns != NULL)
1935 return(xmlStrdup(node->ns->href));
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001936 return(NULL);
1937}
1938
1939/**
1940 * xmlTextReaderBaseUri:
1941 * @reader: the xmlTextReaderPtr used
1942 *
1943 * The base URI of the node.
1944 *
1945 * Returns the base URI or NULL if not available
1946 */
1947xmlChar *
1948xmlTextReaderBaseUri(xmlTextReaderPtr reader) {
1949 if ((reader == NULL) || (reader->node == NULL))
1950 return(NULL);
1951 return(xmlNodeGetBase(NULL, reader->node));
1952}
1953
1954/**
1955 * xmlTextReaderDepth:
1956 * @reader: the xmlTextReaderPtr used
1957 *
1958 * The depth of the node in the tree.
1959 *
1960 * Returns the depth or -1 in case of error
1961 */
1962int
1963xmlTextReaderDepth(xmlTextReaderPtr reader) {
1964 if (reader == NULL)
1965 return(-1);
1966 if (reader->node == NULL)
1967 return(0);
1968
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00001969 if (reader->curnode != NULL) {
1970 if ((reader->curnode->type == XML_ATTRIBUTE_NODE) ||
1971 (reader->curnode->type == XML_NAMESPACE_DECL))
1972 return(reader->depth + 1);
1973 return(reader->depth + 2);
1974 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001975 return(reader->depth);
1976}
1977
1978/**
1979 * xmlTextReaderHasAttributes:
1980 * @reader: the xmlTextReaderPtr used
1981 *
1982 * Whether the node has attributes.
1983 *
1984 * Returns 1 if true, 0 if false, and -1 in case or error
1985 */
1986int
1987xmlTextReaderHasAttributes(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001988 xmlNodePtr node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001989 if (reader == NULL)
1990 return(-1);
1991 if (reader->node == NULL)
1992 return(0);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001993 if (reader->curnode != NULL)
1994 node = reader->curnode;
1995 else
1996 node = reader->node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001997
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001998 if ((node->type == XML_ELEMENT_NODE) &&
1999 (node->properties != NULL))
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002000 return(1);
2001 /* TODO: handle the xmlDecl */
2002 return(0);
2003}
2004
2005/**
2006 * xmlTextReaderHasValue:
2007 * @reader: the xmlTextReaderPtr used
2008 *
2009 * Whether the node can have a text value.
2010 *
2011 * Returns 1 if true, 0 if false, and -1 in case or error
2012 */
2013int
2014xmlTextReaderHasValue(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002015 xmlNodePtr node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002016 if (reader == NULL)
2017 return(-1);
2018 if (reader->node == NULL)
2019 return(0);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002020 if (reader->curnode != NULL)
2021 node = reader->curnode;
2022 else
2023 node = reader->node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002024
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002025 switch (node->type) {
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002026 case XML_ATTRIBUTE_NODE:
2027 case XML_TEXT_NODE:
2028 case XML_CDATA_SECTION_NODE:
2029 case XML_PI_NODE:
2030 case XML_COMMENT_NODE:
2031 return(1);
2032 default:
2033 return(0);
2034 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002035 return(0);
2036}
2037
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002038/**
2039 * xmlTextReaderValue:
2040 * @reader: the xmlTextReaderPtr used
2041 *
2042 * Provides the text value of the node if present
2043 *
2044 * Returns the string or NULL if not available. The retsult must be deallocated
2045 * with xmlFree()
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002046 */
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002047xmlChar *
2048xmlTextReaderValue(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002049 xmlNodePtr node;
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002050 if (reader == NULL)
2051 return(NULL);
2052 if (reader->node == NULL)
2053 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002054 if (reader->curnode != NULL)
2055 node = reader->curnode;
2056 else
2057 node = reader->node;
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002058
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002059 switch (node->type) {
2060 case XML_NAMESPACE_DECL:
2061 return(xmlStrdup(((xmlNsPtr) node)->href));
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002062 case XML_ATTRIBUTE_NODE:{
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002063 xmlAttrPtr attr = (xmlAttrPtr) node;
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002064
2065 if (attr->parent != NULL)
2066 return (xmlNodeListGetString
2067 (attr->parent->doc, attr->children, 1));
2068 else
2069 return (xmlNodeListGetString(NULL, attr->children, 1));
2070 break;
2071 }
2072 case XML_TEXT_NODE:
2073 case XML_CDATA_SECTION_NODE:
2074 case XML_PI_NODE:
2075 case XML_COMMENT_NODE:
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002076 if (node->content != NULL)
2077 return (xmlStrdup(node->content));
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002078 default:
2079 return(NULL);
2080 }
2081 return(NULL);
2082}
2083
2084/**
2085 * xmlTextReaderIsDefault:
2086 * @reader: the xmlTextReaderPtr used
2087 *
2088 * Whether an Attribute node was generated from the default value
2089 * defined in the DTD or schema.
2090 *
2091 * Returns 0 if not defaulted, 1 if defaulted, and -1 in case of error
2092 */
2093int
2094xmlTextReaderIsDefault(xmlTextReaderPtr reader) {
2095 if (reader == NULL)
2096 return(-1);
2097 return(0);
2098}
2099
2100/**
2101 * xmlTextReaderQuoteChar:
2102 * @reader: the xmlTextReaderPtr used
2103 *
2104 * The quotation mark character used to enclose the value of an attribute.
2105 *
2106 * Returns " or ' and -1 in case of error
2107 */
2108int
2109xmlTextReaderQuoteChar(xmlTextReaderPtr reader) {
2110 if (reader == NULL)
2111 return(-1);
2112 /* TODO maybe lookup the attribute value for " first */
2113 return((int) '"');
2114}
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002115
2116/**
2117 * xmlTextReaderXmlLang:
2118 * @reader: the xmlTextReaderPtr used
2119 *
2120 * The xml:lang scope within which the node resides.
2121 *
2122 * Returns the xml:lang value or NULL if none exists.
2123 */
2124xmlChar *
2125xmlTextReaderXmlLang(xmlTextReaderPtr reader) {
2126 if (reader == NULL)
2127 return(NULL);
2128 if (reader->node == NULL)
2129 return(NULL);
2130 return(xmlNodeGetLang(reader->node));
2131}
2132
Daniel Veillard67df8092002-12-16 22:04:11 +00002133/**
2134 * xmlTextReaderNormalization:
2135 * @reader: the xmlTextReaderPtr used
2136 *
2137 * The value indicating whether to normalize white space and attribute values.
2138 * Since attribute value and end of line normalizations are a MUST in the XML
2139 * specification only the value true is accepted. The broken bahaviour of
2140 * accepting out of range character entities like &#0; is of course not
2141 * supported either.
2142 *
2143 * Returns 1 or -1 in case of error.
2144 */
2145int
2146xmlTextReaderNormalization(xmlTextReaderPtr reader) {
2147 if (reader == NULL)
2148 return(-1);
2149 return(1);
2150}
2151
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00002152/************************************************************************
2153 * *
2154 * Extensions to the base APIs *
2155 * *
2156 ************************************************************************/
2157
2158/**
2159 * xmlTextReaderSetParserProp:
2160 * @reader: the xmlTextReaderPtr used
2161 * @prop: the xmlParserProperties to set
2162 * @value: usually 0 or 1 to (de)activate it
2163 *
2164 * Change the parser processing behaviour by changing some of its internal
2165 * properties. Note that some properties can only be changed before any
2166 * read has been done.
2167 *
2168 * Returns 0 if the call was successful, or -1 in case of error
2169 */
2170int
2171xmlTextReaderSetParserProp(xmlTextReaderPtr reader, int prop, int value) {
2172 xmlParserProperties p = (xmlParserProperties) prop;
2173 xmlParserCtxtPtr ctxt;
2174
2175 if ((reader == NULL) || (reader->ctxt == NULL))
2176 return(-1);
2177 ctxt = reader->ctxt;
2178
2179 switch (p) {
2180 case XML_PARSER_LOADDTD:
2181 if (value != 0) {
2182 if (ctxt->loadsubset == 0) {
2183 if (reader->mode != XML_TEXTREADER_MODE_INITIAL)
2184 return(-1);
2185 ctxt->loadsubset = XML_DETECT_IDS;
2186 }
2187 } else {
2188 ctxt->loadsubset = 0;
2189 }
2190 return(0);
2191 case XML_PARSER_DEFAULTATTRS:
2192 if (value != 0) {
2193 ctxt->loadsubset |= XML_COMPLETE_ATTRS;
2194 } else {
2195 if (ctxt->loadsubset & XML_COMPLETE_ATTRS)
2196 ctxt->loadsubset -= XML_COMPLETE_ATTRS;
2197 }
2198 return(0);
2199 case XML_PARSER_VALIDATE:
2200 if (value != 0) {
2201 ctxt->validate = 1;
2202 } else {
2203 ctxt->validate = 0;
2204 }
2205 return(0);
Daniel Veillarde18fc182002-12-28 22:56:33 +00002206 case XML_PARSER_SUBST_ENTITIES:
2207 if (value != 0) {
2208 ctxt->replaceEntities = 1;
2209 } else {
2210 ctxt->replaceEntities = 0;
2211 }
2212 return(0);
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00002213 }
2214 return(-1);
2215}
2216
2217/**
2218 * xmlTextReaderGetParserProp:
2219 * @reader: the xmlTextReaderPtr used
2220 * @prop: the xmlParserProperties to get
2221 *
2222 * Read the parser internal property.
2223 *
2224 * Returns the value, usually 0 or 1, or -1 in case of error.
2225 */
2226int
2227xmlTextReaderGetParserProp(xmlTextReaderPtr reader, int prop) {
2228 xmlParserProperties p = (xmlParserProperties) prop;
2229 xmlParserCtxtPtr ctxt;
2230
2231 if ((reader == NULL) || (reader->ctxt == NULL))
2232 return(-1);
2233 ctxt = reader->ctxt;
2234
2235 switch (p) {
2236 case XML_PARSER_LOADDTD:
2237 if ((ctxt->loadsubset != 0) || (ctxt->validate != 0))
2238 return(1);
2239 return(0);
2240 case XML_PARSER_DEFAULTATTRS:
2241 if (ctxt->loadsubset & XML_COMPLETE_ATTRS)
2242 return(1);
2243 return(0);
2244 case XML_PARSER_VALIDATE:
2245 return(ctxt->validate);
Daniel Veillarde18fc182002-12-28 22:56:33 +00002246 case XML_PARSER_SUBST_ENTITIES:
2247 return(ctxt->replaceEntities);
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00002248 }
2249 return(-1);
2250}
2251
Daniel Veillarde18fc182002-12-28 22:56:33 +00002252/**
2253 * xmlTextReaderCurrentNode:
2254 * @reader: the xmlTextReaderPtr used
2255 *
2256 * Hacking interface allowing to get the xmlNodePtr correponding to the
2257 * current node being accessed by the xmlTextReader. This is dangerous
2258 * because the underlying node may be destroyed on the next Reads.
2259 *
2260 * Returns the xmlNodePtr or NULL in case of error.
2261 */
2262xmlNodePtr
2263xmlTextReaderCurrentNode(xmlTextReaderPtr reader) {
2264 if (reader == NULL)
2265 return(NULL);
2266
2267 if (reader->curnode != NULL)
2268 return(reader->curnode);
2269 return(reader->node);
2270}
2271
2272/**
2273 * xmlTextReaderCurrentDoc:
2274 * @reader: the xmlTextReaderPtr used
2275 *
2276 * Hacking interface allowing to get the xmlDocPtr correponding to the
2277 * current document being accessed by the xmlTextReader. This is dangerous
2278 * because the associated node may be destroyed on the next Reads.
2279 *
2280 * Returns the xmlDocPtr or NULL in case of error.
2281 */
2282xmlDocPtr
2283xmlTextReaderCurrentDoc(xmlTextReaderPtr reader) {
2284 if ((reader == NULL) || (reader->ctxt == NULL))
2285 return(NULL);
2286
2287 return(reader->ctxt->myDoc);
2288}
2289
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00002290/************************************************************************
2291 * *
Daniel Veillard26f70262003-01-16 22:45:08 +00002292 * Error Handling Extensions *
2293 * *
2294 ************************************************************************/
2295
2296/* helper to build a xmlMalloc'ed string from a format and va_list */
2297static char *
2298xmlTextReaderBuildMessage(const char *msg, va_list ap) {
2299 int size;
2300 int chars;
2301 char *larger;
2302 char *str;
2303
2304 str = (char *) xmlMalloc(150);
2305 if (str == NULL) {
2306 xmlGenericError(xmlGenericErrorContext, "xmlMalloc failed !\n");
2307 return NULL;
2308 }
2309
2310 size = 150;
2311
2312 while (1) {
2313 chars = vsnprintf(str, size, msg, ap);
2314 if ((chars > -1) && (chars < size))
2315 break;
2316 if (chars > -1)
2317 size += chars + 1;
2318 else
2319 size += 100;
2320 if ((larger = (char *) xmlRealloc(str, size)) == NULL) {
2321 xmlGenericError(xmlGenericErrorContext, "xmlRealloc failed !\n");
2322 xmlFree(str);
2323 return NULL;
2324 }
2325 str = larger;
2326 }
2327
2328 return str;
2329}
2330
Daniel Veillard417be3a2003-01-20 21:26:34 +00002331/**
Daniel Veillard540a31a2003-01-21 11:21:07 +00002332 * xmlTextReaderLocatorLineNumber:
Daniel Veillard417be3a2003-01-20 21:26:34 +00002333 * @locator: the xmlTextReaderLocatorPtr used
2334 *
2335 * Obtain the line number for the given locator.
2336 *
2337 * Returns the line number or -1 in case of error.
2338 */
2339int
2340xmlTextReaderLocatorLineNumber(xmlTextReaderLocatorPtr locator) {
2341 /* we know that locator is a xmlParserCtxtPtr */
2342 xmlParserCtxtPtr ctx = (xmlParserCtxtPtr)locator;
2343 int ret = -1;
2344
2345 if (ctx->node != NULL) {
2346 ret = xmlGetLineNo(ctx->node);
2347 }
2348 else {
2349 /* inspired from error.c */
2350 xmlParserInputPtr input;
2351 input = ctx->input;
2352 if ((input->filename == NULL) && (ctx->inputNr > 1))
2353 input = ctx->inputTab[ctx->inputNr - 2];
2354 if (input != NULL) {
2355 ret = input->line;
2356 }
2357 else {
2358 ret = -1;
2359 }
2360 }
2361
2362 return ret;
2363}
2364
2365/**
Daniel Veillard540a31a2003-01-21 11:21:07 +00002366 * xmlTextReaderLocatorBaseURI:
Daniel Veillard417be3a2003-01-20 21:26:34 +00002367 * @locator: the xmlTextReaderLocatorPtr used
2368 *
2369 * Obtain the base URI for the given locator.
2370 *
2371 * Returns the base URI or NULL in case of error.
2372 */
2373xmlChar *
2374xmlTextReaderLocatorBaseURI(xmlTextReaderLocatorPtr locator) {
2375 /* we know that locator is a xmlParserCtxtPtr */
2376 xmlParserCtxtPtr ctx = (xmlParserCtxtPtr)locator;
2377 xmlChar *ret = NULL;
2378
2379 if (ctx->node != NULL) {
2380 ret = xmlNodeGetBase(NULL,ctx->node);
2381 }
2382 else {
2383 /* inspired from error.c */
2384 xmlParserInputPtr input;
2385 input = ctx->input;
2386 if ((input->filename == NULL) && (ctx->inputNr > 1))
2387 input = ctx->inputTab[ctx->inputNr - 2];
2388 if (input != NULL) {
Daniel Veillard580ced82003-03-21 21:22:48 +00002389 ret = xmlStrdup(BAD_CAST input->filename);
Daniel Veillard417be3a2003-01-20 21:26:34 +00002390 }
2391 else {
2392 ret = NULL;
2393 }
2394 }
2395
2396 return ret;
2397}
2398
Daniel Veillard26f70262003-01-16 22:45:08 +00002399static void
2400xmlTextReaderGenericError(void *ctxt, int severity, char *str) {
2401 xmlParserCtxtPtr ctx = (xmlParserCtxtPtr)ctxt;
2402 xmlTextReaderPtr reader = (xmlTextReaderPtr)ctx->_private;
2403
2404 if (str != NULL) {
2405 reader->errorFunc(reader->errorFuncArg,
2406 str,
Daniel Veillard417be3a2003-01-20 21:26:34 +00002407 severity,
2408 (xmlTextReaderLocatorPtr)ctx);
Daniel Veillard26f70262003-01-16 22:45:08 +00002409 xmlFree(str);
2410 }
2411}
2412
2413static void
2414xmlTextReaderError(void *ctxt, const char *msg, ...) {
2415 va_list ap;
2416
2417 va_start(ap,msg);
2418 xmlTextReaderGenericError(ctxt,
Daniel Veillard417be3a2003-01-20 21:26:34 +00002419 XML_PARSER_SEVERITY_ERROR,
Daniel Veillard26f70262003-01-16 22:45:08 +00002420 xmlTextReaderBuildMessage(msg,ap));
2421 va_end(ap);
2422
2423}
2424
2425static void
2426xmlTextReaderWarning(void *ctxt, const char *msg, ...) {
2427 va_list ap;
2428
2429 va_start(ap,msg);
2430 xmlTextReaderGenericError(ctxt,
Daniel Veillard417be3a2003-01-20 21:26:34 +00002431 XML_PARSER_SEVERITY_WARNING,
Daniel Veillard26f70262003-01-16 22:45:08 +00002432 xmlTextReaderBuildMessage(msg,ap));
2433 va_end(ap);
2434}
2435
2436static void
2437xmlTextReaderValidityError(void *ctxt, const char *msg, ...) {
2438 va_list ap;
Daniel Veillard417be3a2003-01-20 21:26:34 +00002439 int len = xmlStrlen((const xmlChar *) msg);
Daniel Veillard26f70262003-01-16 22:45:08 +00002440
Daniel Veillard417be3a2003-01-20 21:26:34 +00002441 if ((len > 1) && (msg[len - 2] != ':')) {
2442 /*
2443 * some callbacks only report locator information:
2444 * skip them (mimicking behaviour in error.c)
2445 */
2446 va_start(ap,msg);
2447 xmlTextReaderGenericError(ctxt,
2448 XML_PARSER_SEVERITY_VALIDITY_ERROR,
2449 xmlTextReaderBuildMessage(msg,ap));
2450 va_end(ap);
2451 }
Daniel Veillard26f70262003-01-16 22:45:08 +00002452}
2453
2454static void
2455xmlTextReaderValidityWarning(void *ctxt, const char *msg, ...) {
2456 va_list ap;
Daniel Veillard417be3a2003-01-20 21:26:34 +00002457 int len = xmlStrlen((const xmlChar *) msg);
Daniel Veillard26f70262003-01-16 22:45:08 +00002458
Daniel Veillard417be3a2003-01-20 21:26:34 +00002459 if ((len != 0) && (msg[len - 1] != ':')) {
2460 /*
2461 * some callbacks only report locator information:
2462 * skip them (mimicking behaviour in error.c)
2463 */
2464 va_start(ap,msg);
2465 xmlTextReaderGenericError(ctxt,
2466 XML_PARSER_SEVERITY_VALIDITY_WARNING,
2467 xmlTextReaderBuildMessage(msg,ap));
2468 va_end(ap);
2469 }
Daniel Veillard26f70262003-01-16 22:45:08 +00002470}
2471
2472/**
2473 * xmlTextReaderSetErrorHandler:
2474 * @reader: the xmlTextReaderPtr used
2475 * @f: the callback function to call on error and warnings
2476 * @arg: a user argument to pass to the callback function
2477 *
Daniel Veillard417be3a2003-01-20 21:26:34 +00002478 * Register a callback function that will be called on error and warnings.
2479 *
Daniel Veillard26f70262003-01-16 22:45:08 +00002480 * If @f is NULL, the default error and warning handlers are restored.
2481 */
2482void
2483xmlTextReaderSetErrorHandler(xmlTextReaderPtr reader,
2484 xmlTextReaderErrorFunc f,
Daniel Veillard417be3a2003-01-20 21:26:34 +00002485 void *arg) {
Daniel Veillard26f70262003-01-16 22:45:08 +00002486 if (f != NULL) {
2487 reader->ctxt->sax->error = xmlTextReaderError;
2488 reader->ctxt->vctxt.error = xmlTextReaderValidityError;
2489 reader->ctxt->sax->warning = xmlTextReaderWarning;
2490 reader->ctxt->vctxt.warning = xmlTextReaderValidityWarning;
2491 reader->errorFunc = f;
2492 reader->errorFuncArg = arg;
2493 }
2494 else {
2495 /* restore defaults */
2496 reader->ctxt->sax->error = xmlParserError;
2497 reader->ctxt->vctxt.error = xmlParserValidityError;
2498 reader->ctxt->sax->warning = xmlParserWarning;
2499 reader->ctxt->vctxt.warning = xmlParserValidityWarning;
2500 reader->errorFunc = NULL;
2501 reader->errorFuncArg = NULL;
2502 }
2503}
2504
Daniel Veillard417be3a2003-01-20 21:26:34 +00002505/**
2506 * xmlTextReaderGetErrorHandler:
2507 * @reader: the xmlTextReaderPtr used
2508 * @f: the callback function or NULL is no callback has been registered
2509 * @arg: a user argument
2510 *
2511 * Retrieve the error callback function and user argument.
2512 */
Daniel Veillard26f70262003-01-16 22:45:08 +00002513void
2514xmlTextReaderGetErrorHandler(xmlTextReaderPtr reader,
2515 xmlTextReaderErrorFunc *f,
Daniel Veillard417be3a2003-01-20 21:26:34 +00002516 void **arg) {
Daniel Veillard26f70262003-01-16 22:45:08 +00002517 *f = reader->errorFunc;
2518 *arg = reader->errorFuncArg;
2519}
2520
2521/************************************************************************
2522 * *
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00002523 * Utilities *
2524 * *
2525 ************************************************************************/
/**
 * xmlBase64Decode:
 * @in:  the input buffer
 * @inlen:  the size of the input (in), the size read from it (out)
 * @to:  the output buffer
 * @tolen:  the size of the output (in), the size written to (out)
 *
 * Base64 decoder, reads from @in and save in @to. Characters outside
 * of the Base64 alphabet are skipped; '.' is decoded as the value 0.
 * On return *@inlen is the offset just past the last complete group
 * that was decoded (plus any ignorable characters following it), so a
 * caller can resume from there with more data.
 *
 * A group is only written when strictly more than 3 bytes remain free
 * in @to.
 *
 * TODO: tell jody when this is actually exported
 *
 * Returns 1 if the whole input was scanned without meeting the '='
 *         padding, 0 if the end of the Base64 stream ('=') was reached
 *         and the final group decoded, 2 if there wasn't enough space
 *         on the output, or -1 in case of error.
 */
static int
xmlBase64Decode(const unsigned char *in, unsigned long *inlen,
                unsigned char *to, unsigned long *tolen) {
    unsigned long incur;        /* current index in in[] */
    unsigned long inblk;        /* last block index in in[] */
    unsigned long outcur;       /* current index in out[] */
    unsigned long inmax;        /* size of in[] */
    unsigned long outmax;       /* size of out[] */
    unsigned char cur;          /* the current value read from in[] */
    /* one full group is 4 input sextets producing 3 output bytes */
    unsigned char intmp[4] = { 0, 0, 0, 0 };
    unsigned char outtmp[3];
    int nbintmp;                /* number of byte in intmp[] */
    int is_ignore;              /* cur should be ignored */
    int is_end = 0;             /* the end of the base64 was found */
    int retval = 1;
    int i;

    if ((in == NULL) || (inlen == NULL) || (to == NULL) || (tolen == NULL))
        return(-1);

    incur = 0;
    inblk = 0;
    outcur = 0;
    inmax = *inlen;
    outmax = *tolen;
    nbintmp = 0;

    while (1) {
        if (incur >= inmax)
            break;
        cur = in[incur++];
        is_ignore = 0;
        if ((cur >= 'A') && (cur <= 'Z'))
            cur = cur - 'A';
        else if ((cur >= 'a') && (cur <= 'z'))
            cur = cur - 'a' + 26;
        else if ((cur >= '0') && (cur <= '9'))
            cur = cur - '0' + 52;
        else if (cur == '+')
            cur = 62;
        else if (cur == '/')
            cur = 63;
        else if (cur == '.')
            cur = 0;
        else if (cur == '=') /*no op , end of the base64 stream */
            is_end = 1;
        else {
            is_ignore = 1;
            /* between groups, ignorable input counts as consumed */
            if (nbintmp == 0)
                inblk = incur;
        }

        if (!is_ignore) {
            int nbouttmp = 3;
            int is_break = 0;

            if (is_end) {
                if (nbintmp == 0)
                    break;
                if ((nbintmp == 1) || (nbintmp == 2))
                    nbouttmp = 1;
                else
                    nbouttmp = 2;
                /* missing sextets must not leak data from a prior group */
                for (i = nbintmp; i < 3; i++)
                    intmp[i] = 0;
                nbintmp = 3;
                is_break = 1;
            }
            intmp[nbintmp++] = cur;
            /*
             * if intmp is full, push the 4byte sequence as a 3 byte
             * sequence out
             */
            if (nbintmp == 4) {
                nbintmp = 0;
                outtmp[0] = (unsigned char)
                    ((intmp[0] << 2) | ((intmp[1] & 0x30) >> 4));
                outtmp[1] = (unsigned char)
                    (((intmp[1] & 0x0F) << 4) | ((intmp[2] & 0x3C) >> 2));
                outtmp[2] = (unsigned char)
                    (((intmp[2] & 0x03) << 6) | (intmp[3] & 0x3F));
                if (outcur + 3 >= outmax) {
                    retval = 2;
                    break;
                }

                for (i = 0; i < nbouttmp; i++)
                    to[outcur++] = outtmp[i];
                inblk = incur;
            }

            if (is_break) {
                retval = 0;
                break;
            }
        }
    }

    *tolen = outcur;
    *inlen = inblk;
    return (retval);
}
2636
/*
 * Test routine for the xmlBase64Decode function (compiled out).
 *
 * Decodes the same input three ways: in one call, with a small output
 * buffer per call, and with a small input window per call. The three
 * results printed should be identical.
 */
#if 0
int main(int argc, char **argv) {
    const char *input = " VW4 gcGV0 \n aXQgdGVzdCAuCg== ";
    const unsigned char *bytes = (const unsigned char *) input;
    unsigned char output[100];
    unsigned char output2[100];
    unsigned char output3[100];
    unsigned long inlen = strlen(input);
    unsigned long outlen = 100;
    int ret;
    unsigned long cons, tmp, tmp2, prod;

    /*
     * Direct
     */
    ret = xmlBase64Decode(bytes, &inlen, output, &outlen);

    output[outlen] = 0;
    printf("ret: %d, inlen: %lu , outlen: %lu, output: '%s'\n", ret, inlen, outlen, output);

    /*
     * output chunking
     */
    cons = 0;
    prod = 0;
    while (cons < inlen) {
        tmp = 5;
        tmp2 = inlen - cons;

        printf("%lu %lu\n", cons, prod);
        ret = xmlBase64Decode(&bytes[cons], &tmp2, &output2[prod], &tmp);
        cons += tmp2;
        prod += tmp;
        printf("%lu %lu\n", cons, prod);
        if (tmp2 == 0)
            break;      /* no input consumed: avoid spinning forever */
    }
    /* terminate at what this pass produced, not at the direct length */
    output2[prod] = 0;
    printf("ret: %d, cons: %lu , prod: %lu, output: '%s'\n", ret, cons, prod, output2);

    /*
     * input chunking
     */
    cons = 0;
    prod = 0;
    while (cons < inlen) {
        tmp = 100 - prod;
        tmp2 = inlen - cons;
        if (tmp2 > 5)
            tmp2 = 5;

        printf("%lu %lu\n", cons, prod);
        ret = xmlBase64Decode(&bytes[cons], &tmp2, &output3[prod], &tmp);
        cons += tmp2;
        prod += tmp;
        printf("%lu %lu\n", cons, prod);
        if (tmp2 == 0)
            break;      /* no input consumed: avoid spinning forever */
    }
    output3[prod] = 0;
    printf("ret: %d, cons: %lu , prod: %lu, output: '%s'\n", ret, cons, prod, output3);
    return(0);

}
#endif