blob: 8621c701a8662fa87873e3f46f28d855fc8799e5 [file] [log] [blame]
/*
 * xmlreader.c: implements the xmlTextReader streaming node API
 *
 * NOTE:
 *   The XmlTextReader.Normalization property won't be supported, since
 *   it makes the parser non-compliant with the XML recommendation.
 *
 * See Copyright for the status of this software.
 *
 * daniel@veillard.com
 */
12
/*
 * TODOs:
 *   - provide an API to expand part of the tree
 *   - provide an API to preserve part of the tree
 *   - Streaming XInclude support
 *   - validation against a provided DTD
 *   - XML Schemas validation
 *   - setting(s) for NoBlanks
 *   - performance and tuning ...
 */
Daniel Veillarde1ca5032002-12-09 14:13:43 +000023#define IN_LIBXML
24#include "libxml.h"
25
26#include <string.h> /* for memset() only ! */
Daniel Veillard26f70262003-01-16 22:45:08 +000027#include <stdarg.h>
Daniel Veillarde1ca5032002-12-09 14:13:43 +000028
29#ifdef HAVE_CTYPE_H
30#include <ctype.h>
31#endif
32#ifdef HAVE_STDLIB_H
33#include <stdlib.h>
34#endif
35
36#include <libxml/xmlmemory.h>
37#include <libxml/xmlIO.h>
38#include <libxml/xmlreader.h>
39
40/* #define DEBUG_CALLBACKS */
41/* #define DEBUG_READER */
42
/**
 * TODO:
 *
 * Flags an unimplemented code path: reports the source file and line of
 * the expansion site through xmlGenericError().
 *
 * The expansion already ends with a semicolon, so call sites in this
 * file write a bare "TODO" on its own line.
 */
#define TODO                                                    \
    xmlGenericError(xmlGenericErrorContext,                     \
                    "Unimplemented block at %s:%d\n",           \
                    __FILE__, __LINE__);
52
/*
 * DUMP_READER: when DEBUG_READER is defined, dumps the reader state via
 * xmlTextReaderDebug(); otherwise expands to nothing.  It relies on a
 * variable named "reader" being in scope where it is used.
 */
#ifndef DEBUG_READER
#define DUMP_READER
#else
#define DUMP_READER xmlTextReaderDebug(reader);
#endif
58
/************************************************************************
 *                                                                      *
 *      The parser: maps the Text Reader API on top of the existing    *
 *              parsing routines building a tree                       *
 *                                                                      *
 ************************************************************************/
65
/*
 * Flag values naming reader sub-objects.
 * NOTE(review): presumably combined into _xmlTextReader.allocs to record
 * which objects the reader owns; the code using them is not visible in
 * this part of the file -- confirm.
 */
#define XML_TEXTREADER_INPUT    1
#define XML_TEXTREADER_CTXT     2
68
/*
 * xmlTextReaderMode: values kept in _xmlTextReader.mode and handed back
 * by xmlTextReaderReadState().
 *
 * Note that XML_TEXTREADER_MODE_READING shares the numeric value 5 with
 * XML_TEXTREADER_DONE from xmlTextReaderState, which parts of this file
 * also store in the mode field.
 */
typedef enum {
    XML_TEXTREADER_MODE_INITIAL     = 0,  /* xmlTextReaderRead() not called yet */
    XML_TEXTREADER_MODE_INTERACTIVE = 1,  /* set by the first xmlTextReaderRead() */
    XML_TEXTREADER_MODE_ERROR       = 2,
    XML_TEXTREADER_MODE_EOF         = 3,  /* the input could not be refilled */
    XML_TEXTREADER_MODE_CLOSED      = 4,
    XML_TEXTREADER_MODE_READING     = 5
} xmlTextReaderMode;
77
/*
 * xmlTextReaderState: position of the reader relative to the current
 * node, kept in _xmlTextReader.state.
 */
typedef enum {
    XML_TEXTREADER_NONE      = -1, /* waiting for a SAX callback while pushing data */
    XML_TEXTREADER_START     = 0,
    XML_TEXTREADER_ELEMENT   = 1,  /* positioned on a newly reached node */
    XML_TEXTREADER_END       = 2,  /* reporting the end of an element */
    XML_TEXTREADER_EMPTY     = 3,
    XML_TEXTREADER_BACKTRACK = 4,  /* moved back up to a parent node */
    XML_TEXTREADER_DONE      = 5
} xmlTextReaderState;
87
88struct _xmlTextReader {
89 int mode; /* the parsing mode */
90 int allocs; /* what structure were deallocated */
91 xmlTextReaderState state;
92 xmlParserCtxtPtr ctxt; /* the parser context */
93 xmlSAXHandlerPtr sax; /* the parser SAX callbacks */
94 xmlParserInputBufferPtr input; /* the input */
95 startElementSAXFunc startElement;/* initial SAX callbacks */
96 endElementSAXFunc endElement; /* idem */
Daniel Veillardea7751d2002-12-20 00:16:24 +000097 charactersSAXFunc characters;
98 cdataBlockSAXFunc cdataBlock;
Daniel Veillarde1ca5032002-12-09 14:13:43 +000099 unsigned int base; /* base of the segment in the input */
100 unsigned int cur; /* current position in the input */
101 xmlNodePtr node; /* current node */
Daniel Veillardda46d2d2002-12-15 23:36:49 +0000102 xmlNodePtr curnode;/* current attribute node */
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000103 int depth; /* depth of the current node */
Daniel Veillardbeb70bd2002-12-18 14:53:54 +0000104 xmlNodePtr faketext;/* fake xmlNs chld */
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000105
106 /* entity stack when traversing entities content */
107 xmlNodePtr ent; /* Current Entity Ref Node */
108 int entNr; /* Depth of the entities stack */
109 int entMax; /* Max depth of the entities stack */
110 xmlNodePtr *entTab; /* array of entities */
Daniel Veillard26f70262003-01-16 22:45:08 +0000111
112 /* error handling */
113 xmlTextReaderErrorFunc errorFunc; /* callback function */
114 void *errorFuncArg; /* callback function user argument */
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000115};
116
/*
 * Marker stored in a node's _private field by xmlTextReaderStartElement()
 * when the element was written as an empty tag; xmlTextReaderRead()
 * recognizes it by comparing the pointer, not the text.
 */
static const char *xmlTextReaderIsEmpty =
    "This element is empty";
118
#ifdef DEBUG_READER
/*
 * xmlTextReaderDebug:
 * @reader:  the xmlTextReaderPtr to dump
 *
 * Debugging aid (compiled only with DEBUG_READER): prints the reader
 * state, depth, current node name, input offsets and parser depth on
 * stderr, followed by the not yet consumed input when
 * LIBXML_DEBUG_ENABLED is set.
 */
static void
xmlTextReaderDebug(xmlTextReaderPtr reader) {
    if ((reader == NULL) || (reader->ctxt == NULL)) {
        fprintf(stderr, "xmlTextReader NULL\n");
        return;
    }
    fprintf(stderr, "xmlTextReader: state %d depth %d ",
            (int) reader->state, reader->depth);
    if (reader->node == NULL) {
        fprintf(stderr, "node = NULL\n");
    } else {
        fprintf(stderr, "node %s\n", reader->node->name);
    }
    /* base and cur are unsigned int, hence %u rather than %d */
    fprintf(stderr, " input: base %u, cur %u, depth %d: ",
            reader->base, reader->cur, reader->ctxt->nodeNr);
    /* a reader without input has no buffer to show either */
    if ((reader->input == NULL) || (reader->input->buffer == NULL)) {
        fprintf(stderr, "buffer is NULL\n");
    } else {
#ifdef LIBXML_DEBUG_ENABLED
        xmlDebugDumpString(stderr,
                &reader->input->buffer->content[reader->cur]);
#endif
        fprintf(stderr, "\n");
    }
}
#endif
146
147/**
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000148 * xmlTextReaderEntPush:
149 * @reader: the xmlTextReaderPtr used
150 * @value: the entity reference node
151 *
152 * Pushes a new entity reference node on top of the entities stack
153 *
154 * Returns 0 in case of error, the index in the stack otherwise
155 */
156static int
157xmlTextReaderEntPush(xmlTextReaderPtr reader, xmlNodePtr value)
158{
159 if (reader->entMax <= 0) {
160 reader->entMax = 10;
161 reader->entTab = (xmlNodePtr *) xmlMalloc(reader->entMax *
162 sizeof(reader->entTab[0]));
163 if (reader->entTab == NULL) {
164 xmlGenericError(xmlGenericErrorContext, "xmlMalloc failed !\n");
165 return (0);
166 }
167 }
168 if (reader->entNr >= reader->entMax) {
169 reader->entMax *= 2;
170 reader->entTab =
171 (xmlNodePtr *) xmlRealloc(reader->entTab,
172 reader->entMax *
173 sizeof(reader->entTab[0]));
174 if (reader->entTab == NULL) {
175 xmlGenericError(xmlGenericErrorContext, "xmlRealloc failed !\n");
176 return (0);
177 }
178 }
179 reader->entTab[reader->entNr] = value;
180 reader->ent = value;
181 return (reader->entNr++);
182}
183
184/**
185 * xmlTextReaderEntPop:
186 * @reader: the xmlTextReaderPtr used
187 *
188 * Pops the top element entity from the entities stack
189 *
190 * Returns the entity just removed
191 */
192static xmlNodePtr
193xmlTextReaderEntPop(xmlTextReaderPtr reader)
194{
195 xmlNodePtr ret;
196
197 if (reader->entNr <= 0)
198 return (0);
199 reader->entNr--;
200 if (reader->entNr > 0)
201 reader->ent = reader->entTab[reader->entNr - 1];
202 else
203 reader->ent = NULL;
204 ret = reader->entTab[reader->entNr];
205 reader->entTab[reader->entNr] = 0;
206 return (ret);
207}
208
209/**
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000210 * xmlTextReaderStartElement:
211 * @ctx: the user data (XML parser context)
212 * @fullname: The element name, including namespace prefix
213 * @atts: An array of name/value attributes pairs, NULL terminated
214 *
215 * called when an opening tag has been processed.
216 */
217static void
218xmlTextReaderStartElement(void *ctx, const xmlChar *fullname,
219 const xmlChar **atts) {
220 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
Daniel Veillardd5896142002-12-31 14:45:26 +0000221 xmlParserCtxtPtr origctxt;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000222 xmlTextReaderPtr reader = ctxt->_private;
223
224#ifdef DEBUG_CALLBACKS
225 printf("xmlTextReaderStartElement(%s)\n", fullname);
226#endif
Daniel Veillardea7751d2002-12-20 00:16:24 +0000227 if ((reader != NULL) && (reader->startElement != NULL)) {
Daniel Veillardd5896142002-12-31 14:45:26 +0000228 /*
229 * when processing an entity, the context may have been changed
230 */
231 origctxt = reader->ctxt;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000232 reader->startElement(ctx, fullname, atts);
Daniel Veillard067bae52003-01-05 01:27:54 +0000233 if ((ctxt->node != NULL) && (ctxt->input != NULL) &&
234 (ctxt->input->cur != NULL) && (ctxt->input->cur[0] == '/') &&
235 (ctxt->input->cur[1] == '>'))
236 ctxt->node->_private = (void *) xmlTextReaderIsEmpty;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000237 }
Daniel Veillard9e395c22003-01-01 14:50:44 +0000238 if (reader != NULL)
239 reader->state = XML_TEXTREADER_ELEMENT;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000240}
241
242/**
243 * xmlTextReaderEndElement:
244 * @ctx: the user data (XML parser context)
245 * @fullname: The element name, including namespace prefix
246 *
247 * called when an ending tag has been processed.
248 */
249static void
250xmlTextReaderEndElement(void *ctx, const xmlChar *fullname) {
251 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
Daniel Veillardd5896142002-12-31 14:45:26 +0000252 xmlParserCtxtPtr origctxt;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000253 xmlTextReaderPtr reader = ctxt->_private;
254
255#ifdef DEBUG_CALLBACKS
256 printf("xmlTextReaderEndElement(%s)\n", fullname);
257#endif
Daniel Veillardea7751d2002-12-20 00:16:24 +0000258 if ((reader != NULL) && (reader->endElement != NULL)) {
Daniel Veillardd5896142002-12-31 14:45:26 +0000259 /*
260 * when processing an entity, the context may have been changed
261 */
262 origctxt = reader->ctxt;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000263
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000264 reader->endElement(ctx, fullname);
Daniel Veillardea7751d2002-12-20 00:16:24 +0000265 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000266}
267
268/**
Daniel Veillardea7751d2002-12-20 00:16:24 +0000269 * xmlTextReaderCharacters:
270 * @ctx: the user data (XML parser context)
271 * @ch: a xmlChar string
272 * @len: the number of xmlChar
273 *
274 * receiving some chars from the parser.
275 */
276static void
277xmlTextReaderCharacters(void *ctx, const xmlChar *ch, int len)
278{
279 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
Daniel Veillardd5896142002-12-31 14:45:26 +0000280 xmlParserCtxtPtr origctxt;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000281 xmlTextReaderPtr reader = ctxt->_private;
282
283#ifdef DEBUG_CALLBACKS
284 printf("xmlTextReaderCharacters()\n");
285#endif
286 if ((reader != NULL) && (reader->characters != NULL)) {
287 reader->characters(ctx, ch, len);
Daniel Veillardd5896142002-12-31 14:45:26 +0000288 /*
289 * when processing an entity, the context may have been changed
290 */
291 origctxt = reader->ctxt;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000292 }
293}
294
295/**
296 * xmlTextReaderCDataBlock:
297 * @ctx: the user data (XML parser context)
298 * @value: The pcdata content
299 * @len: the block length
300 *
301 * called when a pcdata block has been parsed
302 */
303static void
304xmlTextReaderCDataBlock(void *ctx, const xmlChar *ch, int len)
305{
306 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
307 xmlTextReaderPtr reader = ctxt->_private;
308
309#ifdef DEBUG_CALLBACKS
310 printf("xmlTextReaderCDataBlock()\n");
311#endif
312 if ((reader != NULL) && (reader->cdataBlock != NULL)) {
313 reader->cdataBlock(ctx, ch, len);
Daniel Veillardea7751d2002-12-20 00:16:24 +0000314 }
315}
316
317/**
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000318 * xmlTextReaderPushData:
319 * @reader: the xmlTextReaderPtr used
320 *
321 * Push data down the progressive parser until a significant callback
322 * got raised.
323 *
324 * Returns -1 in case of failure, 0 otherwise
325 */
326static int
327xmlTextReaderPushData(xmlTextReaderPtr reader) {
328 unsigned int cur = reader->cur;
329 xmlBufferPtr inbuf;
330 int val;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000331 int oldstate;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000332
333 if ((reader->input == NULL) || (reader->input->buffer == NULL))
334 return(-1);
335
Daniel Veillardea7751d2002-12-20 00:16:24 +0000336 oldstate = reader->state;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000337 reader->state = XML_TEXTREADER_NONE;
338 inbuf = reader->input->buffer;
339 while (reader->state == XML_TEXTREADER_NONE) {
340 if (cur >= inbuf->use) {
341 /*
342 * Refill the buffer unless we are at the end of the stream
343 */
344 if (reader->mode != XML_TEXTREADER_MODE_EOF) {
345 val = xmlParserInputBufferRead(reader->input, 4096);
346 if (val <= 0) {
347 reader->mode = XML_TEXTREADER_MODE_EOF;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000348 reader->state = oldstate;
Daniel Veillardaaa105b2002-12-30 11:42:17 +0000349 if ((oldstate != XML_TEXTREADER_START) ||
350 (reader->ctxt->myDoc != NULL))
351 return(val);
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000352 }
353 } else
354 break;
355 }
Daniel Veillard067bae52003-01-05 01:27:54 +0000356 /*
357 * parse by block of 512 bytes
358 */
359 if ((cur >= reader->cur + 512) || (cur >= inbuf->use)) {
360 if (cur < inbuf->use)
361 cur = cur + 1;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000362 val = xmlParseChunk(reader->ctxt,
363 (const char *) &inbuf->content[reader->cur],
364 cur - reader->cur, 0);
365 if (val != 0)
366 return(-1);
367 reader->cur = cur;
368 break;
369 } else {
370 cur = cur + 1;
371
372 /*
373 * One may have to force a flush at some point when parsing really
374 * large CDATA sections
375 */
376 if ((cur - reader->cur > 4096) && (reader->base == 0) &&
Daniel Veillard67df8092002-12-16 22:04:11 +0000377 (reader->mode == XML_TEXTREADER_MODE_INTERACTIVE)) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000378 cur = cur + 1;
379 val = xmlParseChunk(reader->ctxt,
380 (const char *) &inbuf->content[reader->cur],
381 cur - reader->cur, 0);
382 if (val != 0)
383 return(-1);
384 reader->cur = cur;
385 }
386 }
387 }
388 /*
389 * Discard the consumed input when needed and possible
390 */
Daniel Veillard67df8092002-12-16 22:04:11 +0000391 if (reader->mode == XML_TEXTREADER_MODE_INTERACTIVE) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000392 if ((reader->cur >= 4096) && (reader->base == 0)) {
393 val = xmlBufferShrink(inbuf, cur);
394 if (val >= 0) {
395 reader->cur -= val;
396 }
397 }
398 }
399
400 /*
401 * At the end of the stream signal that the work is done to the Push
402 * parser.
403 */
Daniel Veillardea7751d2002-12-20 00:16:24 +0000404 if (reader->mode == XML_TEXTREADER_MODE_EOF) {
405 if (reader->mode != XML_TEXTREADER_DONE) {
406 val = xmlParseChunk(reader->ctxt,
Daniel Veillard067bae52003-01-05 01:27:54 +0000407 (const char *) &inbuf->content[reader->cur],
408 cur - reader->cur, 1);
409 reader->cur = cur;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000410 reader->mode = XML_TEXTREADER_DONE;
411 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000412 }
Daniel Veillardea7751d2002-12-20 00:16:24 +0000413 reader->state = oldstate;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000414 return(0);
415}
416
417/**
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000418 * xmlTextReaderValidatePush:
419 * @reader: the xmlTextReaderPtr used
420 *
421 * Push the current node for validation
422 */
423static void
424xmlTextReaderValidatePush(xmlTextReaderPtr reader) {
Daniel Veillard0e298ad2003-02-04 16:14:33 +0000425#ifdef LIBXML_REGEXP_ENABLED
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000426 xmlNodePtr node = reader->node;
427
428 if ((node->ns == NULL) || (node->ns->prefix == NULL)) {
429 reader->ctxt->valid &= xmlValidatePushElement(&reader->ctxt->vctxt,
430 reader->ctxt->myDoc, node, node->name);
431 } else {
432 xmlChar *qname;
433
434 qname = xmlStrdup(node->ns->prefix);
435 qname = xmlStrcat(qname, BAD_CAST ":");
436 qname = xmlStrcat(qname, node->name);
437 reader->ctxt->valid &= xmlValidatePushElement(&reader->ctxt->vctxt,
438 reader->ctxt->myDoc, node, qname);
439 if (qname != NULL)
440 xmlFree(qname);
441 }
Daniel Veillard0e298ad2003-02-04 16:14:33 +0000442#endif /* LIBXML_REGEXP_ENABLED */
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000443}
444/**
445 * xmlTextReaderValidatePop:
446 * @reader: the xmlTextReaderPtr used
447 *
448 * Pop the current node from validation
449 */
450static void
451xmlTextReaderValidatePop(xmlTextReaderPtr reader) {
Daniel Veillard0e298ad2003-02-04 16:14:33 +0000452#ifdef LIBXML_REGEXP_ENABLED
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000453 xmlNodePtr node = reader->node;
454
455 if ((node->ns == NULL) || (node->ns->prefix == NULL)) {
456 reader->ctxt->valid &= xmlValidatePopElement(&reader->ctxt->vctxt,
457 reader->ctxt->myDoc, node, node->name);
458 } else {
459 xmlChar *qname;
460
461 qname = xmlStrdup(node->ns->prefix);
462 qname = xmlStrcat(qname, BAD_CAST ":");
463 qname = xmlStrcat(qname, node->name);
464 reader->ctxt->valid &= xmlValidatePopElement(&reader->ctxt->vctxt,
465 reader->ctxt->myDoc, node, qname);
466 if (qname != NULL)
467 xmlFree(qname);
468 }
Daniel Veillard0e298ad2003-02-04 16:14:33 +0000469#endif /* LIBXML_REGEXP_ENABLED */
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000470}
Daniel Veillarda80ff6e2003-01-03 12:52:08 +0000471/**
472 * xmlTextReaderValidateEntity:
473 * @reader: the xmlTextReaderPtr used
474 *
475 * Handle the validation when an entity reference is encountered and
476 * entity substitution is not activated. As a result the parser interface
477 * must walk through the entity and do the validation calls
478 */
479static void
480xmlTextReaderValidateEntity(xmlTextReaderPtr reader) {
Daniel Veillard0e298ad2003-02-04 16:14:33 +0000481#ifdef LIBXML_REGEXP_ENABLED
Daniel Veillarda80ff6e2003-01-03 12:52:08 +0000482 xmlNodePtr oldnode = reader->node;
483 xmlNodePtr node = reader->node;
484 xmlParserCtxtPtr ctxt = reader->ctxt;
485
486 do {
487 if (node->type == XML_ENTITY_REF_NODE) {
488 /*
489 * Case where the underlying tree is not availble, lookup the entity
490 * and walk it.
491 */
492 if ((node->children == NULL) && (ctxt->sax != NULL) &&
493 (ctxt->sax->getEntity != NULL)) {
494 node->children = (xmlNodePtr)
495 ctxt->sax->getEntity(ctxt, node->name);
496 }
497
498 if ((node->children != NULL) &&
499 (node->children->type == XML_ENTITY_DECL) &&
500 (node->children->children != NULL)) {
501 xmlTextReaderEntPush(reader, node);
502 node = node->children->children;
503 continue;
504 } else {
505 /*
506 * The error has probably be raised already.
507 */
508 if (node == oldnode)
509 break;
510 node = node->next;
511 }
512 } else if (node->type == XML_ELEMENT_NODE) {
513 reader->node = node;
514 xmlTextReaderValidatePush(reader);
515 } else if ((node->type == XML_TEXT_NODE) ||
516 (node->type == XML_CDATA_SECTION_NODE)) {
517 ctxt->valid &= xmlValidatePushCData(&ctxt->vctxt,
518 node->content, xmlStrlen(node->content));
519 }
520
521 /*
522 * go to next node
523 */
524 if (node->children != NULL) {
525 node = node->children;
526 continue;
527 }
528 if (node->next != NULL) {
529 node = node->next;
530 continue;
531 }
532 do {
533 node = node->parent;
534 if (node->type == XML_ELEMENT_NODE) {
535 reader->node = node;
536 xmlTextReaderValidatePop(reader);
537 }
538 if ((node->type == XML_ENTITY_DECL) &&
539 (reader->ent != NULL) && (reader->ent->children == node)) {
540 node = xmlTextReaderEntPop(reader);
541 }
542 if (node == oldnode)
543 break;
544 if (node->next != NULL) {
545 node = node->next;
546 break;
547 }
548 } while ((node != NULL) && (node != oldnode));
549 } while ((node != NULL) && (node != oldnode));
550 reader->node = oldnode;
Daniel Veillard0e298ad2003-02-04 16:14:33 +0000551#endif /* LIBXML_REGEXP_ENABLED */
Daniel Veillarda80ff6e2003-01-03 12:52:08 +0000552}
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000553
554
555/**
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000556 * xmlTextReaderRead:
557 * @reader: the xmlTextReaderPtr used
558 *
559 * Moves the position of the current instance to the next node in
560 * the stream, exposing its properties.
561 *
562 * Returns 1 if the node was read successfully, 0 if there is no more
563 * nodes to read, or -1 in case of error
564 */
565int
566xmlTextReaderRead(xmlTextReaderPtr reader) {
Daniel Veillard067bae52003-01-05 01:27:54 +0000567 int val, olddepth = 0;
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000568 xmlTextReaderState oldstate = 0;
569 xmlNodePtr oldnode = NULL;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000570
571 if ((reader == NULL) || (reader->ctxt == NULL))
572 return(-1);
573 if (reader->ctxt->wellFormed != 1)
574 return(-1);
575
576#ifdef DEBUG_READER
577 fprintf(stderr, "\nREAD ");
578 DUMP_READER
579#endif
Daniel Veillard29b3e282002-12-29 11:14:41 +0000580 reader->curnode = NULL;
Daniel Veillard67df8092002-12-16 22:04:11 +0000581 if (reader->mode == XML_TEXTREADER_MODE_INITIAL) {
582 reader->mode = XML_TEXTREADER_MODE_INTERACTIVE;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000583 /*
584 * Initial state
585 */
586 do {
587 val = xmlTextReaderPushData(reader);
588 if (val < 0)
589 return(-1);
590 } while ((reader->ctxt->node == NULL) &&
Daniel Veillard067bae52003-01-05 01:27:54 +0000591 ((reader->mode != XML_TEXTREADER_MODE_EOF) &&
592 (reader->mode != XML_TEXTREADER_DONE)));
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000593 if (reader->ctxt->node == NULL) {
Daniel Veillarddab8ea92003-01-02 14:16:45 +0000594 if (reader->ctxt->myDoc != NULL) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000595 reader->node = reader->ctxt->myDoc->children;
Daniel Veillarddab8ea92003-01-02 14:16:45 +0000596 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000597 if (reader->node == NULL)
598 return(-1);
Daniel Veillarddab8ea92003-01-02 14:16:45 +0000599 reader->state = XML_TEXTREADER_ELEMENT;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000600 } else {
Daniel Veillard48ef4c92003-03-22 12:38:15 +0000601 if (reader->ctxt->myDoc != NULL) {
602 reader->node = reader->ctxt->myDoc->children;
603 }
604 if (reader->node == NULL)
605 reader->node = reader->ctxt->nodeTab[0];
Daniel Veillarde59494f2003-01-04 16:35:29 +0000606 reader->state = XML_TEXTREADER_ELEMENT;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000607 }
Daniel Veillard4d8db8a2002-12-30 18:40:42 +0000608 reader->depth = 0;
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000609 goto node_found;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000610 }
611 oldstate = reader->state;
612 olddepth = reader->ctxt->nodeNr;
613 oldnode = reader->node;
Daniel Veillarddf512f42002-12-23 15:56:21 +0000614
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000615get_next_node:
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000616 /*
617 * If we are not backtracking on ancestors or examined nodes,
618 * that the parser didn't finished or that we arent at the end
619 * of stream, continue processing.
620 */
Daniel Veillardea7751d2002-12-20 00:16:24 +0000621 while (((oldstate == XML_TEXTREADER_BACKTRACK) ||
622 (reader->node->children == NULL) ||
623 (reader->node->type == XML_ENTITY_REF_NODE) ||
Daniel Veillard4dbe77a2003-01-14 00:17:42 +0000624 (reader->node->type == XML_DTD_NODE) ||
625 (reader->node->type == XML_DOCUMENT_NODE) ||
626 (reader->node->type == XML_HTML_DOCUMENT_NODE)) &&
Daniel Veillardea7751d2002-12-20 00:16:24 +0000627 (reader->node->next == NULL) &&
Daniel Veillard4dbe77a2003-01-14 00:17:42 +0000628 ((reader->ctxt->node == NULL) ||
629 (reader->ctxt->node == reader->node) ||
630 (reader->ctxt->node == reader->node->parent)) &&
Daniel Veillardea7751d2002-12-20 00:16:24 +0000631 (reader->ctxt->nodeNr == olddepth) &&
632 (reader->ctxt->instate != XML_PARSER_EOF)) {
633 val = xmlTextReaderPushData(reader);
634 if (val < 0)
635 return(-1);
636 if (reader->node == NULL)
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000637 goto node_end;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000638 }
Daniel Veillard120e8eb2003-03-22 01:00:34 +0000639 /*
640 * If we are in the middle of a piece of CDATA make sure it's finished
641 * Maybe calling a function checking that a non-character() callback was
642 * received would be cleaner for the loop exit.
643 */
644 if ((oldstate == XML_TEXTREADER_ELEMENT) &&
645 (reader->ctxt->instate == XML_PARSER_CDATA_SECTION)) {
646 while ((reader->ctxt->instate == XML_PARSER_CDATA_SECTION) &&
647 (((reader->node->content == NULL) &&
648 (reader->node->next != NULL) &&
649 (reader->node->next->type == XML_CDATA_SECTION_NODE) &&
650 (reader->node->next->next == NULL) &&
651 (reader->node->parent->next == NULL)) ||
652 ((reader->node->children != NULL) &&
653 (reader->node->children->type == XML_CDATA_SECTION_NODE) &&
654 (reader->node->children->next == NULL) &&
655 (reader->node->children->next == NULL)))) {
656 val = xmlTextReaderPushData(reader);
657 if (val < 0)
658 return(-1);
659 }
660 }
661 if ((oldstate == XML_TEXTREADER_ELEMENT) &&
662 (reader->ctxt->instate == XML_PARSER_CONTENT)) {
663 while ((reader->ctxt->instate == XML_PARSER_CONTENT) &&
664 (((reader->node->content == NULL) &&
665 (reader->node->next != NULL) &&
666 (reader->node->next->type == XML_TEXT_NODE) &&
667 (reader->node->next->next == NULL) &&
668 (reader->node->parent->next == NULL)) ||
669 ((reader->node->children != NULL) &&
670 (reader->node->children->type == XML_TEXT_NODE) &&
671 (reader->node->children->next == NULL) &&
672 (reader->node->children->next == NULL)))) {
673 val = xmlTextReaderPushData(reader);
674 if (val < 0)
675 return(-1);
676 }
677 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000678 if (oldstate != XML_TEXTREADER_BACKTRACK) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000679 if ((reader->node->children != NULL) &&
680 (reader->node->type != XML_ENTITY_REF_NODE) &&
681 (reader->node->type != XML_DTD_NODE)) {
682 reader->node = reader->node->children;
683 reader->depth++;
Daniel Veillarddf512f42002-12-23 15:56:21 +0000684 reader->state = XML_TEXTREADER_ELEMENT;
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000685 goto node_found;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000686 }
687 }
688 if (reader->node->next != NULL) {
689 if ((oldstate == XML_TEXTREADER_ELEMENT) &&
Daniel Veillarddf512f42002-12-23 15:56:21 +0000690 (reader->node->type == XML_ELEMENT_NODE) &&
Daniel Veillard067bae52003-01-05 01:27:54 +0000691 (reader->node->children == NULL) &&
692 (reader->node->_private != (void *)xmlTextReaderIsEmpty)) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000693 reader->state = XML_TEXTREADER_END;
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000694 goto node_found;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000695 }
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000696 if ((reader->ctxt->validate) &&
697 (reader->node->type == XML_ELEMENT_NODE))
698 xmlTextReaderValidatePop(reader);
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000699 reader->node = reader->node->next;
700 reader->state = XML_TEXTREADER_ELEMENT;
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000701
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000702 /*
703 * Cleanup of the old node
704 */
Daniel Veillard4dbe77a2003-01-14 00:17:42 +0000705 if ((reader->node->prev != NULL) &&
706 (reader->node->prev->type != XML_DTD_NODE)) {
707 xmlNodePtr tmp = reader->node->prev;
708 xmlUnlinkNode(tmp);
709 xmlFreeNode(tmp);
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000710 }
711
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000712 goto node_found;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000713 }
Daniel Veillardea7751d2002-12-20 00:16:24 +0000714 if ((oldstate == XML_TEXTREADER_ELEMENT) &&
Daniel Veillard571b8892002-12-30 12:37:59 +0000715 (reader->node->type == XML_ELEMENT_NODE) &&
Daniel Veillard067bae52003-01-05 01:27:54 +0000716 (reader->node->children == NULL) &&
717 (reader->node->_private != (void *)xmlTextReaderIsEmpty)) {
Daniel Veillardea7751d2002-12-20 00:16:24 +0000718 reader->state = XML_TEXTREADER_END;
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000719 goto node_found;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000720 }
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000721 if ((reader->ctxt->validate) && (reader->node->type == XML_ELEMENT_NODE))
722 xmlTextReaderValidatePop(reader);
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000723 reader->node = reader->node->parent;
724 if ((reader->node == NULL) ||
725 (reader->node->type == XML_DOCUMENT_NODE) ||
726#ifdef LIBXML_DOCB_ENABLED
727 (reader->node->type == XML_DOCB_DOCUMENT_NODE) ||
728#endif
729 (reader->node->type == XML_HTML_DOCUMENT_NODE)) {
Daniel Veillardea7751d2002-12-20 00:16:24 +0000730 if (reader->mode != XML_TEXTREADER_DONE) {
731 val = xmlParseChunk(reader->ctxt, "", 0, 1);
732 reader->mode = XML_TEXTREADER_DONE;
733 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000734 reader->node = NULL;
Daniel Veillard4d8db8a2002-12-30 18:40:42 +0000735 reader->depth = -1;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000736
737 /*
738 * Cleanup of the old node
739 */
740 if (oldnode->type != XML_DTD_NODE) {
741 xmlUnlinkNode(oldnode);
742 xmlFreeNode(oldnode);
743 }
744
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000745 goto node_end;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000746 }
747 reader->depth--;
748 reader->state = XML_TEXTREADER_BACKTRACK;
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000749
750node_found:
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000751 DUMP_READER
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000752
753 /*
Daniel Veillarda80ff6e2003-01-03 12:52:08 +0000754 * Handle entities enter and exit when in entity replacement mode
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000755 */
756 if ((reader->node != NULL) &&
757 (reader->node->type == XML_ENTITY_REF_NODE) &&
758 (reader->ctxt != NULL) && (reader->ctxt->replaceEntities == 1)) {
759 /*
760 * Case where the underlying tree is not availble, lookup the entity
761 * and walk it.
762 */
763 if ((reader->node->children == NULL) && (reader->ctxt->sax != NULL) &&
764 (reader->ctxt->sax->getEntity != NULL)) {
765 reader->node->children = (xmlNodePtr)
766 reader->ctxt->sax->getEntity(reader->ctxt, reader->node->name);
767 }
768
769 if ((reader->node->children != NULL) &&
770 (reader->node->children->type == XML_ENTITY_DECL) &&
771 (reader->node->children->children != NULL)) {
772 xmlTextReaderEntPush(reader, reader->node);
773 reader->node = reader->node->children->children;
774 }
Daniel Veillarda80ff6e2003-01-03 12:52:08 +0000775 } else if ((reader->node != NULL) &&
776 (reader->node->type == XML_ENTITY_REF_NODE) &&
777 (reader->ctxt != NULL) && (reader->ctxt->validate == 1)) {
778 xmlTextReaderValidateEntity(reader);
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000779 }
780 if ((reader->node != NULL) &&
781 (reader->node->type == XML_ENTITY_DECL) &&
782 (reader->ent != NULL) && (reader->ent->children == reader->node)) {
783 reader->node = xmlTextReaderEntPop(reader);
784 reader->depth++;
785 goto get_next_node;
786 }
Daniel Veillard0e298ad2003-02-04 16:14:33 +0000787#ifdef LIBXML_REGEXP_ENABLED
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000788 if ((reader->ctxt->validate) && (reader->node != NULL)) {
789 xmlNodePtr node = reader->node;
790 xmlParserCtxtPtr ctxt = reader->ctxt;
791
792 if ((node->type == XML_ELEMENT_NODE) &&
793 ((reader->state != XML_TEXTREADER_END) &&
794 (reader->state != XML_TEXTREADER_BACKTRACK))) {
795 xmlTextReaderValidatePush(reader);
796 } else if ((node->type == XML_TEXT_NODE) ||
797 (node->type == XML_CDATA_SECTION_NODE)) {
798 ctxt->valid &= xmlValidatePushCData(&ctxt->vctxt,
799 node->content, xmlStrlen(node->content));
800 }
801 }
Daniel Veillard0e298ad2003-02-04 16:14:33 +0000802#endif /* LIBXML_REGEXP_ENABLED */
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000803 return(1);
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000804node_end:
805 return(0);
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000806}
807
Daniel Veillard67df8092002-12-16 22:04:11 +0000808/**
809 * xmlTextReaderReadState:
810 * @reader: the xmlTextReaderPtr used
811 *
812 * Gets the read state of the reader.
813 *
814 * Returns the state value, or -1 in case of error
815 */
816int
817xmlTextReaderReadState(xmlTextReaderPtr reader) {
818 if (reader == NULL)
819 return(-1);
820 return(reader->mode);
821}
822
823/**
824 * xmlTextReaderReadInnerXml:
825 * @reader: the xmlTextReaderPtr used
826 *
827 * Reads the contents of the current node, including child nodes and markup.
828 *
829 * Returns a string containing the XML content, or NULL if the current node
830 * is neither an element nor attribute, or has no child nodes. The
831 * string must be deallocated by the caller.
832 */
833xmlChar *
834xmlTextReaderReadInnerXml(xmlTextReaderPtr reader) {
835 TODO
836 return(NULL);
837}
838
839/**
840 * xmlTextReaderReadOuterXml:
841 * @reader: the xmlTextReaderPtr used
842 *
843 * Reads the contents of the current node, including child nodes and markup.
844 *
845 * Returns a string containing the XML content, or NULL if the current node
846 * is neither an element nor attribute, or has no child nodes. The
847 * string must be deallocated by the caller.
848 */
849xmlChar *
850xmlTextReaderReadOuterXml(xmlTextReaderPtr reader) {
851 TODO
852 return(NULL);
853}
854
855/**
856 * xmlTextReaderReadString:
857 * @reader: the xmlTextReaderPtr used
858 *
859 * Reads the contents of an element or a text node as a string.
860 *
861 * Returns a string containing the contents of the Element or Text node,
862 * or NULL if the reader is positioned on any other type of node.
863 * The string must be deallocated by the caller.
864 */
865xmlChar *
866xmlTextReaderReadString(xmlTextReaderPtr reader) {
867 TODO
868 return(NULL);
869}
870
Daniel Veillardbeb70bd2002-12-18 14:53:54 +0000871/**
872 * xmlTextReaderReadBase64:
873 * @reader: the xmlTextReaderPtr used
874 * @array: a byte array to store the content.
875 * @offset: the zero-based index into array where the method should
876 * begin to write.
877 * @len: the number of bytes to write.
878 *
879 * Reads and decodes the Base64 encoded contents of an element and
880 * stores the result in a byte buffer.
881 *
882 * Returns the number of bytes written to array, or zero if the current
883 * instance is not positioned on an element or -1 in case of error.
884 */
885int
886xmlTextReaderReadBase64(xmlTextReaderPtr reader, unsigned char *array,
887 int offset, int len) {
888 if ((reader == NULL) || (reader->ctxt == NULL))
889 return(-1);
890 if (reader->ctxt->wellFormed != 1)
891 return(-1);
892
893 if ((reader->node == NULL) || (reader->node->type == XML_ELEMENT_NODE))
894 return(0);
895 TODO
896 return(0);
897}
898
899/**
900 * xmlTextReaderReadBinHex:
901 * @reader: the xmlTextReaderPtr used
902 * @array: a byte array to store the content.
903 * @offset: the zero-based index into array where the method should
904 * begin to write.
905 * @len: the number of bytes to write.
906 *
907 * Reads and decodes the BinHex encoded contents of an element and
908 * stores the result in a byte buffer.
909 *
910 * Returns the number of bytes written to array, or zero if the current
911 * instance is not positioned on an element or -1 in case of error.
912 */
913int
914xmlTextReaderReadBinHex(xmlTextReaderPtr reader, unsigned char *array,
915 int offset, int len) {
916 if ((reader == NULL) || (reader->ctxt == NULL))
917 return(-1);
918 if (reader->ctxt->wellFormed != 1)
919 return(-1);
920
921 if ((reader->node == NULL) || (reader->node->type == XML_ELEMENT_NODE))
922 return(0);
923 TODO
924 return(0);
925}
926
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000927/************************************************************************
928 * *
929 * Constructor and destructors *
930 * *
931 ************************************************************************/
932/**
933 * xmlNewTextReader:
934 * @input: the xmlParserInputBufferPtr used to read data
Daniel Veillardea7751d2002-12-20 00:16:24 +0000935 * @URI: the URI information for the source if available
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000936 *
937 * Create an xmlTextReader structure fed with @input
938 *
939 * Returns the new xmlTextReaderPtr or NULL in case of error
940 */
941xmlTextReaderPtr
Daniel Veillardea7751d2002-12-20 00:16:24 +0000942xmlNewTextReader(xmlParserInputBufferPtr input, const char *URI) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000943 xmlTextReaderPtr ret;
944 int val;
945
946 if (input == NULL)
947 return(NULL);
948 ret = xmlMalloc(sizeof(xmlTextReader));
949 if (ret == NULL) {
950 xmlGenericError(xmlGenericErrorContext,
951 "xmlNewTextReader : malloc failed\n");
952 return(NULL);
953 }
954 memset(ret, 0, sizeof(xmlTextReader));
Daniel Veillard1fdfd112003-01-03 01:18:43 +0000955 ret->entTab = NULL;
956 ret->entMax = 0;
957 ret->entNr = 0;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000958 ret->input = input;
959 ret->sax = (xmlSAXHandler *) xmlMalloc(sizeof(xmlSAXHandler));
960 if (ret->sax == NULL) {
961 xmlFree(ret);
962 xmlGenericError(xmlGenericErrorContext,
963 "xmlNewTextReader : malloc failed\n");
964 return(NULL);
965 }
966 memcpy(ret->sax, &xmlDefaultSAXHandler, sizeof(xmlSAXHandler));
967 ret->startElement = ret->sax->startElement;
968 ret->sax->startElement = xmlTextReaderStartElement;
969 ret->endElement = ret->sax->endElement;
970 ret->sax->endElement = xmlTextReaderEndElement;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000971 ret->characters = ret->sax->characters;
972 ret->sax->characters = xmlTextReaderCharacters;
973 ret->cdataBlock = ret->sax->cdataBlock;
974 ret->sax->cdataBlock = xmlTextReaderCDataBlock;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000975
Daniel Veillard67df8092002-12-16 22:04:11 +0000976 ret->mode = XML_TEXTREADER_MODE_INITIAL;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000977 ret->node = NULL;
Daniel Veillardda46d2d2002-12-15 23:36:49 +0000978 ret->curnode = NULL;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000979 val = xmlParserInputBufferRead(input, 4);
980 if (val >= 4) {
981 ret->ctxt = xmlCreatePushParserCtxt(ret->sax, NULL,
Daniel Veillardea7751d2002-12-20 00:16:24 +0000982 (const char *) ret->input->buffer->content, 4, URI);
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000983 ret->base = 0;
984 ret->cur = 4;
985 } else {
Daniel Veillardea7751d2002-12-20 00:16:24 +0000986 ret->ctxt = xmlCreatePushParserCtxt(ret->sax, NULL, NULL, 0, URI);
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000987 ret->base = 0;
988 ret->cur = 0;
989 }
990 ret->ctxt->_private = ret;
Daniel Veillardea7751d2002-12-20 00:16:24 +0000991 ret->ctxt->linenumbers = 1;
Daniel Veillarde1ca5032002-12-09 14:13:43 +0000992 ret->allocs = XML_TEXTREADER_CTXT;
993 return(ret);
994
995}
996
997/**
998 * xmlNewTextReaderFilename:
999 * @URI: the URI of the resource to process
1000 *
1001 * Create an xmlTextReader structure fed with the resource at @URI
1002 *
1003 * Returns the new xmlTextReaderPtr or NULL in case of error
1004 */
1005xmlTextReaderPtr
1006xmlNewTextReaderFilename(const char *URI) {
1007 xmlParserInputBufferPtr input;
1008 xmlTextReaderPtr ret;
Daniel Veillardea7751d2002-12-20 00:16:24 +00001009 char *directory = NULL;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001010
1011 input = xmlParserInputBufferCreateFilename(URI, XML_CHAR_ENCODING_NONE);
1012 if (input == NULL)
1013 return(NULL);
Daniel Veillardea7751d2002-12-20 00:16:24 +00001014 ret = xmlNewTextReader(input, URI);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001015 if (ret == NULL) {
1016 xmlFreeParserInputBuffer(input);
1017 return(NULL);
1018 }
1019 ret->allocs |= XML_TEXTREADER_INPUT;
Daniel Veillardea7751d2002-12-20 00:16:24 +00001020 if (ret->ctxt->directory == NULL)
1021 directory = xmlParserGetDirectory(URI);
1022 if ((ret->ctxt->directory == NULL) && (directory != NULL))
1023 ret->ctxt->directory = (char *) xmlStrdup((xmlChar *) directory);
1024 if (directory != NULL)
1025 xmlFree(directory);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001026 return(ret);
1027}
1028
1029/**
1030 * xmlFreeTextReader:
1031 * @reader: the xmlTextReaderPtr
1032 *
1033 * Deallocate all the resources associated to the reader
1034 */
1035void
1036xmlFreeTextReader(xmlTextReaderPtr reader) {
1037 if (reader == NULL)
1038 return;
1039 if (reader->ctxt != NULL) {
1040 if (reader->ctxt->myDoc != NULL) {
1041 xmlFreeDoc(reader->ctxt->myDoc);
1042 reader->ctxt->myDoc = NULL;
1043 }
Daniel Veillard336fc7d2002-12-27 19:37:04 +00001044 if ((reader->ctxt->vctxt.vstateTab != NULL) &&
1045 (reader->ctxt->vctxt.vstateMax > 0)){
1046 xmlFree(reader->ctxt->vctxt.vstateTab);
1047 reader->ctxt->vctxt.vstateTab = 0;
1048 reader->ctxt->vctxt.vstateMax = 0;
1049 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001050 if (reader->allocs & XML_TEXTREADER_CTXT)
1051 xmlFreeParserCtxt(reader->ctxt);
1052 }
1053 if (reader->sax != NULL)
1054 xmlFree(reader->sax);
1055 if ((reader->input != NULL) && (reader->allocs & XML_TEXTREADER_INPUT))
1056 xmlFreeParserInputBuffer(reader->input);
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00001057 if (reader->faketext != NULL) {
1058 xmlFreeNode(reader->faketext);
1059 }
Daniel Veillard1fdfd112003-01-03 01:18:43 +00001060 if (reader->entTab != NULL)
1061 xmlFree(reader->entTab);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001062 xmlFree(reader);
1063}
1064
1065/************************************************************************
1066 * *
Daniel Veillard0eb38c72002-12-14 23:00:35 +00001067 * Methods for XmlTextReader *
1068 * *
1069 ************************************************************************/
1070/**
1071 * xmlTextReaderClose:
1072 * @reader: the xmlTextReaderPtr used
1073 *
1074 * This method releases any resources allocated by the current instance
1075 * changes the state to Closed and close any underlying input.
1076 *
1077 * Returns 0 or -1 in case of error
1078 */
1079int
1080xmlTextReaderClose(xmlTextReaderPtr reader) {
1081 if (reader == NULL)
1082 return(-1);
1083 reader->node = NULL;
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001084 reader->curnode = NULL;
Daniel Veillard0eb38c72002-12-14 23:00:35 +00001085 reader->mode = XML_TEXTREADER_MODE_CLOSED;
1086 if (reader->ctxt != NULL) {
1087 if (reader->ctxt->myDoc != NULL) {
1088 xmlFreeDoc(reader->ctxt->myDoc);
1089 reader->ctxt->myDoc = NULL;
1090 }
1091 if (reader->allocs & XML_TEXTREADER_CTXT) {
1092 xmlFreeParserCtxt(reader->ctxt);
1093 reader->allocs -= XML_TEXTREADER_CTXT;
1094 }
1095 }
1096 if (reader->sax != NULL) {
1097 xmlFree(reader->sax);
1098 reader->sax = NULL;
1099 }
1100 if ((reader->input != NULL) && (reader->allocs & XML_TEXTREADER_INPUT)) {
1101 xmlFreeParserInputBuffer(reader->input);
1102 reader->allocs -= XML_TEXTREADER_INPUT;
1103 }
1104 return(0);
1105}
1106
1107/**
1108 * xmlTextReaderGetAttributeNo:
1109 * @reader: the xmlTextReaderPtr used
1110 * @no: the zero-based index of the attribute relative to the containing element
1111 *
1112 * Provides the value of the attribute with the specified index relative
1113 * to the containing element.
1114 *
1115 * Returns a string containing the value of the specified attribute, or NULL
1116 * in case of error. The string must be deallocated by the caller.
1117 */
1118xmlChar *
1119xmlTextReaderGetAttributeNo(xmlTextReaderPtr reader, int no) {
1120 xmlChar *ret;
1121 int i;
1122 xmlAttrPtr cur;
1123 xmlNsPtr ns;
1124
1125 if (reader == NULL)
1126 return(NULL);
1127 if (reader->node == NULL)
1128 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001129 if (reader->curnode != NULL)
1130 return(NULL);
Daniel Veillard0eb38c72002-12-14 23:00:35 +00001131 /* TODO: handle the xmlDecl */
1132 if (reader->node->type != XML_ELEMENT_NODE)
1133 return(NULL);
1134
1135 ns = reader->node->nsDef;
1136 for (i = 0;(i < no) && (ns != NULL);i++) {
1137 ns = ns->next;
1138 }
1139 if (ns != NULL)
1140 return(xmlStrdup(ns->href));
1141
1142 cur = reader->node->properties;
1143 if (cur == NULL)
1144 return(NULL);
1145 for (;i < no;i++) {
1146 cur = cur->next;
1147 if (cur == NULL)
1148 return(NULL);
1149 }
1150 /* TODO walk the DTD if present */
1151
1152 ret = xmlNodeListGetString(reader->node->doc, cur->children, 1);
1153 if (ret == NULL) return(xmlStrdup((xmlChar *)""));
1154 return(ret);
1155}
1156
1157/**
1158 * xmlTextReaderGetAttribute:
1159 * @reader: the xmlTextReaderPtr used
1160 * @name: the qualified name of the attribute.
1161 *
1162 * Provides the value of the attribute with the specified qualified name.
1163 *
1164 * Returns a string containing the value of the specified attribute, or NULL
1165 * in case of error. The string must be deallocated by the caller.
1166 */
1167xmlChar *
1168xmlTextReaderGetAttribute(xmlTextReaderPtr reader, const xmlChar *name) {
1169 xmlChar *prefix = NULL;
1170 xmlChar *localname;
1171 xmlNsPtr ns;
1172 xmlChar *ret = NULL;
1173
1174 if ((reader == NULL) || (name == NULL))
1175 return(NULL);
1176 if (reader->node == NULL)
1177 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001178 if (reader->curnode != NULL)
1179 return(NULL);
Daniel Veillard0eb38c72002-12-14 23:00:35 +00001180
1181 /* TODO: handle the xmlDecl */
1182 if (reader->node->type != XML_ELEMENT_NODE)
1183 return(NULL);
1184
1185 localname = xmlSplitQName2(name, &prefix);
1186 if (localname == NULL)
1187 return(xmlGetProp(reader->node, name));
1188
1189 ns = xmlSearchNs(reader->node->doc, reader->node, prefix);
1190 if (ns != NULL)
1191 ret = xmlGetNsProp(reader->node, localname, ns->href);
1192
1193 if (localname != NULL)
1194 xmlFree(localname);
1195 if (prefix != NULL)
1196 xmlFree(prefix);
1197 return(ret);
1198}
1199
1200
1201/**
1202 * xmlTextReaderGetAttributeNs:
1203 * @reader: the xmlTextReaderPtr used
1204 * @localName: the local name of the attribute.
1205 * @namespaceURI: the namespace URI of the attribute.
1206 *
1207 * Provides the value of the specified attribute
1208 *
1209 * Returns a string containing the value of the specified attribute, or NULL
1210 * in case of error. The string must be deallocated by the caller.
1211 */
1212xmlChar *
1213xmlTextReaderGetAttributeNs(xmlTextReaderPtr reader, const xmlChar *localName,
1214 const xmlChar *namespaceURI) {
1215 if ((reader == NULL) || (localName == NULL))
1216 return(NULL);
1217 if (reader->node == NULL)
1218 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001219 if (reader->curnode != NULL)
1220 return(NULL);
Daniel Veillard0eb38c72002-12-14 23:00:35 +00001221
1222 /* TODO: handle the xmlDecl */
1223 if (reader->node->type != XML_ELEMENT_NODE)
1224 return(NULL);
1225
1226 return(xmlGetNsProp(reader->node, localName, namespaceURI));
1227}
1228
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001229/**
1230 * xmlTextReaderGetRemainder:
1231 * @reader: the xmlTextReaderPtr used
1232 *
1233 * Method to get the remainder of the buffered XML. this method stops the
1234 * parser, set its state to End Of File and return the input stream with
1235 * what is left that the parser did not use.
1236 *
1237 * Returns the xmlParserInputBufferPtr attached to the XML or NULL
1238 * in case of error.
1239 */
1240xmlParserInputBufferPtr
1241xmlTextReaderGetRemainder(xmlTextReaderPtr reader) {
1242 xmlParserInputBufferPtr ret = NULL;
1243
1244 if (reader == NULL)
1245 return(NULL);
1246 if (reader->node == NULL)
1247 return(NULL);
1248
1249 reader->node = NULL;
1250 reader->curnode = NULL;
1251 reader->mode = XML_TEXTREADER_MODE_EOF;
1252 if (reader->ctxt != NULL) {
1253 if (reader->ctxt->myDoc != NULL) {
1254 xmlFreeDoc(reader->ctxt->myDoc);
1255 reader->ctxt->myDoc = NULL;
1256 }
1257 if (reader->allocs & XML_TEXTREADER_CTXT) {
1258 xmlFreeParserCtxt(reader->ctxt);
1259 reader->allocs -= XML_TEXTREADER_CTXT;
1260 }
1261 }
1262 if (reader->sax != NULL) {
1263 xmlFree(reader->sax);
1264 reader->sax = NULL;
1265 }
1266 if (reader->allocs & XML_TEXTREADER_INPUT) {
1267 ret = reader->input;
1268 reader->allocs -= XML_TEXTREADER_INPUT;
1269 } else {
1270 /*
1271 * Hum, one may need to duplicate the data structure because
1272 * without reference counting the input may be freed twice:
1273 * - by the layer which allocated it.
1274 * - by the layer to which would have been returned to.
1275 */
1276 TODO
1277 return(NULL);
1278 }
1279 return(ret);
1280}
1281
1282/**
1283 * xmlTextReaderLookupNamespace:
1284 * @reader: the xmlTextReaderPtr used
1285 * @prefix: the prefix whose namespace URI is to be resolved. To return
1286 * the default namespace, specify NULL
1287 *
1288 * Resolves a namespace prefix in the scope of the current element.
1289 *
1290 * Returns a string containing the namespace URI to which the prefix maps
1291 * or NULL in case of error. The string must be deallocated by the caller.
1292 */
1293xmlChar *
1294xmlTextReaderLookupNamespace(xmlTextReaderPtr reader, const xmlChar *prefix) {
1295 xmlNsPtr ns;
1296
1297 if (reader == NULL)
1298 return(NULL);
1299 if (reader->node == NULL)
1300 return(NULL);
1301
1302 ns = xmlSearchNs(reader->node->doc, reader->node, prefix);
1303 if (ns == NULL)
1304 return(NULL);
1305 return(xmlStrdup(ns->href));
1306}
1307
1308/**
1309 * xmlTextReaderMoveToAttributeNo:
1310 * @reader: the xmlTextReaderPtr used
1311 * @no: the zero-based index of the attribute relative to the containing
1312 * element.
1313 *
1314 * Moves the position of the current instance to the attribute with
1315 * the specified index relative to the containing element.
1316 *
1317 * Returns 1 in case of success, -1 in case of error, 0 if not found
1318 */
1319int
1320xmlTextReaderMoveToAttributeNo(xmlTextReaderPtr reader, int no) {
1321 int i;
1322 xmlAttrPtr cur;
1323 xmlNsPtr ns;
1324
1325 if (reader == NULL)
1326 return(-1);
1327 if (reader->node == NULL)
1328 return(-1);
1329 /* TODO: handle the xmlDecl */
1330 if (reader->node->type != XML_ELEMENT_NODE)
1331 return(-1);
1332
1333 reader->curnode = NULL;
1334
1335 ns = reader->node->nsDef;
1336 for (i = 0;(i < no) && (ns != NULL);i++) {
1337 ns = ns->next;
1338 }
1339 if (ns != NULL) {
1340 reader->curnode = (xmlNodePtr) ns;
1341 return(1);
1342 }
1343
1344 cur = reader->node->properties;
1345 if (cur == NULL)
1346 return(0);
1347 for (;i < no;i++) {
1348 cur = cur->next;
1349 if (cur == NULL)
1350 return(0);
1351 }
1352 /* TODO walk the DTD if present */
1353
1354 reader->curnode = (xmlNodePtr) cur;
1355 return(1);
1356}
1357
1358/**
1359 * xmlTextReaderMoveToAttribute:
1360 * @reader: the xmlTextReaderPtr used
1361 * @name: the qualified name of the attribute.
1362 *
1363 * Moves the position of the current instance to the attribute with
1364 * the specified qualified name.
1365 *
1366 * Returns 1 in case of success, -1 in case of error, 0 if not found
1367 */
1368int
1369xmlTextReaderMoveToAttribute(xmlTextReaderPtr reader, const xmlChar *name) {
1370 xmlChar *prefix = NULL;
1371 xmlChar *localname;
1372 xmlNsPtr ns;
1373 xmlAttrPtr prop;
1374
1375 if ((reader == NULL) || (name == NULL))
1376 return(-1);
1377 if (reader->node == NULL)
1378 return(-1);
1379
1380 /* TODO: handle the xmlDecl */
1381 if (reader->node->type != XML_ELEMENT_NODE)
1382 return(0);
1383
1384 localname = xmlSplitQName2(name, &prefix);
1385 if (localname == NULL) {
1386 /*
1387 * Namespace default decl
1388 */
1389 if (xmlStrEqual(name, BAD_CAST "xmlns")) {
1390 ns = reader->node->nsDef;
1391 while (ns != NULL) {
1392 if (ns->prefix == NULL) {
1393 reader->curnode = (xmlNodePtr) ns;
1394 return(1);
1395 }
1396 ns = ns->next;
1397 }
1398 return(0);
1399 }
1400
1401 prop = reader->node->properties;
1402 while (prop != NULL) {
1403 /*
1404 * One need to have
1405 * - same attribute names
1406 * - and the attribute carrying that namespace
1407 */
1408 if ((xmlStrEqual(prop->name, name)) &&
1409 ((prop->ns == NULL) || (prop->ns->prefix == NULL))) {
1410 reader->curnode = (xmlNodePtr) prop;
1411 return(1);
1412 }
1413 prop = prop->next;
1414 }
1415 return(0);
1416 }
1417
1418 /*
1419 * Namespace default decl
1420 */
1421 if (xmlStrEqual(prefix, BAD_CAST "xmlns")) {
1422 ns = reader->node->nsDef;
1423 while (ns != NULL) {
1424 if ((ns->prefix != NULL) && (xmlStrEqual(ns->prefix, localname))) {
1425 reader->curnode = (xmlNodePtr) ns;
1426 goto found;
1427 }
1428 ns = ns->next;
1429 }
1430 goto not_found;
1431 }
1432 prop = reader->node->properties;
1433 while (prop != NULL) {
1434 /*
1435 * One need to have
1436 * - same attribute names
1437 * - and the attribute carrying that namespace
1438 */
1439 if ((xmlStrEqual(prop->name, localname)) &&
1440 (prop->ns != NULL) && (xmlStrEqual(prop->ns->prefix, prefix))) {
1441 reader->curnode = (xmlNodePtr) prop;
1442 goto found;
1443 }
1444 prop = prop->next;
1445 }
1446not_found:
1447 if (localname != NULL)
1448 xmlFree(localname);
1449 if (prefix != NULL)
1450 xmlFree(prefix);
1451 return(0);
1452
1453found:
1454 if (localname != NULL)
1455 xmlFree(localname);
1456 if (prefix != NULL)
1457 xmlFree(prefix);
1458 return(1);
1459}
1460
1461/**
1462 * xmlTextReaderMoveToAttributeNs:
1463 * @reader: the xmlTextReaderPtr used
1464 * @localName: the local name of the attribute.
1465 * @namespaceURI: the namespace URI of the attribute.
1466 *
1467 * Moves the position of the current instance to the attribute with the
1468 * specified local name and namespace URI.
1469 *
1470 * Returns 1 in case of success, -1 in case of error, 0 if not found
1471 */
1472int
1473xmlTextReaderMoveToAttributeNs(xmlTextReaderPtr reader,
1474 const xmlChar *localName, const xmlChar *namespaceURI) {
1475 xmlAttrPtr prop;
1476 xmlNodePtr node;
1477
1478 if ((reader == NULL) || (localName == NULL) || (namespaceURI == NULL))
1479 return(-1);
1480 if (reader->node == NULL)
1481 return(-1);
1482 if (reader->node->type != XML_ELEMENT_NODE)
1483 return(0);
1484 node = reader->node;
1485
1486 /*
1487 * A priori reading http://www.w3.org/TR/REC-xml-names/ there is no
1488 * namespace name associated to "xmlns"
1489 */
1490 prop = node->properties;
1491 while (prop != NULL) {
1492 /*
1493 * One need to have
1494 * - same attribute names
1495 * - and the attribute carrying that namespace
1496 */
1497 if (xmlStrEqual(prop->name, localName) &&
1498 ((prop->ns != NULL) &&
1499 (xmlStrEqual(prop->ns->href, namespaceURI)))) {
1500 reader->curnode = (xmlNodePtr) prop;
1501 return(1);
1502 }
1503 prop = prop->next;
1504 }
1505 return(0);
1506}
1507
1508/**
1509 * xmlTextReaderMoveToFirstAttribute:
1510 * @reader: the xmlTextReaderPtr used
1511 *
1512 * Moves the position of the current instance to the first attribute
1513 * associated with the current node.
1514 *
1515 * Returns 1 in case of success, -1 in case of error, 0 if not found
1516 */
1517int
1518xmlTextReaderMoveToFirstAttribute(xmlTextReaderPtr reader) {
1519 if (reader == NULL)
1520 return(-1);
1521 if (reader->node == NULL)
1522 return(-1);
1523 if (reader->node->type != XML_ELEMENT_NODE)
1524 return(0);
1525
1526 if (reader->node->nsDef != NULL) {
1527 reader->curnode = (xmlNodePtr) reader->node->nsDef;
1528 return(1);
1529 }
1530 if (reader->node->properties != NULL) {
1531 reader->curnode = (xmlNodePtr) reader->node->properties;
1532 return(1);
1533 }
1534 return(0);
1535}
1536
1537/**
1538 * xmlTextReaderMoveToNextAttribute:
1539 * @reader: the xmlTextReaderPtr used
1540 *
1541 * Moves the position of the current instance to the next attribute
1542 * associated with the current node.
1543 *
1544 * Returns 1 in case of success, -1 in case of error, 0 if not found
1545 */
1546int
1547xmlTextReaderMoveToNextAttribute(xmlTextReaderPtr reader) {
1548 if (reader == NULL)
1549 return(-1);
1550 if (reader->node == NULL)
1551 return(-1);
1552 if (reader->node->type != XML_ELEMENT_NODE)
1553 return(0);
1554 if (reader->curnode == NULL)
1555 return(xmlTextReaderMoveToFirstAttribute(reader));
1556
1557 if (reader->curnode->type == XML_NAMESPACE_DECL) {
1558 xmlNsPtr ns = (xmlNsPtr) reader->curnode;
1559 if (ns->next != NULL) {
1560 reader->curnode = (xmlNodePtr) ns->next;
1561 return(1);
1562 }
1563 if (reader->node->properties != NULL) {
1564 reader->curnode = (xmlNodePtr) reader->node->properties;
1565 return(1);
1566 }
1567 return(0);
1568 } else if ((reader->curnode->type == XML_ATTRIBUTE_NODE) &&
1569 (reader->curnode->next != NULL)) {
1570 reader->curnode = reader->curnode->next;
1571 return(1);
1572 }
1573 return(0);
1574}
1575
1576/**
1577 * xmlTextReaderMoveToElement:
1578 * @reader: the xmlTextReaderPtr used
1579 *
1580 * Moves the position of the current instance to the node that
1581 * contains the current Attribute node.
1582 *
1583 * Returns 1 in case of success, -1 in case of error, 0 if not moved
1584 */
1585int
1586xmlTextReaderMoveToElement(xmlTextReaderPtr reader) {
1587 if (reader == NULL)
1588 return(-1);
1589 if (reader->node == NULL)
1590 return(-1);
1591 if (reader->node->type != XML_ELEMENT_NODE)
1592 return(0);
1593 if (reader->curnode != NULL) {
1594 reader->curnode = NULL;
1595 return(1);
1596 }
1597 return(0);
1598}
1599
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00001600/**
1601 * xmlTextReaderReadAttributeValue:
1602 * @reader: the xmlTextReaderPtr used
1603 *
1604 * Parses an attribute value into one or more Text and EntityReference nodes.
1605 *
1606 * Returns 1 in case of success, 0 if the reader was not positionned on an
1607 * ttribute node or all the attribute values have been read, or -1
1608 * in case of error.
1609 */
1610int
1611xmlTextReaderReadAttributeValue(xmlTextReaderPtr reader) {
1612 if (reader == NULL)
1613 return(-1);
1614 if (reader->node == NULL)
1615 return(-1);
1616 if (reader->curnode == NULL)
1617 return(0);
1618 if (reader->curnode->type == XML_ATTRIBUTE_NODE) {
1619 if (reader->curnode->children == NULL)
1620 return(0);
1621 reader->curnode = reader->curnode->children;
1622 } else if (reader->curnode->type == XML_NAMESPACE_DECL) {
1623 xmlNsPtr ns = (xmlNsPtr) reader->curnode;
1624
1625 if (reader->faketext == NULL) {
1626 reader->faketext = xmlNewDocText(reader->node->doc,
1627 ns->href);
1628 } else {
1629 if (reader->faketext->content != NULL)
1630 xmlFree(reader->faketext->content);
1631 reader->faketext->content = xmlStrdup(ns->href);
1632 }
1633 reader->curnode = reader->faketext;
1634 } else {
1635 if (reader->curnode->next == NULL)
1636 return(0);
1637 reader->curnode = reader->curnode->next;
1638 }
1639 return(1);
1640}
1641
Daniel Veillard0eb38c72002-12-14 23:00:35 +00001642/************************************************************************
1643 * *
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001644 * Access API to the current node *
1645 * *
1646 ************************************************************************/
1647/**
1648 * xmlTextReaderAttributeCount:
1649 * @reader: the xmlTextReaderPtr used
1650 *
Daniel Veillarda9b66d02002-12-11 14:23:49 +00001651 * Provides the number of attributes of the current node
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001652 *
1653 * Returns 0 i no attributes, -1 in case of error or the attribute count
1654 */
1655int
1656xmlTextReaderAttributeCount(xmlTextReaderPtr reader) {
1657 int ret;
1658 xmlAttrPtr attr;
Daniel Veillard67df8092002-12-16 22:04:11 +00001659 xmlNsPtr ns;
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001660 xmlNodePtr node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001661
1662 if (reader == NULL)
1663 return(-1);
1664 if (reader->node == NULL)
1665 return(0);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001666
1667 if (reader->curnode != NULL)
1668 node = reader->curnode;
1669 else
1670 node = reader->node;
1671
1672 if (node->type != XML_ELEMENT_NODE)
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001673 return(0);
1674 if ((reader->state == XML_TEXTREADER_END) ||
1675 (reader->state == XML_TEXTREADER_BACKTRACK))
1676 return(0);
1677 ret = 0;
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001678 attr = node->properties;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001679 while (attr != NULL) {
1680 ret++;
1681 attr = attr->next;
1682 }
Daniel Veillard67df8092002-12-16 22:04:11 +00001683 ns = node->nsDef;
1684 while (ns != NULL) {
1685 ret++;
1686 ns = ns->next;
1687 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001688 return(ret);
1689}
1690
1691/**
1692 * xmlTextReaderNodeType:
1693 * @reader: the xmlTextReaderPtr used
1694 *
1695 * Get the node type of the current node
1696 * Reference:
1697 * http://dotgnu.org/pnetlib-doc/System/Xml/XmlNodeType.html
1698 *
1699 * Returns the xmlNodeType of the current node or -1 in case of error
1700 */
1701int
1702xmlTextReaderNodeType(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001703 xmlNodePtr node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001704 if (reader == NULL)
1705 return(-1);
1706 if (reader->node == NULL)
1707 return(0);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001708 if (reader->curnode != NULL)
1709 node = reader->curnode;
1710 else
1711 node = reader->node;
1712 switch (node->type) {
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001713 case XML_ELEMENT_NODE:
1714 if ((reader->state == XML_TEXTREADER_END) ||
1715 (reader->state == XML_TEXTREADER_BACKTRACK))
1716 return(15);
1717 return(1);
Daniel Veillardecaba492002-12-30 10:55:29 +00001718 case XML_NAMESPACE_DECL:
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001719 case XML_ATTRIBUTE_NODE:
1720 return(2);
1721 case XML_TEXT_NODE:
1722 return(3); /* TODO: SignificantWhitespace == 14 Whitespace == 13 */
1723 case XML_CDATA_SECTION_NODE:
1724 return(4);
1725 case XML_ENTITY_REF_NODE:
1726 return(5);
1727 case XML_ENTITY_NODE:
1728 return(6);
1729 case XML_PI_NODE:
1730 return(7);
1731 case XML_COMMENT_NODE:
1732 return(8);
1733 case XML_DOCUMENT_NODE:
1734 case XML_HTML_DOCUMENT_NODE:
1735#ifdef LIBXML_DOCB_ENABLED
1736 case XML_DOCB_DOCUMENT_NODE:
1737#endif
1738 return(9);
1739 case XML_DOCUMENT_FRAG_NODE:
1740 return(11);
1741 case XML_NOTATION_NODE:
1742 return(12);
1743 case XML_DOCUMENT_TYPE_NODE:
1744 case XML_DTD_NODE:
1745 return(10);
1746
1747 case XML_ELEMENT_DECL:
1748 case XML_ATTRIBUTE_DECL:
1749 case XML_ENTITY_DECL:
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001750 case XML_XINCLUDE_START:
1751 case XML_XINCLUDE_END:
1752 return(0);
1753 }
1754 return(-1);
1755}
1756
1757/**
Daniel Veillard01c13b52002-12-10 15:19:08 +00001758 * xmlTextReaderIsEmptyElement:
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001759 * @reader: the xmlTextReaderPtr used
1760 *
1761 * Check if the current node is empty
1762 *
1763 * Returns 1 if empty, 0 if not and -1 in case of error
1764 */
1765int
1766xmlTextReaderIsEmptyElement(xmlTextReaderPtr reader) {
1767 if ((reader == NULL) || (reader->node == NULL))
1768 return(-1);
Daniel Veillarddf512f42002-12-23 15:56:21 +00001769 if (reader->node->type != XML_ELEMENT_NODE)
1770 return(0);
Daniel Veillarde3c036e2003-01-01 15:11:05 +00001771 if (reader->curnode != NULL)
1772 return(0);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001773 if (reader->node->children != NULL)
1774 return(0);
Daniel Veillarddab8ea92003-01-02 14:16:45 +00001775 if (reader->state == XML_TEXTREADER_END)
1776 return(0);
Daniel Veillard067bae52003-01-05 01:27:54 +00001777 return(reader->node->_private == (void *)xmlTextReaderIsEmpty);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001778}
1779
1780/**
1781 * xmlTextReaderLocalName:
1782 * @reader: the xmlTextReaderPtr used
1783 *
1784 * The local name of the node.
1785 *
1786 * Returns the local name or NULL if not available
1787 */
1788xmlChar *
1789xmlTextReaderLocalName(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001790 xmlNodePtr node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001791 if ((reader == NULL) || (reader->node == NULL))
1792 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001793 if (reader->curnode != NULL)
1794 node = reader->curnode;
1795 else
1796 node = reader->node;
1797 if (node->type == XML_NAMESPACE_DECL) {
1798 xmlNsPtr ns = (xmlNsPtr) node;
1799 if (ns->prefix == NULL)
1800 return(xmlStrdup(BAD_CAST "xmlns"));
1801 else
1802 return(xmlStrdup(ns->prefix));
1803 }
1804 if ((node->type != XML_ELEMENT_NODE) &&
1805 (node->type != XML_ATTRIBUTE_NODE))
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00001806 return(xmlTextReaderName(reader));
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001807 return(xmlStrdup(node->name));
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001808}
1809
1810/**
1811 * xmlTextReaderName:
1812 * @reader: the xmlTextReaderPtr used
1813 *
1814 * The qualified name of the node, equal to Prefix :LocalName.
1815 *
1816 * Returns the local name or NULL if not available
1817 */
1818xmlChar *
1819xmlTextReaderName(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001820 xmlNodePtr node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001821 xmlChar *ret;
1822
1823 if ((reader == NULL) || (reader->node == NULL))
1824 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001825 if (reader->curnode != NULL)
1826 node = reader->curnode;
1827 else
1828 node = reader->node;
1829 switch (node->type) {
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00001830 case XML_ELEMENT_NODE:
1831 case XML_ATTRIBUTE_NODE:
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001832 if ((node->ns == NULL) ||
1833 (node->ns->prefix == NULL))
1834 return(xmlStrdup(node->name));
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00001835
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001836 ret = xmlStrdup(node->ns->prefix);
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00001837 ret = xmlStrcat(ret, BAD_CAST ":");
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001838 ret = xmlStrcat(ret, node->name);
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00001839 return(ret);
1840 case XML_TEXT_NODE:
1841 return(xmlStrdup(BAD_CAST "#text"));
1842 case XML_CDATA_SECTION_NODE:
1843 return(xmlStrdup(BAD_CAST "#cdata-section"));
1844 case XML_ENTITY_NODE:
1845 case XML_ENTITY_REF_NODE:
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001846 return(xmlStrdup(node->name));
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00001847 case XML_PI_NODE:
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001848 return(xmlStrdup(node->name));
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00001849 case XML_COMMENT_NODE:
1850 return(xmlStrdup(BAD_CAST "#comment"));
1851 case XML_DOCUMENT_NODE:
1852 case XML_HTML_DOCUMENT_NODE:
1853#ifdef LIBXML_DOCB_ENABLED
1854 case XML_DOCB_DOCUMENT_NODE:
1855#endif
1856 return(xmlStrdup(BAD_CAST "#document"));
1857 case XML_DOCUMENT_FRAG_NODE:
1858 return(xmlStrdup(BAD_CAST "#document-fragment"));
1859 case XML_NOTATION_NODE:
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001860 return(xmlStrdup(node->name));
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00001861 case XML_DOCUMENT_TYPE_NODE:
1862 case XML_DTD_NODE:
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001863 return(xmlStrdup(node->name));
1864 case XML_NAMESPACE_DECL: {
1865 xmlNsPtr ns = (xmlNsPtr) node;
1866
1867 ret = xmlStrdup(BAD_CAST "xmlns");
1868 if (ns->prefix == NULL)
1869 return(ret);
1870 ret = xmlStrcat(ret, BAD_CAST ":");
1871 ret = xmlStrcat(ret, ns->prefix);
1872 return(ret);
1873 }
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00001874
1875 case XML_ELEMENT_DECL:
1876 case XML_ATTRIBUTE_DECL:
1877 case XML_ENTITY_DECL:
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00001878 case XML_XINCLUDE_START:
1879 case XML_XINCLUDE_END:
1880 return(NULL);
1881 }
1882 return(NULL);
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001883}
1884
1885/**
1886 * xmlTextReaderPrefix:
1887 * @reader: the xmlTextReaderPtr used
1888 *
1889 * A shorthand reference to the namespace associated with the node.
1890 *
1891 * Returns the prefix or NULL if not available
1892 */
1893xmlChar *
1894xmlTextReaderPrefix(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001895 xmlNodePtr node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001896 if ((reader == NULL) || (reader->node == NULL))
1897 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001898 if (reader->curnode != NULL)
1899 node = reader->curnode;
1900 else
1901 node = reader->node;
1902 if (node->type == XML_NAMESPACE_DECL) {
1903 xmlNsPtr ns = (xmlNsPtr) node;
1904 if (ns->prefix == NULL)
1905 return(NULL);
1906 return(xmlStrdup(BAD_CAST "xmlns"));
1907 }
1908 if ((node->type != XML_ELEMENT_NODE) &&
1909 (node->type != XML_ATTRIBUTE_NODE))
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001910 return(NULL);
Daniel Veillard952379b2003-03-17 15:37:12 +00001911 if ((node->ns != NULL) && (node->ns->prefix != NULL))
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001912 return(xmlStrdup(node->ns->prefix));
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001913 return(NULL);
1914}
1915
1916/**
1917 * xmlTextReaderNamespaceUri:
1918 * @reader: the xmlTextReaderPtr used
1919 *
1920 * The URI defining the namespace associated with the node.
1921 *
1922 * Returns the namespace URI or NULL if not available
1923 */
1924xmlChar *
1925xmlTextReaderNamespaceUri(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001926 xmlNodePtr node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001927 if ((reader == NULL) || (reader->node == NULL))
1928 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001929 if (reader->curnode != NULL)
1930 node = reader->curnode;
1931 else
1932 node = reader->node;
Daniel Veillardecaba492002-12-30 10:55:29 +00001933 if (node->type == XML_NAMESPACE_DECL)
1934 return(xmlStrdup(BAD_CAST "http://www.w3.org/2000/xmlns/"));
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001935 if ((node->type != XML_ELEMENT_NODE) &&
1936 (node->type != XML_ATTRIBUTE_NODE))
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001937 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001938 if (node->ns != NULL)
1939 return(xmlStrdup(node->ns->href));
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001940 return(NULL);
1941}
1942
1943/**
1944 * xmlTextReaderBaseUri:
1945 * @reader: the xmlTextReaderPtr used
1946 *
1947 * The base URI of the node.
1948 *
1949 * Returns the base URI or NULL if not available
1950 */
1951xmlChar *
1952xmlTextReaderBaseUri(xmlTextReaderPtr reader) {
1953 if ((reader == NULL) || (reader->node == NULL))
1954 return(NULL);
1955 return(xmlNodeGetBase(NULL, reader->node));
1956}
1957
1958/**
1959 * xmlTextReaderDepth:
1960 * @reader: the xmlTextReaderPtr used
1961 *
1962 * The depth of the node in the tree.
1963 *
1964 * Returns the depth or -1 in case of error
1965 */
1966int
1967xmlTextReaderDepth(xmlTextReaderPtr reader) {
1968 if (reader == NULL)
1969 return(-1);
1970 if (reader->node == NULL)
1971 return(0);
1972
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00001973 if (reader->curnode != NULL) {
1974 if ((reader->curnode->type == XML_ATTRIBUTE_NODE) ||
1975 (reader->curnode->type == XML_NAMESPACE_DECL))
1976 return(reader->depth + 1);
1977 return(reader->depth + 2);
1978 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001979 return(reader->depth);
1980}
1981
1982/**
1983 * xmlTextReaderHasAttributes:
1984 * @reader: the xmlTextReaderPtr used
1985 *
1986 * Whether the node has attributes.
1987 *
1988 * Returns 1 if true, 0 if false, and -1 in case or error
1989 */
1990int
1991xmlTextReaderHasAttributes(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001992 xmlNodePtr node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00001993 if (reader == NULL)
1994 return(-1);
1995 if (reader->node == NULL)
1996 return(0);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00001997 if (reader->curnode != NULL)
1998 node = reader->curnode;
1999 else
2000 node = reader->node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002001
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002002 if ((node->type == XML_ELEMENT_NODE) &&
2003 (node->properties != NULL))
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002004 return(1);
2005 /* TODO: handle the xmlDecl */
2006 return(0);
2007}
2008
2009/**
2010 * xmlTextReaderHasValue:
2011 * @reader: the xmlTextReaderPtr used
2012 *
2013 * Whether the node can have a text value.
2014 *
2015 * Returns 1 if true, 0 if false, and -1 in case or error
2016 */
2017int
2018xmlTextReaderHasValue(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002019 xmlNodePtr node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002020 if (reader == NULL)
2021 return(-1);
2022 if (reader->node == NULL)
2023 return(0);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002024 if (reader->curnode != NULL)
2025 node = reader->curnode;
2026 else
2027 node = reader->node;
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002028
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002029 switch (node->type) {
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002030 case XML_ATTRIBUTE_NODE:
2031 case XML_TEXT_NODE:
2032 case XML_CDATA_SECTION_NODE:
2033 case XML_PI_NODE:
2034 case XML_COMMENT_NODE:
2035 return(1);
2036 default:
2037 return(0);
2038 }
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002039 return(0);
2040}
2041
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002042/**
2043 * xmlTextReaderValue:
2044 * @reader: the xmlTextReaderPtr used
2045 *
2046 * Provides the text value of the node if present
2047 *
2048 * Returns the string or NULL if not available. The retsult must be deallocated
2049 * with xmlFree()
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002050 */
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002051xmlChar *
2052xmlTextReaderValue(xmlTextReaderPtr reader) {
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002053 xmlNodePtr node;
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002054 if (reader == NULL)
2055 return(NULL);
2056 if (reader->node == NULL)
2057 return(NULL);
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002058 if (reader->curnode != NULL)
2059 node = reader->curnode;
2060 else
2061 node = reader->node;
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002062
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002063 switch (node->type) {
2064 case XML_NAMESPACE_DECL:
2065 return(xmlStrdup(((xmlNsPtr) node)->href));
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002066 case XML_ATTRIBUTE_NODE:{
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002067 xmlAttrPtr attr = (xmlAttrPtr) node;
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002068
2069 if (attr->parent != NULL)
2070 return (xmlNodeListGetString
2071 (attr->parent->doc, attr->children, 1));
2072 else
2073 return (xmlNodeListGetString(NULL, attr->children, 1));
2074 break;
2075 }
2076 case XML_TEXT_NODE:
2077 case XML_CDATA_SECTION_NODE:
2078 case XML_PI_NODE:
2079 case XML_COMMENT_NODE:
Daniel Veillardda46d2d2002-12-15 23:36:49 +00002080 if (node->content != NULL)
2081 return (xmlStrdup(node->content));
Daniel Veillard9b4bb4d2002-12-11 19:28:47 +00002082 default:
2083 return(NULL);
2084 }
2085 return(NULL);
2086}
2087
2088/**
2089 * xmlTextReaderIsDefault:
2090 * @reader: the xmlTextReaderPtr used
2091 *
2092 * Whether an Attribute node was generated from the default value
2093 * defined in the DTD or schema.
2094 *
2095 * Returns 0 if not defaulted, 1 if defaulted, and -1 in case of error
2096 */
2097int
2098xmlTextReaderIsDefault(xmlTextReaderPtr reader) {
2099 if (reader == NULL)
2100 return(-1);
2101 return(0);
2102}
2103
2104/**
2105 * xmlTextReaderQuoteChar:
2106 * @reader: the xmlTextReaderPtr used
2107 *
2108 * The quotation mark character used to enclose the value of an attribute.
2109 *
2110 * Returns " or ' and -1 in case of error
2111 */
2112int
2113xmlTextReaderQuoteChar(xmlTextReaderPtr reader) {
2114 if (reader == NULL)
2115 return(-1);
2116 /* TODO maybe lookup the attribute value for " first */
2117 return((int) '"');
2118}
Daniel Veillarde1ca5032002-12-09 14:13:43 +00002119
2120/**
2121 * xmlTextReaderXmlLang:
2122 * @reader: the xmlTextReaderPtr used
2123 *
2124 * The xml:lang scope within which the node resides.
2125 *
2126 * Returns the xml:lang value or NULL if none exists.
2127 */
2128xmlChar *
2129xmlTextReaderXmlLang(xmlTextReaderPtr reader) {
2130 if (reader == NULL)
2131 return(NULL);
2132 if (reader->node == NULL)
2133 return(NULL);
2134 return(xmlNodeGetLang(reader->node));
2135}
2136
Daniel Veillard67df8092002-12-16 22:04:11 +00002137/**
2138 * xmlTextReaderNormalization:
2139 * @reader: the xmlTextReaderPtr used
2140 *
2141 * The value indicating whether to normalize white space and attribute values.
2142 * Since attribute value and end of line normalizations are a MUST in the XML
2143 * specification only the value true is accepted. The broken bahaviour of
2144 * accepting out of range character entities like &#0; is of course not
2145 * supported either.
2146 *
2147 * Returns 1 or -1 in case of error.
2148 */
2149int
2150xmlTextReaderNormalization(xmlTextReaderPtr reader) {
2151 if (reader == NULL)
2152 return(-1);
2153 return(1);
2154}
2155
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00002156/************************************************************************
2157 * *
2158 * Extensions to the base APIs *
2159 * *
2160 ************************************************************************/
2161
2162/**
2163 * xmlTextReaderSetParserProp:
2164 * @reader: the xmlTextReaderPtr used
2165 * @prop: the xmlParserProperties to set
2166 * @value: usually 0 or 1 to (de)activate it
2167 *
2168 * Change the parser processing behaviour by changing some of its internal
2169 * properties. Note that some properties can only be changed before any
2170 * read has been done.
2171 *
2172 * Returns 0 if the call was successful, or -1 in case of error
2173 */
2174int
2175xmlTextReaderSetParserProp(xmlTextReaderPtr reader, int prop, int value) {
2176 xmlParserProperties p = (xmlParserProperties) prop;
2177 xmlParserCtxtPtr ctxt;
2178
2179 if ((reader == NULL) || (reader->ctxt == NULL))
2180 return(-1);
2181 ctxt = reader->ctxt;
2182
2183 switch (p) {
2184 case XML_PARSER_LOADDTD:
2185 if (value != 0) {
2186 if (ctxt->loadsubset == 0) {
2187 if (reader->mode != XML_TEXTREADER_MODE_INITIAL)
2188 return(-1);
2189 ctxt->loadsubset = XML_DETECT_IDS;
2190 }
2191 } else {
2192 ctxt->loadsubset = 0;
2193 }
2194 return(0);
2195 case XML_PARSER_DEFAULTATTRS:
2196 if (value != 0) {
2197 ctxt->loadsubset |= XML_COMPLETE_ATTRS;
2198 } else {
2199 if (ctxt->loadsubset & XML_COMPLETE_ATTRS)
2200 ctxt->loadsubset -= XML_COMPLETE_ATTRS;
2201 }
2202 return(0);
2203 case XML_PARSER_VALIDATE:
2204 if (value != 0) {
2205 ctxt->validate = 1;
2206 } else {
2207 ctxt->validate = 0;
2208 }
2209 return(0);
Daniel Veillarde18fc182002-12-28 22:56:33 +00002210 case XML_PARSER_SUBST_ENTITIES:
2211 if (value != 0) {
2212 ctxt->replaceEntities = 1;
2213 } else {
2214 ctxt->replaceEntities = 0;
2215 }
2216 return(0);
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00002217 }
2218 return(-1);
2219}
2220
2221/**
2222 * xmlTextReaderGetParserProp:
2223 * @reader: the xmlTextReaderPtr used
2224 * @prop: the xmlParserProperties to get
2225 *
2226 * Read the parser internal property.
2227 *
2228 * Returns the value, usually 0 or 1, or -1 in case of error.
2229 */
2230int
2231xmlTextReaderGetParserProp(xmlTextReaderPtr reader, int prop) {
2232 xmlParserProperties p = (xmlParserProperties) prop;
2233 xmlParserCtxtPtr ctxt;
2234
2235 if ((reader == NULL) || (reader->ctxt == NULL))
2236 return(-1);
2237 ctxt = reader->ctxt;
2238
2239 switch (p) {
2240 case XML_PARSER_LOADDTD:
2241 if ((ctxt->loadsubset != 0) || (ctxt->validate != 0))
2242 return(1);
2243 return(0);
2244 case XML_PARSER_DEFAULTATTRS:
2245 if (ctxt->loadsubset & XML_COMPLETE_ATTRS)
2246 return(1);
2247 return(0);
2248 case XML_PARSER_VALIDATE:
2249 return(ctxt->validate);
Daniel Veillarde18fc182002-12-28 22:56:33 +00002250 case XML_PARSER_SUBST_ENTITIES:
2251 return(ctxt->replaceEntities);
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00002252 }
2253 return(-1);
2254}
2255
Daniel Veillarde18fc182002-12-28 22:56:33 +00002256/**
2257 * xmlTextReaderCurrentNode:
2258 * @reader: the xmlTextReaderPtr used
2259 *
2260 * Hacking interface allowing to get the xmlNodePtr correponding to the
2261 * current node being accessed by the xmlTextReader. This is dangerous
2262 * because the underlying node may be destroyed on the next Reads.
2263 *
2264 * Returns the xmlNodePtr or NULL in case of error.
2265 */
2266xmlNodePtr
2267xmlTextReaderCurrentNode(xmlTextReaderPtr reader) {
2268 if (reader == NULL)
2269 return(NULL);
2270
2271 if (reader->curnode != NULL)
2272 return(reader->curnode);
2273 return(reader->node);
2274}
2275
2276/**
2277 * xmlTextReaderCurrentDoc:
2278 * @reader: the xmlTextReaderPtr used
2279 *
2280 * Hacking interface allowing to get the xmlDocPtr correponding to the
2281 * current document being accessed by the xmlTextReader. This is dangerous
2282 * because the associated node may be destroyed on the next Reads.
2283 *
2284 * Returns the xmlDocPtr or NULL in case of error.
2285 */
2286xmlDocPtr
2287xmlTextReaderCurrentDoc(xmlTextReaderPtr reader) {
2288 if ((reader == NULL) || (reader->ctxt == NULL))
2289 return(NULL);
2290
2291 return(reader->ctxt->myDoc);
2292}
2293
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00002294/************************************************************************
2295 * *
Daniel Veillard26f70262003-01-16 22:45:08 +00002296 * Error Handling Extensions *
2297 * *
2298 ************************************************************************/
2299
2300/* helper to build a xmlMalloc'ed string from a format and va_list */
2301static char *
2302xmlTextReaderBuildMessage(const char *msg, va_list ap) {
2303 int size;
2304 int chars;
2305 char *larger;
2306 char *str;
2307
2308 str = (char *) xmlMalloc(150);
2309 if (str == NULL) {
2310 xmlGenericError(xmlGenericErrorContext, "xmlMalloc failed !\n");
2311 return NULL;
2312 }
2313
2314 size = 150;
2315
2316 while (1) {
2317 chars = vsnprintf(str, size, msg, ap);
2318 if ((chars > -1) && (chars < size))
2319 break;
2320 if (chars > -1)
2321 size += chars + 1;
2322 else
2323 size += 100;
2324 if ((larger = (char *) xmlRealloc(str, size)) == NULL) {
2325 xmlGenericError(xmlGenericErrorContext, "xmlRealloc failed !\n");
2326 xmlFree(str);
2327 return NULL;
2328 }
2329 str = larger;
2330 }
2331
2332 return str;
2333}
2334
Daniel Veillard417be3a2003-01-20 21:26:34 +00002335/**
Daniel Veillard540a31a2003-01-21 11:21:07 +00002336 * xmlTextReaderLocatorLineNumber:
Daniel Veillard417be3a2003-01-20 21:26:34 +00002337 * @locator: the xmlTextReaderLocatorPtr used
2338 *
2339 * Obtain the line number for the given locator.
2340 *
2341 * Returns the line number or -1 in case of error.
2342 */
2343int
2344xmlTextReaderLocatorLineNumber(xmlTextReaderLocatorPtr locator) {
2345 /* we know that locator is a xmlParserCtxtPtr */
2346 xmlParserCtxtPtr ctx = (xmlParserCtxtPtr)locator;
2347 int ret = -1;
2348
2349 if (ctx->node != NULL) {
2350 ret = xmlGetLineNo(ctx->node);
2351 }
2352 else {
2353 /* inspired from error.c */
2354 xmlParserInputPtr input;
2355 input = ctx->input;
2356 if ((input->filename == NULL) && (ctx->inputNr > 1))
2357 input = ctx->inputTab[ctx->inputNr - 2];
2358 if (input != NULL) {
2359 ret = input->line;
2360 }
2361 else {
2362 ret = -1;
2363 }
2364 }
2365
2366 return ret;
2367}
2368
2369/**
Daniel Veillard540a31a2003-01-21 11:21:07 +00002370 * xmlTextReaderLocatorBaseURI:
Daniel Veillard417be3a2003-01-20 21:26:34 +00002371 * @locator: the xmlTextReaderLocatorPtr used
2372 *
2373 * Obtain the base URI for the given locator.
2374 *
2375 * Returns the base URI or NULL in case of error.
2376 */
2377xmlChar *
2378xmlTextReaderLocatorBaseURI(xmlTextReaderLocatorPtr locator) {
2379 /* we know that locator is a xmlParserCtxtPtr */
2380 xmlParserCtxtPtr ctx = (xmlParserCtxtPtr)locator;
2381 xmlChar *ret = NULL;
2382
2383 if (ctx->node != NULL) {
2384 ret = xmlNodeGetBase(NULL,ctx->node);
2385 }
2386 else {
2387 /* inspired from error.c */
2388 xmlParserInputPtr input;
2389 input = ctx->input;
2390 if ((input->filename == NULL) && (ctx->inputNr > 1))
2391 input = ctx->inputTab[ctx->inputNr - 2];
2392 if (input != NULL) {
Daniel Veillard580ced82003-03-21 21:22:48 +00002393 ret = xmlStrdup(BAD_CAST input->filename);
Daniel Veillard417be3a2003-01-20 21:26:34 +00002394 }
2395 else {
2396 ret = NULL;
2397 }
2398 }
2399
2400 return ret;
2401}
2402
Daniel Veillard26f70262003-01-16 22:45:08 +00002403static void
2404xmlTextReaderGenericError(void *ctxt, int severity, char *str) {
2405 xmlParserCtxtPtr ctx = (xmlParserCtxtPtr)ctxt;
2406 xmlTextReaderPtr reader = (xmlTextReaderPtr)ctx->_private;
2407
2408 if (str != NULL) {
2409 reader->errorFunc(reader->errorFuncArg,
2410 str,
Daniel Veillard417be3a2003-01-20 21:26:34 +00002411 severity,
2412 (xmlTextReaderLocatorPtr)ctx);
Daniel Veillard26f70262003-01-16 22:45:08 +00002413 xmlFree(str);
2414 }
2415}
2416
2417static void
2418xmlTextReaderError(void *ctxt, const char *msg, ...) {
2419 va_list ap;
2420
2421 va_start(ap,msg);
2422 xmlTextReaderGenericError(ctxt,
Daniel Veillard417be3a2003-01-20 21:26:34 +00002423 XML_PARSER_SEVERITY_ERROR,
Daniel Veillard26f70262003-01-16 22:45:08 +00002424 xmlTextReaderBuildMessage(msg,ap));
2425 va_end(ap);
2426
2427}
2428
2429static void
2430xmlTextReaderWarning(void *ctxt, const char *msg, ...) {
2431 va_list ap;
2432
2433 va_start(ap,msg);
2434 xmlTextReaderGenericError(ctxt,
Daniel Veillard417be3a2003-01-20 21:26:34 +00002435 XML_PARSER_SEVERITY_WARNING,
Daniel Veillard26f70262003-01-16 22:45:08 +00002436 xmlTextReaderBuildMessage(msg,ap));
2437 va_end(ap);
2438}
2439
2440static void
2441xmlTextReaderValidityError(void *ctxt, const char *msg, ...) {
2442 va_list ap;
Daniel Veillard417be3a2003-01-20 21:26:34 +00002443 int len = xmlStrlen((const xmlChar *) msg);
Daniel Veillard26f70262003-01-16 22:45:08 +00002444
Daniel Veillard417be3a2003-01-20 21:26:34 +00002445 if ((len > 1) && (msg[len - 2] != ':')) {
2446 /*
2447 * some callbacks only report locator information:
2448 * skip them (mimicking behaviour in error.c)
2449 */
2450 va_start(ap,msg);
2451 xmlTextReaderGenericError(ctxt,
2452 XML_PARSER_SEVERITY_VALIDITY_ERROR,
2453 xmlTextReaderBuildMessage(msg,ap));
2454 va_end(ap);
2455 }
Daniel Veillard26f70262003-01-16 22:45:08 +00002456}
2457
2458static void
2459xmlTextReaderValidityWarning(void *ctxt, const char *msg, ...) {
2460 va_list ap;
Daniel Veillard417be3a2003-01-20 21:26:34 +00002461 int len = xmlStrlen((const xmlChar *) msg);
Daniel Veillard26f70262003-01-16 22:45:08 +00002462
Daniel Veillard417be3a2003-01-20 21:26:34 +00002463 if ((len != 0) && (msg[len - 1] != ':')) {
2464 /*
2465 * some callbacks only report locator information:
2466 * skip them (mimicking behaviour in error.c)
2467 */
2468 va_start(ap,msg);
2469 xmlTextReaderGenericError(ctxt,
2470 XML_PARSER_SEVERITY_VALIDITY_WARNING,
2471 xmlTextReaderBuildMessage(msg,ap));
2472 va_end(ap);
2473 }
Daniel Veillard26f70262003-01-16 22:45:08 +00002474}
2475
2476/**
2477 * xmlTextReaderSetErrorHandler:
2478 * @reader: the xmlTextReaderPtr used
2479 * @f: the callback function to call on error and warnings
2480 * @arg: a user argument to pass to the callback function
2481 *
Daniel Veillard417be3a2003-01-20 21:26:34 +00002482 * Register a callback function that will be called on error and warnings.
2483 *
Daniel Veillard26f70262003-01-16 22:45:08 +00002484 * If @f is NULL, the default error and warning handlers are restored.
2485 */
2486void
2487xmlTextReaderSetErrorHandler(xmlTextReaderPtr reader,
2488 xmlTextReaderErrorFunc f,
Daniel Veillard417be3a2003-01-20 21:26:34 +00002489 void *arg) {
Daniel Veillard26f70262003-01-16 22:45:08 +00002490 if (f != NULL) {
2491 reader->ctxt->sax->error = xmlTextReaderError;
2492 reader->ctxt->vctxt.error = xmlTextReaderValidityError;
2493 reader->ctxt->sax->warning = xmlTextReaderWarning;
2494 reader->ctxt->vctxt.warning = xmlTextReaderValidityWarning;
2495 reader->errorFunc = f;
2496 reader->errorFuncArg = arg;
2497 }
2498 else {
2499 /* restore defaults */
2500 reader->ctxt->sax->error = xmlParserError;
2501 reader->ctxt->vctxt.error = xmlParserValidityError;
2502 reader->ctxt->sax->warning = xmlParserWarning;
2503 reader->ctxt->vctxt.warning = xmlParserValidityWarning;
2504 reader->errorFunc = NULL;
2505 reader->errorFuncArg = NULL;
2506 }
2507}
2508
Daniel Veillard417be3a2003-01-20 21:26:34 +00002509/**
2510 * xmlTextReaderGetErrorHandler:
2511 * @reader: the xmlTextReaderPtr used
2512 * @f: the callback function or NULL is no callback has been registered
2513 * @arg: a user argument
2514 *
2515 * Retrieve the error callback function and user argument.
2516 */
Daniel Veillard26f70262003-01-16 22:45:08 +00002517void
2518xmlTextReaderGetErrorHandler(xmlTextReaderPtr reader,
2519 xmlTextReaderErrorFunc *f,
Daniel Veillard417be3a2003-01-20 21:26:34 +00002520 void **arg) {
Daniel Veillard26f70262003-01-16 22:45:08 +00002521 *f = reader->errorFunc;
2522 *arg = reader->errorFuncArg;
2523}
2524
2525/************************************************************************
2526 * *
Daniel Veillardbeb70bd2002-12-18 14:53:54 +00002527 * Utilities *
2528 * *
2529 ************************************************************************/
/**
 * xmlBase64Decode:
 * @in:  the input buffer
 * @inlen:  the size of the input (in), the size read from it (out)
 * @to:  the output buffer
 * @tolen:  the size of the output (in), the size written to (out)
 *
 * Base64 decoder, reads from @in and save in @to
 * TODO: tell jody when this is actually exported
 *
 * Characters outside the Base64 alphabet are skipped; '.' is decoded as
 * the value 0. Input is converted one group of 4 significant characters
 * at a time, each producing up to 3 bytes. On return *@inlen is the index
 * just past the last fully converted group (ignorable characters met
 * between groups are counted as consumed), so a caller can resume from
 * there, and *@tolen is the number of bytes stored in @to.
 *
 * A group is only written while more than 3 bytes remain free in @to.
 *
 * Returns 1 if the input was exhausted or a '=' was found at the start of
 *         a group, 0 if a '=' ended a partially filled group which was
 *         then flushed, 2 if there wasn't enough space on the output or
 *         -1 in case of error (a NULL argument).
 */
static int
xmlBase64Decode(const unsigned char *in, unsigned long *inlen,
                unsigned char *to, unsigned long *tolen) {
    unsigned long incur;        /* current index in in[] */
    unsigned long inblk;        /* last block index in in[] */
    unsigned long outcur;       /* current index in out[] */
    unsigned long inmax;        /* size of in[] */
    unsigned long outmax;       /* size of out[] */
    unsigned char cur;          /* the current value read from in[] */
    /*
     * A group is 4 input values giving 3 output bytes; intmp needs all
     * 4 slots since the '=' terminator is stored at index 3.
     */
    unsigned char intmp[4] = { 0, 0, 0, 0 };
    unsigned char outtmp[3];
    int nbintmp;                /* number of byte in intmp[] */
    int is_ignore;              /* cur should be ignored */
    int is_end = 0;             /* the end of the base64 was found */
    int retval = 1;
    int i;

    if ((in == NULL) || (inlen == NULL) || (to == NULL) || (tolen == NULL))
        return(-1);

    incur = 0;
    inblk = 0;
    outcur = 0;
    inmax = *inlen;
    outmax = *tolen;
    nbintmp = 0;

    while (1) {
        if (incur >= inmax)
            break;
        cur = in[incur++];
        is_ignore = 0;
        if ((cur >= 'A') && (cur <= 'Z'))
            cur = cur - 'A';
        else if ((cur >= 'a') && (cur <= 'z'))
            cur = cur - 'a' + 26;
        else if ((cur >= '0') && (cur <= '9'))
            cur = cur - '0' + 52;
        else if (cur == '+')
            cur = 62;
        else if (cur == '/')
            cur = 63;
        else if (cur == '.')
            cur = 0;
        else if (cur == '=') /*no op , end of the base64 stream */
            is_end = 1;
        else {
            is_ignore = 1;
            /* between groups, skipped characters count as consumed */
            if (nbintmp == 0)
                inblk = incur;
        }

        if (!is_ignore) {
            int nbouttmp = 3;
            int is_break = 0;

            if (is_end) {
                if (nbintmp == 0)
                    break;
                /* a padded group yields fewer than 3 bytes */
                if ((nbintmp == 1) || (nbintmp == 2))
                    nbouttmp = 1;
                else
                    nbouttmp = 2;
                /* force the group to be complete after the store below */
                nbintmp = 3;
                is_break = 1;
            }
            intmp[nbintmp++] = cur;
            /*
             * if intmp is full, push the 4byte sequence as a 3 byte
             * sequence out
             */
            if (nbintmp == 4) {
                nbintmp = 0;
                outtmp[0] = (intmp[0] << 2) | ((intmp[1] & 0x30) >> 4);
                outtmp[1] =
                    ((intmp[1] & 0x0F) << 4) | ((intmp[2] & 0x3C) >> 2);
                outtmp[2] = ((intmp[2] & 0x03) << 6) | (intmp[3] & 0x3F);
                if (outcur + 3 >= outmax) {
                    retval = 2;
                    break;
                }

                for (i = 0; i < nbouttmp; i++)
                    to[outcur++] = outtmp[i];
                inblk = incur;
            }

            if (is_break) {
                retval = 0;
                break;
            }
        }
    }

    *tolen = outcur;
    *inlen = inblk;
    return (retval);
}
2640
2641/*
2642 * Test routine for the xmlBase64Decode function
2643 */
2644#if 0
/*
 * Disabled manual driver: decodes the same input three ways (in one call,
 * with a small output window, with a small input window) and prints the
 * results so they can be compared by eye.
 */
2645int main(int argc, char **argv) {
2646 char *input = " VW4 gcGV0 \n aXQgdGVzdCAuCg== ";
2647 char output[100];
2648 char output2[100];
2649 char output3[100];
2650 unsigned long inlen = strlen(input);
2651 unsigned long outlen = 100;
2652 int ret;
2653 unsigned long cons, tmp, tmp2, prod;
2654
2655 /*
2656 * Direct
2657 */
/* whole input, whole output buffer; inlen/outlen are updated in place */
2658 ret = xmlBase64Decode(input, &inlen, output, &outlen);
2659
2660 output[outlen] = 0;
2661 printf("ret: %d, inlen: %ld , outlen: %ld, output: '%s'\n", ret, inlen, outlen, output);
2662
2663 /*
2664 * output chunking
2665 */
/* cons = input bytes consumed so far, prod = output bytes produced so far */
2666 cons = 0;
2667 prod = 0;
2668 while (cons < inlen) {
/* each call is offered only 5 bytes of output space */
2669 tmp = 5;
2670 tmp2 = inlen - cons;
2671
2672 printf("%ld %ld\n", cons, prod);
2673 ret = xmlBase64Decode(&input[cons], &tmp2, &output2[prod], &tmp);
2674 cons += tmp2;
2675 prod += tmp;
2676 printf("%ld %ld\n", cons, prod);
2677 }
/* NOTE(review): terminates at outlen from the direct decode, not at prod */
2678 output2[outlen] = 0;
2679 printf("ret: %d, cons: %ld , prod: %ld, output: '%s'\n", ret, cons, prod, output2);
2680
2681 /*
2682 * input chunking
2683 */
2684 cons = 0;
2685 prod = 0;
2686 while (cons < inlen) {
/* all remaining output space, but at most 5 input bytes per call */
2687 tmp = 100 - prod;
2688 tmp2 = inlen - cons;
2689 if (tmp2 > 5)
2690 tmp2 = 5;
2691
2692 printf("%ld %ld\n", cons, prod);
2693 ret = xmlBase64Decode(&input[cons], &tmp2, &output3[prod], &tmp);
2694 cons += tmp2;
2695 prod += tmp;
2696 printf("%ld %ld\n", cons, prod);
2697 }
/* NOTE(review): terminates at outlen from the direct decode, not at prod */
2698 output3[outlen] = 0;
2699 printf("ret: %d, cons: %ld , prod: %ld, output: '%s'\n", ret, cons, prod, output3);
2700 return(0);
2701
2702}
2703#endif