| /* |
| * testHTML.c : a small tester program for HTML input. |
| * |
| * See Copyright for the status of this software. |
| * |
| * daniel@veillard.com |
| */ |
| |
| #include "libxml.h" |
| |
| #ifdef LIBXML_HTML_ENABLED |
| |
| #include <string.h> |
| #include <stdarg.h> |
| |
| |
| #ifdef HAVE_SYS_TYPES_H |
| #include <sys/types.h> |
| #endif |
| #ifdef HAVE_SYS_STAT_H |
| #include <sys/stat.h> |
| #endif |
| #ifdef HAVE_FCNTL_H |
| #include <fcntl.h> |
| #endif |
| #ifdef HAVE_UNISTD_H |
| #include <unistd.h> |
| #endif |
| #ifdef HAVE_STDLIB_H |
| #include <stdlib.h> |
| #endif |
| |
| #include <libxml/xmlmemory.h> |
| #include <libxml/HTMLparser.h> |
| #include <libxml/HTMLtree.h> |
| #include <libxml/debugXML.h> |
| #include <libxml/xmlerror.h> |
| #include <libxml/globals.h> |
| |
| #ifdef LIBXML_DEBUG_ENABLED |
| static int debug = 0; |
| #endif |
| static int copy = 0; |
| static int sax = 0; |
| static int repeat = 0; |
| static int noout = 0; |
| #ifdef LIBXML_PUSH_ENABLED |
| static int push = 0; |
| #endif /* LIBXML_PUSH_ENABLED */ |
| static char *encoding = NULL; |
| static int options = 0; |
| |
| xmlSAXHandler emptySAXHandlerStruct = { |
| NULL, /* internalSubset */ |
| NULL, /* isStandalone */ |
| NULL, /* hasInternalSubset */ |
| NULL, /* hasExternalSubset */ |
| NULL, /* resolveEntity */ |
| NULL, /* getEntity */ |
| NULL, /* entityDecl */ |
| NULL, /* notationDecl */ |
| NULL, /* attributeDecl */ |
| NULL, /* elementDecl */ |
| NULL, /* unparsedEntityDecl */ |
| NULL, /* setDocumentLocator */ |
| NULL, /* startDocument */ |
| NULL, /* endDocument */ |
| NULL, /* startElement */ |
| NULL, /* endElement */ |
| NULL, /* reference */ |
| NULL, /* characters */ |
| NULL, /* ignorableWhitespace */ |
| NULL, /* processingInstruction */ |
| NULL, /* comment */ |
| NULL, /* xmlParserWarning */ |
| NULL, /* xmlParserError */ |
| NULL, /* xmlParserError */ |
| NULL, /* getParameterEntity */ |
| NULL, /* cdataBlock */ |
| NULL, /* externalSubset */ |
| 1, /* initialized */ |
| NULL, /* private */ |
| NULL, /* startElementNsSAX2Func */ |
| NULL, /* endElementNsSAX2Func */ |
| NULL /* xmlStructuredErrorFunc */ |
| }; |
| |
| xmlSAXHandlerPtr emptySAXHandler = &emptySAXHandlerStruct; |
| extern xmlSAXHandlerPtr debugSAXHandler; |
| |
| /************************************************************************ |
| * * |
| * Debug Handlers * |
| * * |
| ************************************************************************/ |
| |
| /** |
| * isStandaloneDebug: |
| * @ctxt: An XML parser context |
| * |
| * Is this document tagged standalone ? |
| * |
| * Returns 1 if true |
| */ |
| static int |
| isStandaloneDebug(void *ctx ATTRIBUTE_UNUSED) |
| { |
| fprintf(stdout, "SAX.isStandalone()\n"); |
| return(0); |
| } |
| |
| /** |
| * hasInternalSubsetDebug: |
| * @ctxt: An XML parser context |
| * |
| * Does this document has an internal subset |
| * |
| * Returns 1 if true |
| */ |
| static int |
| hasInternalSubsetDebug(void *ctx ATTRIBUTE_UNUSED) |
| { |
| fprintf(stdout, "SAX.hasInternalSubset()\n"); |
| return(0); |
| } |
| |
| /** |
| * hasExternalSubsetDebug: |
| * @ctxt: An XML parser context |
| * |
| * Does this document has an external subset |
| * |
| * Returns 1 if true |
| */ |
| static int |
| hasExternalSubsetDebug(void *ctx ATTRIBUTE_UNUSED) |
| { |
| fprintf(stdout, "SAX.hasExternalSubset()\n"); |
| return(0); |
| } |
| |
| /** |
| * hasInternalSubsetDebug: |
| * @ctxt: An XML parser context |
| * |
| * Does this document has an internal subset |
| */ |
| static void |
| internalSubsetDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *name, |
| const xmlChar *ExternalID, const xmlChar *SystemID) |
| { |
| fprintf(stdout, "SAX.internalSubset(%s,", name); |
| if (ExternalID == NULL) |
| fprintf(stdout, " ,"); |
| else |
| fprintf(stdout, " %s,", ExternalID); |
| if (SystemID == NULL) |
| fprintf(stdout, " )\n"); |
| else |
| fprintf(stdout, " %s)\n", SystemID); |
| } |
| |
| /** |
| * resolveEntityDebug: |
| * @ctxt: An XML parser context |
| * @publicId: The public ID of the entity |
| * @systemId: The system ID of the entity |
| * |
| * Special entity resolver, better left to the parser, it has |
| * more context than the application layer. |
| * The default behaviour is to NOT resolve the entities, in that case |
| * the ENTITY_REF nodes are built in the structure (and the parameter |
| * values). |
| * |
| * Returns the xmlParserInputPtr if inlined or NULL for DOM behaviour. |
| */ |
| static xmlParserInputPtr |
| resolveEntityDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *publicId, const xmlChar *systemId) |
| { |
| /* xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; */ |
| |
| |
| fprintf(stdout, "SAX.resolveEntity("); |
| if (publicId != NULL) |
| fprintf(stdout, "%s", (char *)publicId); |
| else |
| fprintf(stdout, " "); |
| if (systemId != NULL) |
| fprintf(stdout, ", %s)\n", (char *)systemId); |
| else |
| fprintf(stdout, ", )\n"); |
| /********* |
| if (systemId != NULL) { |
| return(xmlNewInputFromFile(ctxt, (char *) systemId)); |
| } |
| *********/ |
| return(NULL); |
| } |
| |
| /** |
| * getEntityDebug: |
| * @ctxt: An XML parser context |
| * @name: The entity name |
| * |
| * Get an entity by name |
| * |
| * Returns the xmlParserInputPtr if inlined or NULL for DOM behaviour. |
| */ |
| static xmlEntityPtr |
| getEntityDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *name) |
| { |
| fprintf(stdout, "SAX.getEntity(%s)\n", name); |
| return(NULL); |
| } |
| |
| /** |
| * getParameterEntityDebug: |
| * @ctxt: An XML parser context |
| * @name: The entity name |
| * |
| * Get a parameter entity by name |
| * |
| * Returns the xmlParserInputPtr |
| */ |
| static xmlEntityPtr |
| getParameterEntityDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *name) |
| { |
| fprintf(stdout, "SAX.getParameterEntity(%s)\n", name); |
| return(NULL); |
| } |
| |
| |
| /** |
| * entityDeclDebug: |
| * @ctxt: An XML parser context |
| * @name: the entity name |
| * @type: the entity type |
| * @publicId: The public ID of the entity |
| * @systemId: The system ID of the entity |
| * @content: the entity value (without processing). |
| * |
| * An entity definition has been parsed |
| */ |
| static void |
| entityDeclDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *name, int type, |
| const xmlChar *publicId, const xmlChar *systemId, xmlChar *content) |
| { |
| fprintf(stdout, "SAX.entityDecl(%s, %d, %s, %s, %s)\n", |
| name, type, publicId, systemId, content); |
| } |
| |
| /** |
| * attributeDeclDebug: |
| * @ctxt: An XML parser context |
| * @name: the attribute name |
| * @type: the attribute type |
| * |
| * An attribute definition has been parsed |
| */ |
| static void |
| attributeDeclDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *elem, const xmlChar *name, |
| int type, int def, const xmlChar *defaultValue, |
| xmlEnumerationPtr tree ATTRIBUTE_UNUSED) |
| { |
| fprintf(stdout, "SAX.attributeDecl(%s, %s, %d, %d, %s, ...)\n", |
| elem, name, type, def, defaultValue); |
| } |
| |
| /** |
| * elementDeclDebug: |
| * @ctxt: An XML parser context |
| * @name: the element name |
| * @type: the element type |
| * @content: the element value (without processing). |
| * |
| * An element definition has been parsed |
| */ |
| static void |
| elementDeclDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *name, int type, |
| xmlElementContentPtr content ATTRIBUTE_UNUSED) |
| { |
| fprintf(stdout, "SAX.elementDecl(%s, %d, ...)\n", |
| name, type); |
| } |
| |
| /** |
| * notationDeclDebug: |
| * @ctxt: An XML parser context |
| * @name: The name of the notation |
| * @publicId: The public ID of the entity |
| * @systemId: The system ID of the entity |
| * |
| * What to do when a notation declaration has been parsed. |
| */ |
| static void |
| notationDeclDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *name, |
| const xmlChar *publicId, const xmlChar *systemId) |
| { |
| fprintf(stdout, "SAX.notationDecl(%s, %s, %s)\n", |
| (char *) name, (char *) publicId, (char *) systemId); |
| } |
| |
| /** |
| * unparsedEntityDeclDebug: |
| * @ctxt: An XML parser context |
| * @name: The name of the entity |
| * @publicId: The public ID of the entity |
| * @systemId: The system ID of the entity |
| * @notationName: the name of the notation |
| * |
| * What to do when an unparsed entity declaration is parsed |
| */ |
| static void |
| unparsedEntityDeclDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *name, |
| const xmlChar *publicId, const xmlChar *systemId, |
| const xmlChar *notationName) |
| { |
| fprintf(stdout, "SAX.unparsedEntityDecl(%s, %s, %s, %s)\n", |
| (char *) name, (char *) publicId, (char *) systemId, |
| (char *) notationName); |
| } |
| |
| /** |
| * setDocumentLocatorDebug: |
| * @ctxt: An XML parser context |
| * @loc: A SAX Locator |
| * |
| * Receive the document locator at startup, actually xmlDefaultSAXLocator |
| * Everything is available on the context, so this is useless in our case. |
| */ |
| static void |
| setDocumentLocatorDebug(void *ctx ATTRIBUTE_UNUSED, xmlSAXLocatorPtr loc ATTRIBUTE_UNUSED) |
| { |
| fprintf(stdout, "SAX.setDocumentLocator()\n"); |
| } |
| |
| /** |
| * startDocumentDebug: |
| * @ctxt: An XML parser context |
| * |
| * called when the document start being processed. |
| */ |
| static void |
| startDocumentDebug(void *ctx ATTRIBUTE_UNUSED) |
| { |
| fprintf(stdout, "SAX.startDocument()\n"); |
| } |
| |
| /** |
| * endDocumentDebug: |
| * @ctxt: An XML parser context |
| * |
| * called when the document end has been detected. |
| */ |
| static void |
| endDocumentDebug(void *ctx ATTRIBUTE_UNUSED) |
| { |
| fprintf(stdout, "SAX.endDocument()\n"); |
| } |
| |
| /** |
| * startElementDebug: |
| * @ctxt: An XML parser context |
| * @name: The element name |
| * |
| * called when an opening tag has been processed. |
| */ |
| static void |
| startElementDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *name, const xmlChar **atts) |
| { |
| int i; |
| |
| fprintf(stdout, "SAX.startElement(%s", (char *) name); |
| if (atts != NULL) { |
| for (i = 0;(atts[i] != NULL);i++) { |
| fprintf(stdout, ", %s", atts[i++]); |
| if (atts[i] != NULL) { |
| unsigned char output[40]; |
| const unsigned char *att = atts[i]; |
| int outlen, attlen; |
| fprintf(stdout, "='"); |
| while ((attlen = strlen((char*)att)) > 0) { |
| outlen = sizeof output - 1; |
| htmlEncodeEntities(output, &outlen, att, &attlen, '\''); |
| output[outlen] = 0; |
| fprintf(stdout, "%s", (char *) output); |
| att += attlen; |
| } |
| fprintf(stdout, "'"); |
| } |
| } |
| } |
| fprintf(stdout, ")\n"); |
| } |
| |
| /** |
| * endElementDebug: |
| * @ctxt: An XML parser context |
| * @name: The element name |
| * |
| * called when the end of an element has been detected. |
| */ |
| static void |
| endElementDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *name) |
| { |
| fprintf(stdout, "SAX.endElement(%s)\n", (char *) name); |
| } |
| |
| /** |
| * charactersDebug: |
| * @ctxt: An XML parser context |
| * @ch: a xmlChar string |
| * @len: the number of xmlChar |
| * |
| * receiving some chars from the parser. |
| * Question: how much at a time ??? |
| */ |
| static void |
| charactersDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *ch, int len) |
| { |
| unsigned char output[40]; |
| int inlen = len, outlen = 30; |
| |
| htmlEncodeEntities(output, &outlen, ch, &inlen, 0); |
| output[outlen] = 0; |
| |
| fprintf(stdout, "SAX.characters(%s, %d)\n", output, len); |
| } |
| |
| /** |
| * cdataDebug: |
| * @ctxt: An XML parser context |
| * @ch: a xmlChar string |
| * @len: the number of xmlChar |
| * |
| * receiving some cdata chars from the parser. |
| * Question: how much at a time ??? |
| */ |
| static void |
| cdataDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *ch, int len) |
| { |
| unsigned char output[40]; |
| int inlen = len, outlen = 30; |
| |
| htmlEncodeEntities(output, &outlen, ch, &inlen, 0); |
| output[outlen] = 0; |
| |
| fprintf(stdout, "SAX.cdata(%s, %d)\n", output, len); |
| } |
| |
| /** |
| * referenceDebug: |
| * @ctxt: An XML parser context |
| * @name: The entity name |
| * |
| * called when an entity reference is detected. |
| */ |
| static void |
| referenceDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *name) |
| { |
| fprintf(stdout, "SAX.reference(%s)\n", name); |
| } |
| |
| /** |
| * ignorableWhitespaceDebug: |
| * @ctxt: An XML parser context |
| * @ch: a xmlChar string |
| * @start: the first char in the string |
| * @len: the number of xmlChar |
| * |
| * receiving some ignorable whitespaces from the parser. |
| * Question: how much at a time ??? |
| */ |
| static void |
| ignorableWhitespaceDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *ch, int len) |
| { |
| char output[40]; |
| int i; |
| |
| for (i = 0;(i<len) && (i < 30);i++) |
| output[i] = ch[i]; |
| output[i] = 0; |
| |
| fprintf(stdout, "SAX.ignorableWhitespace(%s, %d)\n", output, len); |
| } |
| |
| /** |
| * processingInstructionDebug: |
| * @ctxt: An XML parser context |
| * @target: the target name |
| * @data: the PI data's |
| * @len: the number of xmlChar |
| * |
| * A processing instruction has been parsed. |
| */ |
| static void |
| processingInstructionDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *target, |
| const xmlChar *data) |
| { |
| fprintf(stdout, "SAX.processingInstruction(%s, %s)\n", |
| (char *) target, (char *) data); |
| } |
| |
| /** |
| * commentDebug: |
| * @ctxt: An XML parser context |
| * @value: the comment content |
| * |
| * A comment has been parsed. |
| */ |
| static void |
| commentDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *value) |
| { |
| fprintf(stdout, "SAX.comment(%s)\n", value); |
| } |
| |
| /** |
| * warningDebug: |
| * @ctxt: An XML parser context |
| * @msg: the message to display/transmit |
| * @...: extra parameters for the message display |
| * |
| * Display and format a warning messages, gives file, line, position and |
| * extra parameters. |
| */ |
| static void |
| warningDebug(void *ctx ATTRIBUTE_UNUSED, const char *msg, ...) |
| { |
| va_list args; |
| |
| va_start(args, msg); |
| fprintf(stdout, "SAX.warning: "); |
| vfprintf(stdout, msg, args); |
| va_end(args); |
| } |
| |
| /** |
| * errorDebug: |
| * @ctxt: An XML parser context |
| * @msg: the message to display/transmit |
| * @...: extra parameters for the message display |
| * |
| * Display and format a error messages, gives file, line, position and |
| * extra parameters. |
| */ |
| static void |
| errorDebug(void *ctx ATTRIBUTE_UNUSED, const char *msg, ...) |
| { |
| va_list args; |
| |
| va_start(args, msg); |
| fprintf(stdout, "SAX.error: "); |
| vfprintf(stdout, msg, args); |
| va_end(args); |
| } |
| |
| /** |
| * fatalErrorDebug: |
| * @ctxt: An XML parser context |
| * @msg: the message to display/transmit |
| * @...: extra parameters for the message display |
| * |
| * Display and format a fatalError messages, gives file, line, position and |
| * extra parameters. |
| */ |
| static void |
| fatalErrorDebug(void *ctx ATTRIBUTE_UNUSED, const char *msg, ...) |
| { |
| va_list args; |
| |
| va_start(args, msg); |
| fprintf(stdout, "SAX.fatalError: "); |
| vfprintf(stdout, msg, args); |
| va_end(args); |
| } |
| |
| xmlSAXHandler debugSAXHandlerStruct = { |
| internalSubsetDebug, |
| isStandaloneDebug, |
| hasInternalSubsetDebug, |
| hasExternalSubsetDebug, |
| resolveEntityDebug, |
| getEntityDebug, |
| entityDeclDebug, |
| notationDeclDebug, |
| attributeDeclDebug, |
| elementDeclDebug, |
| unparsedEntityDeclDebug, |
| setDocumentLocatorDebug, |
| startDocumentDebug, |
| endDocumentDebug, |
| startElementDebug, |
| endElementDebug, |
| referenceDebug, |
| charactersDebug, |
| ignorableWhitespaceDebug, |
| processingInstructionDebug, |
| commentDebug, |
| warningDebug, |
| errorDebug, |
| fatalErrorDebug, |
| getParameterEntityDebug, |
| cdataDebug, |
| NULL, |
| 1, |
| NULL, |
| NULL, |
| NULL, |
| NULL |
| }; |
| |
| xmlSAXHandlerPtr debugSAXHandler = &debugSAXHandlerStruct; |
| /************************************************************************ |
| * * |
| * Debug * |
| * * |
| ************************************************************************/ |
| |
| static void |
| parseSAXFile(char *filename) { |
| htmlDocPtr doc = NULL; |
| |
| /* |
| * Empty callbacks for checking |
| */ |
| #ifdef LIBXML_PUSH_ENABLED |
| if (push) { |
| FILE *f; |
| |
| f = fopen(filename, "r"); |
| if (f != NULL) { |
| int res, size = 3; |
| char chars[4096]; |
| htmlParserCtxtPtr ctxt; |
| |
| /* if (repeat) */ |
| size = 4096; |
| res = fread(chars, 1, 4, f); |
| if (res > 0) { |
| ctxt = htmlCreatePushParserCtxt(emptySAXHandler, NULL, |
| chars, res, filename, XML_CHAR_ENCODING_NONE); |
| while ((res = fread(chars, 1, size, f)) > 0) { |
| htmlParseChunk(ctxt, chars, res, 0); |
| } |
| htmlParseChunk(ctxt, chars, 0, 1); |
| doc = ctxt->myDoc; |
| htmlFreeParserCtxt(ctxt); |
| } |
| if (doc != NULL) { |
| fprintf(stdout, "htmlSAXParseFile returned non-NULL\n"); |
| xmlFreeDoc(doc); |
| } |
| fclose(f); |
| } |
| if (!noout) { |
| f = fopen(filename, "r"); |
| if (f != NULL) { |
| int res, size = 3; |
| char chars[4096]; |
| htmlParserCtxtPtr ctxt; |
| |
| /* if (repeat) */ |
| size = 4096; |
| res = fread(chars, 1, 4, f); |
| if (res > 0) { |
| ctxt = htmlCreatePushParserCtxt(debugSAXHandler, NULL, |
| chars, res, filename, XML_CHAR_ENCODING_NONE); |
| while ((res = fread(chars, 1, size, f)) > 0) { |
| htmlParseChunk(ctxt, chars, res, 0); |
| } |
| htmlParseChunk(ctxt, chars, 0, 1); |
| doc = ctxt->myDoc; |
| htmlFreeParserCtxt(ctxt); |
| } |
| if (doc != NULL) { |
| fprintf(stdout, "htmlSAXParseFile returned non-NULL\n"); |
| xmlFreeDoc(doc); |
| } |
| fclose(f); |
| } |
| } |
| } else { |
| #endif /* LIBXML_PUSH_ENABLED */ |
| doc = htmlSAXParseFile(filename, NULL, emptySAXHandler, NULL); |
| if (doc != NULL) { |
| fprintf(stdout, "htmlSAXParseFile returned non-NULL\n"); |
| xmlFreeDoc(doc); |
| } |
| |
| if (!noout) { |
| /* |
| * Debug callback |
| */ |
| doc = htmlSAXParseFile(filename, NULL, debugSAXHandler, NULL); |
| if (doc != NULL) { |
| fprintf(stdout, "htmlSAXParseFile returned non-NULL\n"); |
| xmlFreeDoc(doc); |
| } |
| } |
| #ifdef LIBXML_PUSH_ENABLED |
| } |
| #endif /* LIBXML_PUSH_ENABLED */ |
| } |
| |
| static void |
| parseAndPrintFile(char *filename) { |
| htmlDocPtr doc = NULL, tmp; |
| |
| /* |
| * build an HTML tree from a string; |
| */ |
| #ifdef LIBXML_PUSH_ENABLED |
| if (push) { |
| FILE *f; |
| |
| f = fopen(filename, "r"); |
| if (f != NULL) { |
| int res, size = 3; |
| char chars[4096]; |
| htmlParserCtxtPtr ctxt; |
| |
| /* if (repeat) */ |
| size = 4096; |
| res = fread(chars, 1, 4, f); |
| if (res > 0) { |
| ctxt = htmlCreatePushParserCtxt(NULL, NULL, |
| chars, res, filename, XML_CHAR_ENCODING_NONE); |
| while ((res = fread(chars, 1, size, f)) > 0) { |
| htmlParseChunk(ctxt, chars, res, 0); |
| } |
| htmlParseChunk(ctxt, chars, 0, 1); |
| doc = ctxt->myDoc; |
| htmlFreeParserCtxt(ctxt); |
| } |
| fclose(f); |
| } |
| } else { |
| doc = htmlReadFile(filename, NULL, options); |
| } |
| #else |
| doc = htmlReadFile(filename,NULL,options); |
| #endif |
| if (doc == NULL) { |
| xmlGenericError(xmlGenericErrorContext, |
| "Could not parse %s\n", filename); |
| } |
| |
| /* |
| * test intermediate copy if needed. |
| */ |
| if (copy) { |
| tmp = doc; |
| doc = xmlCopyDoc(doc, 1); |
| xmlFreeDoc(tmp); |
| } |
| |
| #ifdef LIBXML_OUTPUT_ENABLED |
| /* |
| * print it. |
| */ |
| if (!noout) { |
| #ifdef LIBXML_DEBUG_ENABLED |
| if (!debug) { |
| if (encoding) |
| htmlSaveFileEnc("-", doc, encoding); |
| else |
| htmlDocDump(stdout, doc); |
| } else |
| xmlDebugDumpDocument(stdout, doc); |
| #else |
| if (encoding) |
| htmlSaveFileEnc("-", doc, encoding); |
| else |
| htmlDocDump(stdout, doc); |
| #endif |
| } |
| #endif /* LIBXML_OUTPUT_ENABLED */ |
| |
| /* |
| * free it. |
| */ |
| xmlFreeDoc(doc); |
| } |
| |
| int main(int argc, char **argv) { |
| int i, count; |
| int files = 0; |
| |
| for (i = 1; i < argc ; i++) { |
| #ifdef LIBXML_DEBUG_ENABLED |
| if ((!strcmp(argv[i], "-debug")) || (!strcmp(argv[i], "--debug"))) |
| debug++; |
| else |
| #endif |
| if ((!strcmp(argv[i], "-copy")) || (!strcmp(argv[i], "--copy"))) |
| copy++; |
| #ifdef LIBXML_PUSH_ENABLED |
| else if ((!strcmp(argv[i], "-push")) || (!strcmp(argv[i], "--push"))) |
| push++; |
| #endif /* LIBXML_PUSH_ENABLED */ |
| else if ((!strcmp(argv[i], "-sax")) || (!strcmp(argv[i], "--sax"))) |
| sax++; |
| else if ((!strcmp(argv[i], "-noout")) || (!strcmp(argv[i], "--noout"))) |
| noout++; |
| else if ((!strcmp(argv[i], "-repeat")) || |
| (!strcmp(argv[i], "--repeat"))) |
| repeat++; |
| else if ((!strcmp(argv[i], "-encode")) || |
| (!strcmp(argv[i], "--encode"))) { |
| i++; |
| encoding = argv[i]; |
| } |
| } |
| for (i = 1; i < argc ; i++) { |
| if ((!strcmp(argv[i], "-encode")) || |
| (!strcmp(argv[i], "--encode"))) { |
| i++; |
| continue; |
| } |
| if (argv[i][0] != '-') { |
| if (repeat) { |
| for (count = 0;count < 100 * repeat;count++) { |
| if (sax) |
| parseSAXFile(argv[i]); |
| else |
| parseAndPrintFile(argv[i]); |
| } |
| } else { |
| if (sax) |
| parseSAXFile(argv[i]); |
| else |
| parseAndPrintFile(argv[i]); |
| } |
| files ++; |
| } |
| } |
| if (files == 0) { |
| printf("Usage : %s [--debug] [--copy] [--copy] HTMLfiles ...\n", |
| argv[0]); |
| printf("\tParse the HTML files and output the result of the parsing\n"); |
| #ifdef LIBXML_DEBUG_ENABLED |
| printf("\t--debug : dump a debug tree of the in-memory document\n"); |
| #endif |
| printf("\t--copy : used to test the internal copy implementation\n"); |
| printf("\t--sax : debug the sequence of SAX callbacks\n"); |
| printf("\t--repeat : parse the file 100 times, for timing\n"); |
| printf("\t--noout : do not print the result\n"); |
| #ifdef LIBXML_PUSH_ENABLED |
| printf("\t--push : use the push mode parser\n"); |
| #endif /* LIBXML_PUSH_ENABLED */ |
| printf("\t--encode encoding : output in the given encoding\n"); |
| } |
| xmlCleanupParser(); |
| xmlMemoryDump(); |
| |
| return(0); |
| } |
| #else /* !LIBXML_HTML_ENABLED */ |
| #include <stdio.h> |
| int main(int argc ATTRIBUTE_UNUSED, char **argv ATTRIBUTE_UNUSED) { |
| printf("%s : HTML support not compiled in\n", argv[0]); |
| return(0); |
| } |
| #endif |