More cleanup of the HTML parser to force it not to bypass SAX. Daniel.
Ready for 2.1.1, it seems.
diff --git a/valid.c b/valid.c
index 5dc37ed..5235991 100644
--- a/valid.c
+++ b/valid.c
@@ -2031,6 +2031,9 @@
             ((attr->name[1] == 'D') || (attr->name[1] == 'd')) &&
 	    (attr->name[2] == 0)) return(1);
 	 *******************/
+    } else if (doc->type == XML_HTML_DOCUMENT_NODE) {
+	/* TODO @@@ */
+	return(0);    
     } else {
 	xmlAttributePtr attrDecl;