Added a bunch of missing testsuite-related files, Daniel.
diff --git a/SAXresult/dtd13 b/SAXresult/dtd13
new file mode 100644
index 0000000..3cf024e
--- /dev/null
+++ b/SAXresult/dtd13
@@ -0,0 +1,9 @@
+SAX.setDocumentLocator()
+SAX.startDocument()
+SAX.comment( comment before the DTD )
+SAX.internalSubset(doc, (null), (null))
+SAX.elementDecl(doc, 2, ...)
+SAX.comment( comment after the DTD )
+SAX.startElement(doc)
+SAX.endElement(doc)
+SAX.endDocument()
diff --git a/SAXresult/isolat1 b/SAXresult/isolat1
new file mode 100644
index 0000000..51290e0
--- /dev/null
+++ b/SAXresult/isolat1
@@ -0,0 +1,6 @@
+SAX.setDocumentLocator()
+SAX.startDocument()
+SAX.startElement(très)
+SAX.characters(là, 3)
+SAX.endElement(très)
+SAX.endDocument()
diff --git a/SAXresult/isolat2 b/SAXresult/isolat2
new file mode 100644
index 0000000..109b881
--- /dev/null
+++ b/SAXresult/isolat2
@@ -0,0 +1,17 @@
+SAX.setDocumentLocator()
+SAX.startDocument()
+SAX.startElement(tst)
+SAX.characters(
+
+       The following table d, 1000)
+SAX.characters( SIGN
+       257   175   AF   , 1000)
+SAX.characters(LETTER A WITH ACUTE
+       302, 1000)
+SAX.characters( D0     Ð     LATIN CAPITAL L, 1000)
+SAX.characters(  ß     LATIN SMALL LETTER SH, 1000)
+SAX.characters(SMALL LETTER I WITH CIRCUMFLEX, 1000)
+SAX.characters(E
+       376   254   FE     þ, 130)
+SAX.endElement(tst)
+SAX.endDocument()
diff --git a/SAXresult/isolat3 b/SAXresult/isolat3
new file mode 100644
index 0000000..0bea68d
--- /dev/null
+++ b/SAXresult/isolat3
@@ -0,0 +1,25 @@
+SAX.setDocumentLocator()
+SAX.startDocument()
+SAX.startElement(rec)
+SAX.characters(
+, 1)
+SAX.startElement(eg)
+SAX.endElement(eg)
+SAX.characters(
+then the replacement text for, 43)
+SAX.startElement(code)
+SAX.characters(book, 4)
+SAX.endElement(code)
+SAX.characters(" is:
+, 6)
+SAX.startElement(eg)
+SAX.characters(La Peste: Albert Camus, 
+© 19, 54)
+SAX.getEntity(amp)
+SAX.characters(&, 1)
+SAX.characters(rights;, 7)
+SAX.endElement(eg)
+SAX.characters(
+, 1)
+SAX.endElement(rec)
+SAX.endDocument()
diff --git a/SAXresult/title.xml b/SAXresult/title.xml
new file mode 100644
index 0000000..2af71e9
--- /dev/null
+++ b/SAXresult/title.xml
@@ -0,0 +1,6 @@
+SAX.setDocumentLocator()
+SAX.startDocument()
+SAX.startElement(title)
+SAX.characters(my title, 8)
+SAX.endElement(title)
+SAX.endDocument()
diff --git a/SAXresult/wml.xml b/SAXresult/wml.xml
new file mode 100644
index 0000000..102b807
--- /dev/null
+++ b/SAXresult/wml.xml
@@ -0,0 +1,28 @@
+SAX.setDocumentLocator()
+SAX.startDocument()
+SAX.internalSubset(wml, -//WAPFORUM//DTD WML 1.1//EN, http://www.wapforum.org/DTD/wml_1.1.xml)
+SAX.startElement(wml)
+SAX.characters(
+  , 3)
+SAX.startElement(card, id='card1', title='Rubriques 75008')
+SAX.characters(
+	, 2)
+SAX.startElement(p)
+SAX.characters(
+		, 3)
+SAX.startElement(a, href='rubmenu.asp?CP=75008&RB=01')
+SAX.characters(Cinéma, 7)
+SAX.endElement(a)
+SAX.startElement(br)
+SAX.endElement(br)
+SAX.characters(
+	, 2)
+SAX.endElement(p)
+SAX.characters(
+
+, 2)
+SAX.endElement(card)
+SAX.characters(
+, 1)
+SAX.endElement(wml)
+SAX.endDocument()
diff --git a/result/HTML/autoclose.html b/result/HTML/autoclose.html
new file mode 100644
index 0000000..f2cf579
--- /dev/null
+++ b/result/HTML/autoclose.html
@@ -0,0 +1,2 @@
+<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.0 Transitional//EN" "http://www.w3.org/TR/REC-html40/loose.dtd">
+<html><body><hr></body></html>
diff --git a/result/HTML/autoclose.html.err b/result/HTML/autoclose.html.err
new file mode 100644
index 0000000..e69de29
--- /dev/null
+++ b/result/HTML/autoclose.html.err
diff --git a/result/HTML/autoclose2.html b/result/HTML/autoclose2.html
new file mode 100644
index 0000000..dfea5f9
--- /dev/null
+++ b/result/HTML/autoclose2.html
@@ -0,0 +1,3 @@
+<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.0 Transitional//EN" "http://www.w3.org/TR/REC-html40/loose.dtd">
+<html><body><p>toto
+</p></body></html>
diff --git a/result/HTML/autoclose2.html.err b/result/HTML/autoclose2.html.err
new file mode 100644
index 0000000..e69de29
--- /dev/null
+++ b/result/HTML/autoclose2.html.err
diff --git a/result/HTML/autoclose3.html b/result/HTML/autoclose3.html
new file mode 100644
index 0000000..d168183
--- /dev/null
+++ b/result/HTML/autoclose3.html
@@ -0,0 +1,7 @@
+<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.0 Transitional//EN" "http://www.w3.org/TR/REC-html40/loose.dtd">
+<html><body><ul>
+<li>item 1
+</li>
+<li>item 2
+</li>
+</ul></body></html>
diff --git a/result/HTML/autoclose3.html.err b/result/HTML/autoclose3.html.err
new file mode 100644
index 0000000..09b9e33
--- /dev/null
+++ b/result/HTML/autoclose3.html.err
@@ -0,0 +1,3 @@
+./test/HTML/autoclose3.html:4: error: Opening and ending tag mismatch: body and ul
+
+^
diff --git a/result/VC/NS1 b/result/VC/NS1
new file mode 100644
index 0000000..e69de29
--- /dev/null
+++ b/result/VC/NS1
diff --git a/result/VC/NS2 b/result/VC/NS2
new file mode 100644
index 0000000..5baa4dc
--- /dev/null
+++ b/result/VC/NS2
@@ -0,0 +1,3 @@
+./test/VC/NS2:9: validity error: No declaration for attribute attr on element doc
+<ns:doc ns:attr="val" xmlns:ns="http://www.example.org/test/">
+                                                             ^
diff --git a/result/isolat1 b/result/isolat1
new file mode 100644
index 0000000..1e5a059
--- /dev/null
+++ b/result/isolat1
@@ -0,0 +1,2 @@
+<?xml version="1.0" encoding="ISO-8859-1"?>
+<très>là</très>
diff --git a/result/isolat2 b/result/isolat2
new file mode 100644
index 0000000..8c290b9
--- /dev/null
+++ b/result/isolat2
@@ -0,0 +1,107 @@
+<?xml version="1.0" encoding="ISO-8859-1"?>
+<tst>
+
+       The following table displays the characters  in  ISO  8859
+       Latin-1,  which are printable and unlisted in the ascii
+       manual page.
+
+       Oct   Dec   Hex   Char   Description
+       --------------------------------------------------------------------
+       240   160   A0           NO-BREAK SPACE
+       241   161   A1     ¡     INVERTED EXCLAMATION MARK
+       242   162   A2     ¢     CENT SIGN
+       243   163   A3     £     POUND SIGN
+       244   164   A4     ¤     CURRENCY SIGN
+       245   165   A5     ¥     YEN SIGN
+       246   166   A6     ¦     BROKEN BAR
+       247   167   A7     §     SECTION SIGN
+       250   168   A8     ¨     DIAERESIS
+       251   169   A9     ©     COPYRIGHT SIGN
+       252   170   AA     ª     FEMININE ORDINAL INDICATOR
+       253   171   AB     «     LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
+       254   172   AC     ¬     NOT SIGN
+       255   173   AD     ­     SOFT HYPHEN
+       256   174   AE     ®     REGISTERED SIGN
+       257   175   AF     ¯     MACRON
+       260   176   B0     °     DEGREE SIGN
+       261   177   B1     ±     PLUS-MINUS SIGN
+       262   178   B2     ²     SUPERSCRIPT TWO
+       263   179   B3     ³     SUPERSCRIPT THREE
+       264   180   B4     ´     ACUTE ACCENT
+       265   181   B5     µ     MICRO SIGN
+       266   182   B6     ¶     PILCROW SIGN
+       267   183   B7     ·     MIDDLE DOT
+       270   184   B8     ¸     CEDILLA
+       271   185   B9     ¹     SUPERSCRIPT ONE
+       272   186   BA     º     MASCULINE ORDINAL INDICATOR
+       273   187   BB     »     RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
+       274   188   BC     ¼     VULGAR FRACTION ONE QUARTER
+       275   189   BD     ½     VULGAR FRACTION ONE HALF
+       276   190   BE     ¾     VULGAR FRACTION THREE QUARTERS
+       277   191   BF     ¿     INVERTED QUESTION MARK
+       300   192   C0     À     LATIN CAPITAL LETTER A WITH GRAVE
+       301   193   C1     Á     LATIN CAPITAL LETTER A WITH ACUTE
+       302   194   C2     Â     LATIN CAPITAL LETTER A WITH CIRCUMFLEX
+       303   195   C3     Ã     LATIN CAPITAL LETTER A WITH TILDE
+       304   196   C4     Ä     LATIN CAPITAL LETTER A WITH DIAERESIS
+       305   197   C5     Å     LATIN CAPITAL LETTER A WITH RING ABOVE
+       306   198   C6     Æ     LATIN CAPITAL LETTER AE
+       307   199   C7     Ç     LATIN CAPITAL LETTER C WITH CEDILLA
+       310   200   C8     È     LATIN CAPITAL LETTER E WITH GRAVE
+       311   201   C9     É     LATIN CAPITAL LETTER E WITH ACUTE
+       312   202   CA     Ê     LATIN CAPITAL LETTER E WITH CIRCUMFLEX
+       313   203   CB     Ë     LATIN CAPITAL LETTER E WITH DIAERESIS
+       314   204   CC     Ì     LATIN CAPITAL LETTER I WITH GRAVE
+       315   205   CD     Í     LATIN CAPITAL LETTER I WITH ACUTE
+       316   206   CE     Î     LATIN CAPITAL LETTER I WITH CIRCUMFLEX
+       317   207   CF     Ï     LATIN CAPITAL LETTER I WITH DIAERESIS
+       320   208   D0     Ð     LATIN CAPITAL LETTER ETH
+       321   209   D1     Ñ     LATIN CAPITAL LETTER N WITH TILDE
+       322   210   D2     Ò     LATIN CAPITAL LETTER O WITH GRAVE
+       323   211   D3     Ó     LATIN CAPITAL LETTER O WITH ACUTE
+       324   212   D4     Ô     LATIN CAPITAL LETTER O WITH CIRCUMFLEX
+       325   213   D5     Õ     LATIN CAPITAL LETTER O WITH TILDE
+       326   214   D6     Ö     LATIN CAPITAL LETTER O WITH DIAERESIS
+       327   215   D7     ×     MULTIPLICATION SIGN
+       330   216   D8     Ø     LATIN CAPITAL LETTER O WITH STROKE
+       331   217   D9     Ù     LATIN CAPITAL LETTER U WITH GRAVE
+       332   218   DA     Ú     LATIN CAPITAL LETTER U WITH ACUTE
+       333   219   DB     Û     LATIN CAPITAL LETTER U WITH CIRCUMFLEX
+       334   220   DC     Ü     LATIN CAPITAL LETTER U WITH DIAERESIS
+       335   221   DD     Ý     LATIN CAPITAL LETTER Y WITH ACUTE
+       336   222   DE     Þ     LATIN CAPITAL LETTER THORN
+       337   223   DF     ß     LATIN SMALL LETTER SHARP S
+       340   224   E0     à     LATIN SMALL LETTER A WITH GRAVE
+       341   225   E1     á     LATIN SMALL LETTER A WITH ACUTE
+       342   226   E2     â     LATIN SMALL LETTER A WITH CIRCUMFLEX
+       343   227   E3     ã     LATIN SMALL LETTER A WITH TILDE
+       344   228   E4     ä     LATIN SMALL LETTER A WITH DIAERESIS
+       345   229   E5     å     LATIN SMALL LETTER A WITH RING ABOVE
+       346   230   E6     æ     LATIN SMALL LETTER AE
+       347   231   E7     ç     LATIN SMALL LETTER C WITH CEDILLA
+       350   232   E8     è     LATIN SMALL LETTER E WITH GRAVE
+       351   233   E9     é     LATIN SMALL LETTER E WITH ACUTE
+       352   234   EA     ê     LATIN SMALL LETTER E WITH CIRCUMFLEX
+       353   235   EB     ë     LATIN SMALL LETTER E WITH DIAERESIS
+       354   236   EC     ì     LATIN SMALL LETTER I WITH GRAVE
+       355   237   ED     í     LATIN SMALL LETTER I WITH ACUTE
+       356   238   EE     î     LATIN SMALL LETTER I WITH CIRCUMFLEX
+       357   239   EF     ï     LATIN SMALL LETTER I WITH DIAERESIS
+       360   240   F0     ð     LATIN SMALL LETTER ETH
+       361   241   F1     ñ     LATIN SMALL LETTER N WITH TILDE
+       362   242   F2     ò     LATIN SMALL LETTER O WITH GRAVE
+       363   243   F3     ó     LATIN SMALL LETTER O WITH ACUTE
+       364   244   F4     ô     LATIN SMALL LETTER O WITH CIRCUMFLEX
+       365   245   F5     õ     LATIN SMALL LETTER O WITH TILDE
+       366   246   F6     ö     LATIN SMALL LETTER O WITH DIAERESIS
+       367   247   F7     ÷     DIVISION SIGN
+       370   248   F8     ø     LATIN SMALL LETTER O WITH STROKE
+       371   249   F9     ù     LATIN SMALL LETTER U WITH GRAVE
+       372   250   FA     ú     LATIN SMALL LETTER U WITH ACUTE
+       373   251   FB     û     LATIN SMALL LETTER U WITH CIRCUMFLEX
+       374   252   FC     ü     LATIN SMALL LETTER U WITH DIAERESIS
+       375   253   FD     ý     LATIN SMALL LETTER Y WITH ACUTE
+       376   254   FE     þ     LATIN SMALL LETTER THORN
+       377   255   FF     ÿ     LATIN SMALL LETTER Y WITH DIAERESIS
+
+</tst>
diff --git a/result/isolat3 b/result/isolat3
new file mode 100644
index 0000000..9d5bb5b
--- /dev/null
+++ b/result/isolat3
@@ -0,0 +1,10 @@
+<?xml version="1.0" encoding="ISO-8859-1"?>
+<rec>
+<eg><![CDATA[<!ENTITY % pub    "&#xc9;ditions Gallimard" >
+<!ENTITY   rights "All rights reserved" >
+<!ENTITY   book   "La Peste: Albert Camus, 
+&#xA9; 1947 %pub;. &rights;" >]]></eg>
+then the replacement text for the entity &quot;<code>book</code>&quot; is:
+<eg>La Peste: Albert Camus, 
+© 1947 Éditions Gallimard. &amp;rights;</eg>
+</rec>
diff --git a/result/noent/att1 b/result/noent/att1
new file mode 100644
index 0000000..00aa6be
--- /dev/null
+++ b/result/noent/att1
@@ -0,0 +1,2 @@
+<?xml version="1.0"?>
+<doc attr="to normalize with a    space"/>
diff --git a/result/noent/att2 b/result/noent/att2
new file mode 100644
index 0000000..28989a2
--- /dev/null
+++ b/result/noent/att2
@@ -0,0 +1,2 @@
+<?xml version="1.0"?>
+<doc attr="to normalize   with a space"/>
diff --git a/result/noent/dtd13 b/result/noent/dtd13
new file mode 100644
index 0000000..2814146
--- /dev/null
+++ b/result/noent/dtd13
@@ -0,0 +1,7 @@
+<?xml version="1.0"?>
+<!-- comment before the DTD -->
+<!DOCTYPE doc [
+<!ELEMENT doc ANY>
+]>
+<!-- comment after the DTD -->
+<doc/>
diff --git a/result/noent/isolat1 b/result/noent/isolat1
new file mode 100644
index 0000000..1e5a059
--- /dev/null
+++ b/result/noent/isolat1
@@ -0,0 +1,2 @@
+<?xml version="1.0" encoding="ISO-8859-1"?>
+<très>là</très>
diff --git a/result/noent/isolat2 b/result/noent/isolat2
new file mode 100644
index 0000000..8c290b9
--- /dev/null
+++ b/result/noent/isolat2
@@ -0,0 +1,107 @@
+<?xml version="1.0" encoding="ISO-8859-1"?>
+<tst>
+
+       The following table displays the characters  in  ISO  8859
+       Latin-1,  which are printable and unlisted in the ascii
+       manual page.
+
+       Oct   Dec   Hex   Char   Description
+       --------------------------------------------------------------------
+       240   160   A0           NO-BREAK SPACE
+       241   161   A1     ¡     INVERTED EXCLAMATION MARK
+       242   162   A2     ¢     CENT SIGN
+       243   163   A3     £     POUND SIGN
+       244   164   A4     ¤     CURRENCY SIGN
+       245   165   A5     ¥     YEN SIGN
+       246   166   A6     ¦     BROKEN BAR
+       247   167   A7     §     SECTION SIGN
+       250   168   A8     ¨     DIAERESIS
+       251   169   A9     ©     COPYRIGHT SIGN
+       252   170   AA     ª     FEMININE ORDINAL INDICATOR
+       253   171   AB     «     LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
+       254   172   AC     ¬     NOT SIGN
+       255   173   AD     ­     SOFT HYPHEN
+       256   174   AE     ®     REGISTERED SIGN
+       257   175   AF     ¯     MACRON
+       260   176   B0     °     DEGREE SIGN
+       261   177   B1     ±     PLUS-MINUS SIGN
+       262   178   B2     ²     SUPERSCRIPT TWO
+       263   179   B3     ³     SUPERSCRIPT THREE
+       264   180   B4     ´     ACUTE ACCENT
+       265   181   B5     µ     MICRO SIGN
+       266   182   B6     ¶     PILCROW SIGN
+       267   183   B7     ·     MIDDLE DOT
+       270   184   B8     ¸     CEDILLA
+       271   185   B9     ¹     SUPERSCRIPT ONE
+       272   186   BA     º     MASCULINE ORDINAL INDICATOR
+       273   187   BB     »     RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
+       274   188   BC     ¼     VULGAR FRACTION ONE QUARTER
+       275   189   BD     ½     VULGAR FRACTION ONE HALF
+       276   190   BE     ¾     VULGAR FRACTION THREE QUARTERS
+       277   191   BF     ¿     INVERTED QUESTION MARK
+       300   192   C0     À     LATIN CAPITAL LETTER A WITH GRAVE
+       301   193   C1     Á     LATIN CAPITAL LETTER A WITH ACUTE
+       302   194   C2     Â     LATIN CAPITAL LETTER A WITH CIRCUMFLEX
+       303   195   C3     Ã     LATIN CAPITAL LETTER A WITH TILDE
+       304   196   C4     Ä     LATIN CAPITAL LETTER A WITH DIAERESIS
+       305   197   C5     Å     LATIN CAPITAL LETTER A WITH RING ABOVE
+       306   198   C6     Æ     LATIN CAPITAL LETTER AE
+       307   199   C7     Ç     LATIN CAPITAL LETTER C WITH CEDILLA
+       310   200   C8     È     LATIN CAPITAL LETTER E WITH GRAVE
+       311   201   C9     É     LATIN CAPITAL LETTER E WITH ACUTE
+       312   202   CA     Ê     LATIN CAPITAL LETTER E WITH CIRCUMFLEX
+       313   203   CB     Ë     LATIN CAPITAL LETTER E WITH DIAERESIS
+       314   204   CC     Ì     LATIN CAPITAL LETTER I WITH GRAVE
+       315   205   CD     Í     LATIN CAPITAL LETTER I WITH ACUTE
+       316   206   CE     Î     LATIN CAPITAL LETTER I WITH CIRCUMFLEX
+       317   207   CF     Ï     LATIN CAPITAL LETTER I WITH DIAERESIS
+       320   208   D0     Ð     LATIN CAPITAL LETTER ETH
+       321   209   D1     Ñ     LATIN CAPITAL LETTER N WITH TILDE
+       322   210   D2     Ò     LATIN CAPITAL LETTER O WITH GRAVE
+       323   211   D3     Ó     LATIN CAPITAL LETTER O WITH ACUTE
+       324   212   D4     Ô     LATIN CAPITAL LETTER O WITH CIRCUMFLEX
+       325   213   D5     Õ     LATIN CAPITAL LETTER O WITH TILDE
+       326   214   D6     Ö     LATIN CAPITAL LETTER O WITH DIAERESIS
+       327   215   D7     ×     MULTIPLICATION SIGN
+       330   216   D8     Ø     LATIN CAPITAL LETTER O WITH STROKE
+       331   217   D9     Ù     LATIN CAPITAL LETTER U WITH GRAVE
+       332   218   DA     Ú     LATIN CAPITAL LETTER U WITH ACUTE
+       333   219   DB     Û     LATIN CAPITAL LETTER U WITH CIRCUMFLEX
+       334   220   DC     Ü     LATIN CAPITAL LETTER U WITH DIAERESIS
+       335   221   DD     Ý     LATIN CAPITAL LETTER Y WITH ACUTE
+       336   222   DE     Þ     LATIN CAPITAL LETTER THORN
+       337   223   DF     ß     LATIN SMALL LETTER SHARP S
+       340   224   E0     à     LATIN SMALL LETTER A WITH GRAVE
+       341   225   E1     á     LATIN SMALL LETTER A WITH ACUTE
+       342   226   E2     â     LATIN SMALL LETTER A WITH CIRCUMFLEX
+       343   227   E3     ã     LATIN SMALL LETTER A WITH TILDE
+       344   228   E4     ä     LATIN SMALL LETTER A WITH DIAERESIS
+       345   229   E5     å     LATIN SMALL LETTER A WITH RING ABOVE
+       346   230   E6     æ     LATIN SMALL LETTER AE
+       347   231   E7     ç     LATIN SMALL LETTER C WITH CEDILLA
+       350   232   E8     è     LATIN SMALL LETTER E WITH GRAVE
+       351   233   E9     é     LATIN SMALL LETTER E WITH ACUTE
+       352   234   EA     ê     LATIN SMALL LETTER E WITH CIRCUMFLEX
+       353   235   EB     ë     LATIN SMALL LETTER E WITH DIAERESIS
+       354   236   EC     ì     LATIN SMALL LETTER I WITH GRAVE
+       355   237   ED     í     LATIN SMALL LETTER I WITH ACUTE
+       356   238   EE     î     LATIN SMALL LETTER I WITH CIRCUMFLEX
+       357   239   EF     ï     LATIN SMALL LETTER I WITH DIAERESIS
+       360   240   F0     ð     LATIN SMALL LETTER ETH
+       361   241   F1     ñ     LATIN SMALL LETTER N WITH TILDE
+       362   242   F2     ò     LATIN SMALL LETTER O WITH GRAVE
+       363   243   F3     ó     LATIN SMALL LETTER O WITH ACUTE
+       364   244   F4     ô     LATIN SMALL LETTER O WITH CIRCUMFLEX
+       365   245   F5     õ     LATIN SMALL LETTER O WITH TILDE
+       366   246   F6     ö     LATIN SMALL LETTER O WITH DIAERESIS
+       367   247   F7     ÷     DIVISION SIGN
+       370   248   F8     ø     LATIN SMALL LETTER O WITH STROKE
+       371   249   F9     ù     LATIN SMALL LETTER U WITH GRAVE
+       372   250   FA     ú     LATIN SMALL LETTER U WITH ACUTE
+       373   251   FB     û     LATIN SMALL LETTER U WITH CIRCUMFLEX
+       374   252   FC     ü     LATIN SMALL LETTER U WITH DIAERESIS
+       375   253   FD     ý     LATIN SMALL LETTER Y WITH ACUTE
+       376   254   FE     þ     LATIN SMALL LETTER THORN
+       377   255   FF     ÿ     LATIN SMALL LETTER Y WITH DIAERESIS
+
+</tst>
diff --git a/result/noent/isolat3 b/result/noent/isolat3
new file mode 100644
index 0000000..9d5bb5b
--- /dev/null
+++ b/result/noent/isolat3
@@ -0,0 +1,10 @@
+<?xml version="1.0" encoding="ISO-8859-1"?>
+<rec>
+<eg><![CDATA[<!ENTITY % pub    "&#xc9;ditions Gallimard" >
+<!ENTITY   rights "All rights reserved" >
+<!ENTITY   book   "La Peste: Albert Camus, 
+&#xA9; 1947 %pub;. &rights;" >]]></eg>
+then the replacement text for the entity &quot;<code>book</code>&quot; is:
+<eg>La Peste: Albert Camus, 
+© 1947 Éditions Gallimard. &amp;rights;</eg>
+</rec>
diff --git a/result/noent/title.xml b/result/noent/title.xml
new file mode 100644
index 0000000..35c8fc9
--- /dev/null
+++ b/result/noent/title.xml
@@ -0,0 +1,2 @@
+<?xml version="1.0"?>
+<title>my title</title>
diff --git a/result/noent/wml.xml b/result/noent/wml.xml
new file mode 100644
index 0000000..55e20ff
--- /dev/null
+++ b/result/noent/wml.xml
@@ -0,0 +1,10 @@
+<?xml version="1.0"?>
+<!DOCTYPE wml PUBLIC "-//WAPFORUM//DTD WML 1.1//EN" "http://www.wapforum.org/DTD/wml_1.1.xml">
+<wml>
+  <card id="card1" title="Rubriques 75008">
+	<p>
+		<a href="rubmenu.asp?CP=75008&amp;#38;RB=01">Cin&#xE9;ma</a><br/>
+	</p>
+
+</card>
+</wml>
diff --git a/result/title.xml b/result/title.xml
new file mode 100644
index 0000000..35c8fc9
--- /dev/null
+++ b/result/title.xml
@@ -0,0 +1,2 @@
+<?xml version="1.0"?>
+<title>my title</title>
diff --git a/result/wml.xml b/result/wml.xml
new file mode 100644
index 0000000..8215ab0
--- /dev/null
+++ b/result/wml.xml
@@ -0,0 +1,10 @@
+<?xml version="1.0"?>
+<!DOCTYPE wml PUBLIC "-//WAPFORUM//DTD WML 1.1//EN" "http://www.wapforum.org/DTD/wml_1.1.xml">
+<wml>
+  <card id="card1" title="Rubriques 75008">
+	<p>
+		<a href="rubmenu.asp?CP=75008&#38;RB=01">Cin&#xE9;ma</a><br/>
+	</p>
+
+</card>
+</wml>
diff --git a/test/HTML/autoclose.html b/test/HTML/autoclose.html
new file mode 100644
index 0000000..e123ba7
--- /dev/null
+++ b/test/HTML/autoclose.html
@@ -0,0 +1 @@
+<hr>
diff --git a/test/HTML/autoclose2.html b/test/HTML/autoclose2.html
new file mode 100644
index 0000000..d40082c
--- /dev/null
+++ b/test/HTML/autoclose2.html
@@ -0,0 +1 @@
+<p>toto
diff --git a/test/HTML/autoclose3.html b/test/HTML/autoclose3.html
new file mode 100644
index 0000000..8c7a45a
--- /dev/null
+++ b/test/HTML/autoclose3.html
@@ -0,0 +1,3 @@
+<ul>
+<li>item 1
+<li>item 2
diff --git a/test/VC/NS1 b/test/VC/NS1
new file mode 100644
index 0000000..2f74463
--- /dev/null
+++ b/test/VC/NS1
@@ -0,0 +1,13 @@
+<!DOCTYPE ns:doc [
+<!ELEMENT ns:doc (#PCDATA | ns:a | ns:b)*>
+<!ATTLIST ns:doc
+          ns:attr  CDATA #REQUIRED
+          xmlns:ns CDATA #IMPLIED>
+<!ELEMENT ns:a EMPTY>
+<!ELEMENT ns:b (#PCDATA)>
+]>
+<ns:doc ns:attr="val" xmlns:ns="http://www.example.org/test/">
+   <ns:a/>
+   <ns:b>first line</ns:b>
+   <ns:b>second line</ns:b>
+</ns:doc>
diff --git a/test/VC/NS2 b/test/VC/NS2
new file mode 100644
index 0000000..d748d1a
--- /dev/null
+++ b/test/VC/NS2
@@ -0,0 +1,13 @@
+<!DOCTYPE doc [
+<!ELEMENT doc (#PCDATA | ns:a | ns:b)*>
+<!ATTLIST doc
+          attr  CDATA #REQUIRED
+          xmlns:ns CDATA #IMPLIED>
+<!ELEMENT a EMPTY>
+<!ELEMENT b (#PCDATA)>
+]>
+<ns:doc ns:attr="val" xmlns:ns="http://www.example.org/test/">
+   <ns:a/>
+   <ns:b>first line</ns:b>
+   <ns:b>second line</ns:b>
+</ns:doc>
diff --git a/test/dtd13 b/test/dtd13
new file mode 100644
index 0000000..d18d00c
--- /dev/null
+++ b/test/dtd13
@@ -0,0 +1,6 @@
+<!-- comment before the DTD -->
+<!DOCTYPE doc [
+<!ELEMENT doc ANY>
+]>
+<!-- comment after the DTD -->
+<doc/>
diff --git a/test/isolat1 b/test/isolat1
new file mode 100644
index 0000000..1e5a059
--- /dev/null
+++ b/test/isolat1
@@ -0,0 +1,2 @@
+<?xml version="1.0" encoding="ISO-8859-1"?>
+<très>là</très>
diff --git a/test/isolat2 b/test/isolat2
new file mode 100644
index 0000000..8c290b9
--- /dev/null
+++ b/test/isolat2
@@ -0,0 +1,107 @@
+<?xml version="1.0" encoding="ISO-8859-1"?>
+<tst>
+
+       The following table displays the characters  in  ISO  8859
+       Latin-1,  which are printable and unlisted in the ascii
+       manual page.
+
+       Oct   Dec   Hex   Char   Description
+       --------------------------------------------------------------------
+       240   160   A0           NO-BREAK SPACE
+       241   161   A1     ¡     INVERTED EXCLAMATION MARK
+       242   162   A2     ¢     CENT SIGN
+       243   163   A3     £     POUND SIGN
+       244   164   A4     ¤     CURRENCY SIGN
+       245   165   A5     ¥     YEN SIGN
+       246   166   A6     ¦     BROKEN BAR
+       247   167   A7     §     SECTION SIGN
+       250   168   A8     ¨     DIAERESIS
+       251   169   A9     ©     COPYRIGHT SIGN
+       252   170   AA     ª     FEMININE ORDINAL INDICATOR
+       253   171   AB     «     LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
+       254   172   AC     ¬     NOT SIGN
+       255   173   AD     ­     SOFT HYPHEN
+       256   174   AE     ®     REGISTERED SIGN
+       257   175   AF     ¯     MACRON
+       260   176   B0     °     DEGREE SIGN
+       261   177   B1     ±     PLUS-MINUS SIGN
+       262   178   B2     ²     SUPERSCRIPT TWO
+       263   179   B3     ³     SUPERSCRIPT THREE
+       264   180   B4     ´     ACUTE ACCENT
+       265   181   B5     µ     MICRO SIGN
+       266   182   B6     ¶     PILCROW SIGN
+       267   183   B7     ·     MIDDLE DOT
+       270   184   B8     ¸     CEDILLA
+       271   185   B9     ¹     SUPERSCRIPT ONE
+       272   186   BA     º     MASCULINE ORDINAL INDICATOR
+       273   187   BB     »     RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
+       274   188   BC     ¼     VULGAR FRACTION ONE QUARTER
+       275   189   BD     ½     VULGAR FRACTION ONE HALF
+       276   190   BE     ¾     VULGAR FRACTION THREE QUARTERS
+       277   191   BF     ¿     INVERTED QUESTION MARK
+       300   192   C0     À     LATIN CAPITAL LETTER A WITH GRAVE
+       301   193   C1     Á     LATIN CAPITAL LETTER A WITH ACUTE
+       302   194   C2     Â     LATIN CAPITAL LETTER A WITH CIRCUMFLEX
+       303   195   C3     Ã     LATIN CAPITAL LETTER A WITH TILDE
+       304   196   C4     Ä     LATIN CAPITAL LETTER A WITH DIAERESIS
+       305   197   C5     Å     LATIN CAPITAL LETTER A WITH RING ABOVE
+       306   198   C6     Æ     LATIN CAPITAL LETTER AE
+       307   199   C7     Ç     LATIN CAPITAL LETTER C WITH CEDILLA
+       310   200   C8     È     LATIN CAPITAL LETTER E WITH GRAVE
+       311   201   C9     É     LATIN CAPITAL LETTER E WITH ACUTE
+       312   202   CA     Ê     LATIN CAPITAL LETTER E WITH CIRCUMFLEX
+       313   203   CB     Ë     LATIN CAPITAL LETTER E WITH DIAERESIS
+       314   204   CC     Ì     LATIN CAPITAL LETTER I WITH GRAVE
+       315   205   CD     Í     LATIN CAPITAL LETTER I WITH ACUTE
+       316   206   CE     Î     LATIN CAPITAL LETTER I WITH CIRCUMFLEX
+       317   207   CF     Ï     LATIN CAPITAL LETTER I WITH DIAERESIS
+       320   208   D0     Ð     LATIN CAPITAL LETTER ETH
+       321   209   D1     Ñ     LATIN CAPITAL LETTER N WITH TILDE
+       322   210   D2     Ò     LATIN CAPITAL LETTER O WITH GRAVE
+       323   211   D3     Ó     LATIN CAPITAL LETTER O WITH ACUTE
+       324   212   D4     Ô     LATIN CAPITAL LETTER O WITH CIRCUMFLEX
+       325   213   D5     Õ     LATIN CAPITAL LETTER O WITH TILDE
+       326   214   D6     Ö     LATIN CAPITAL LETTER O WITH DIAERESIS
+       327   215   D7     ×     MULTIPLICATION SIGN
+       330   216   D8     Ø     LATIN CAPITAL LETTER O WITH STROKE
+       331   217   D9     Ù     LATIN CAPITAL LETTER U WITH GRAVE
+       332   218   DA     Ú     LATIN CAPITAL LETTER U WITH ACUTE
+       333   219   DB     Û     LATIN CAPITAL LETTER U WITH CIRCUMFLEX
+       334   220   DC     Ü     LATIN CAPITAL LETTER U WITH DIAERESIS
+       335   221   DD     Ý     LATIN CAPITAL LETTER Y WITH ACUTE
+       336   222   DE     Þ     LATIN CAPITAL LETTER THORN
+       337   223   DF     ß     LATIN SMALL LETTER SHARP S
+       340   224   E0     à     LATIN SMALL LETTER A WITH GRAVE
+       341   225   E1     á     LATIN SMALL LETTER A WITH ACUTE
+       342   226   E2     â     LATIN SMALL LETTER A WITH CIRCUMFLEX
+       343   227   E3     ã     LATIN SMALL LETTER A WITH TILDE
+       344   228   E4     ä     LATIN SMALL LETTER A WITH DIAERESIS
+       345   229   E5     å     LATIN SMALL LETTER A WITH RING ABOVE
+       346   230   E6     æ     LATIN SMALL LETTER AE
+       347   231   E7     ç     LATIN SMALL LETTER C WITH CEDILLA
+       350   232   E8     è     LATIN SMALL LETTER E WITH GRAVE
+       351   233   E9     é     LATIN SMALL LETTER E WITH ACUTE
+       352   234   EA     ê     LATIN SMALL LETTER E WITH CIRCUMFLEX
+       353   235   EB     ë     LATIN SMALL LETTER E WITH DIAERESIS
+       354   236   EC     ì     LATIN SMALL LETTER I WITH GRAVE
+       355   237   ED     í     LATIN SMALL LETTER I WITH ACUTE
+       356   238   EE     î     LATIN SMALL LETTER I WITH CIRCUMFLEX
+       357   239   EF     ï     LATIN SMALL LETTER I WITH DIAERESIS
+       360   240   F0     ð     LATIN SMALL LETTER ETH
+       361   241   F1     ñ     LATIN SMALL LETTER N WITH TILDE
+       362   242   F2     ò     LATIN SMALL LETTER O WITH GRAVE
+       363   243   F3     ó     LATIN SMALL LETTER O WITH ACUTE
+       364   244   F4     ô     LATIN SMALL LETTER O WITH CIRCUMFLEX
+       365   245   F5     õ     LATIN SMALL LETTER O WITH TILDE
+       366   246   F6     ö     LATIN SMALL LETTER O WITH DIAERESIS
+       367   247   F7     ÷     DIVISION SIGN
+       370   248   F8     ø     LATIN SMALL LETTER O WITH STROKE
+       371   249   F9     ù     LATIN SMALL LETTER U WITH GRAVE
+       372   250   FA     ú     LATIN SMALL LETTER U WITH ACUTE
+       373   251   FB     û     LATIN SMALL LETTER U WITH CIRCUMFLEX
+       374   252   FC     ü     LATIN SMALL LETTER U WITH DIAERESIS
+       375   253   FD     ý     LATIN SMALL LETTER Y WITH ACUTE
+       376   254   FE     þ     LATIN SMALL LETTER THORN
+       377   255   FF     ÿ     LATIN SMALL LETTER Y WITH DIAERESIS
+
+</tst>
diff --git a/test/isolat3 b/test/isolat3
new file mode 100644
index 0000000..40fb3a0
--- /dev/null
+++ b/test/isolat3
@@ -0,0 +1,10 @@
+<?xml version='1.0' encoding='ISO-8859-1'?>
+<rec>
+<eg><![CDATA[<!ENTITY % pub    "&#xc9;ditions Gallimard" >
+<!ENTITY   rights "All rights reserved" >
+<!ENTITY   book   "La Peste: Albert Camus, 
+&#xA9; 1947 %pub;. &rights;" >]]></eg>
+then the replacement text for the entity "<code>book</code>" is:
+<eg>La Peste: Albert Camus, 
+&#169; 1947 &#201;ditions Gallimard. &amp;rights;</eg>
+</rec>
diff --git a/test/title.xml b/test/title.xml
new file mode 100644
index 0000000..d064d66
--- /dev/null
+++ b/test/title.xml
@@ -0,0 +1 @@
+<title>my title</title>
diff --git a/test/wml.xml b/test/wml.xml
new file mode 100644
index 0000000..1cfecc7
--- /dev/null
+++ b/test/wml.xml
@@ -0,0 +1,11 @@
+<?xml version="1.0" ?>
+<!DOCTYPE wml PUBLIC "-//WAPFORUM//DTD WML 1.1//EN" "http://www.wapforum.org/DTD/wml_1.1.xml">
+<wml>
+  <card id="card1" title="Rubriques 75008">
+	<p>
+		<a href="rubmenu.asp?CP=75008&#38;RB=01">Cin&#233;ma</a><br/>
+	</p>
+
+</card>
+</wml>
+