fixing bug #99190 when UTF8 document are parsed using the progressive * parserInternals.c: fixing bug #99190 when UTF8 document are parsed using the progressive parser and the end of the chunk is in the middle of an UTF8 multibyte character. Daniel

commit: d2ff0394f832b5841fd9af0813acd359b9715cc0 [log] [tgz]
author: Daniel Veillard <veillard@src.gnome.org> Fri Nov 22 12:28:38 2002 +0000
committer: Daniel Veillard <veillard@src.gnome.org> Fri Nov 22 12:28:38 2002 +0000
tree: 346d36a6c54cc3a4ebc240f328d6006f7166ca5a
parent: 8b2c7f10f16dbf1366c7beb89e8c5ab1c4062a1f [diff] [blame]
diff --git a/parserInternals.c b/parserInternals.c
index c9ea6ed..e74801f 100644
--- a/parserInternals.c
+++ b/parserInternals.c

@@ -1349,6 +1349,16 @@
     return((int) *ctxt->input->cur);
 encoding_error:
     /*
+     * An encoding problem may arise from a truncated input buffer
+     * splitting a character in the middle. In that case do not raise
+     * an error but return 0 to endicate an end of stream problem
+     */
+    if (ctxt->input->end - ctxt->input->cur < 4) {
+	*len = 0;
+	return(0);
+    }
+
+    /*
      * If we detect an UTF8 error that probably mean that the
      * input encoding didn't get properly advertised in the
      * declaration header. Report the error and switch the encoding
commit	d2ff0394f832b5841fd9af0813acd359b9715cc0	[log] [tgz]
author	Daniel Veillard <veillard@src.gnome.org>	Fri Nov 22 12:28:38 2002 +0000
committer	Daniel Veillard <veillard@src.gnome.org>	Fri Nov 22 12:28:38 2002 +0000
tree	346d36a6c54cc3a4ebc240f328d6006f7166ca5a
parent	8b2c7f10f16dbf1366c7beb89e8c5ab1c4062a1f [diff] [blame]