blob: 218d5199fbbd887c6660ec2a5f90d1ecbe8b024c [file] [log] [blame]
Antoine Pitroud72402e2010-10-27 18:52:48 +00001# regression test for SAX 2.0
Lars Gustäbel96753b32000-09-24 12:24:24 +00002# $Id$
3
Thomas Wouters0e3f5912006-08-11 14:57:12 +00004from xml.sax import make_parser, ContentHandler, \
5 SAXException, SAXReaderNotAvailable, SAXParseException
Martin v. Löwis962c9e72000-10-06 17:41:52 +00006try:
7 make_parser()
Martin v. Löwis80670bc2000-10-06 21:13:23 +00008except SAXReaderNotAvailable:
Martin v. Löwis962c9e72000-10-06 17:41:52 +00009 # don't try to test this module if we cannot create a parser
10 raise ImportError("no XML parsers available")
Thomas Wouters0e3f5912006-08-11 14:57:12 +000011from xml.sax.saxutils import XMLGenerator, escape, unescape, quoteattr, \
12 XMLFilterBase
13from xml.sax.expatreader import create_parser
Antoine Pitrou6b03ee62010-10-27 18:33:30 +000014from xml.sax.handler import feature_namespaces
Thomas Wouters0e3f5912006-08-11 14:57:12 +000015from xml.sax.xmlreader import InputSource, AttributesImpl, AttributesNSImpl
Serhiy Storchaka88efc522013-02-10 14:29:52 +020016from io import BytesIO, StringIO
Serhiy Storchaka1a4ed4c2013-02-02 12:17:05 +020017import os.path
Serhiy Storchakad5202392013-02-02 10:31:17 +020018import shutil
19from test import support
Benjamin Petersonee8712c2008-05-20 21:35:26 +000020from test.support import findfile, run_unittest
Guido van Rossumd8faa362007-04-27 19:54:29 +000021import unittest
Florent Xiclunaf15351d2010-03-13 23:24:31 +000022
23TEST_XMLFILE = findfile("test.xml", subdir="xmltestdata")
24TEST_XMLFILE_OUT = findfile("test.xml.out", subdir="xmltestdata")
Victor Stinner6c6f8512010-08-07 10:09:35 +000025try:
26 TEST_XMLFILE.encode("utf8")
27 TEST_XMLFILE_OUT.encode("utf8")
28except UnicodeEncodeError:
29 raise unittest.SkipTest("filename is not encodable to utf8")
Lars Gustäbel96753b32000-09-24 12:24:24 +000030
Serhiy Storchaka1a4ed4c2013-02-02 12:17:05 +020031supports_nonascii_filenames = True
32if not os.path.supports_unicode_filenames:
33 try:
34 support.TESTFN_UNICODE.encode(support.TESTFN_ENCODING)
35 except (UnicodeError, TypeError):
36 # Either the file system encoding is None, or the file name
37 # cannot be encoded in the file system encoding.
38 supports_nonascii_filenames = False
39requires_nonascii_filenames = unittest.skipUnless(
40 supports_nonascii_filenames,
41 'Requires non-ascii filenames support')
42
Guido van Rossumd8faa362007-04-27 19:54:29 +000043ns_uri = "http://www.python.org/xml-ns/saxtest/"
Lars Gustäbel96753b32000-09-24 12:24:24 +000044
Guido van Rossumd8faa362007-04-27 19:54:29 +000045class XmlTestBase(unittest.TestCase):
46 def verify_empty_attrs(self, attrs):
47 self.assertRaises(KeyError, attrs.getValue, "attr")
48 self.assertRaises(KeyError, attrs.getValueByQName, "attr")
49 self.assertRaises(KeyError, attrs.getNameByQName, "attr")
50 self.assertRaises(KeyError, attrs.getQNameByName, "attr")
51 self.assertRaises(KeyError, attrs.__getitem__, "attr")
Ezio Melottib3aedd42010-11-20 19:04:17 +000052 self.assertEqual(attrs.getLength(), 0)
53 self.assertEqual(attrs.getNames(), [])
54 self.assertEqual(attrs.getQNames(), [])
55 self.assertEqual(len(attrs), 0)
Ezio Melottib58e0bd2010-01-23 15:40:09 +000056 self.assertNotIn("attr", attrs)
Ezio Melottib3aedd42010-11-20 19:04:17 +000057 self.assertEqual(list(attrs.keys()), [])
58 self.assertEqual(attrs.get("attrs"), None)
59 self.assertEqual(attrs.get("attrs", 25), 25)
60 self.assertEqual(list(attrs.items()), [])
61 self.assertEqual(list(attrs.values()), [])
Lars Gustäbel96753b32000-09-24 12:24:24 +000062
Guido van Rossumd8faa362007-04-27 19:54:29 +000063 def verify_empty_nsattrs(self, attrs):
64 self.assertRaises(KeyError, attrs.getValue, (ns_uri, "attr"))
65 self.assertRaises(KeyError, attrs.getValueByQName, "ns:attr")
66 self.assertRaises(KeyError, attrs.getNameByQName, "ns:attr")
67 self.assertRaises(KeyError, attrs.getQNameByName, (ns_uri, "attr"))
68 self.assertRaises(KeyError, attrs.__getitem__, (ns_uri, "attr"))
Ezio Melottib3aedd42010-11-20 19:04:17 +000069 self.assertEqual(attrs.getLength(), 0)
70 self.assertEqual(attrs.getNames(), [])
71 self.assertEqual(attrs.getQNames(), [])
72 self.assertEqual(len(attrs), 0)
Ezio Melottib58e0bd2010-01-23 15:40:09 +000073 self.assertNotIn((ns_uri, "attr"), attrs)
Ezio Melottib3aedd42010-11-20 19:04:17 +000074 self.assertEqual(list(attrs.keys()), [])
75 self.assertEqual(attrs.get((ns_uri, "attr")), None)
76 self.assertEqual(attrs.get((ns_uri, "attr"), 25), 25)
77 self.assertEqual(list(attrs.items()), [])
78 self.assertEqual(list(attrs.values()), [])
Lars Gustäbel96753b32000-09-24 12:24:24 +000079
Guido van Rossumd8faa362007-04-27 19:54:29 +000080 def verify_attrs_wattr(self, attrs):
Ezio Melottib3aedd42010-11-20 19:04:17 +000081 self.assertEqual(attrs.getLength(), 1)
82 self.assertEqual(attrs.getNames(), ["attr"])
83 self.assertEqual(attrs.getQNames(), ["attr"])
84 self.assertEqual(len(attrs), 1)
Benjamin Peterson577473f2010-01-19 00:09:57 +000085 self.assertIn("attr", attrs)
Ezio Melottib3aedd42010-11-20 19:04:17 +000086 self.assertEqual(list(attrs.keys()), ["attr"])
87 self.assertEqual(attrs.get("attr"), "val")
88 self.assertEqual(attrs.get("attr", 25), "val")
89 self.assertEqual(list(attrs.items()), [("attr", "val")])
90 self.assertEqual(list(attrs.values()), ["val"])
91 self.assertEqual(attrs.getValue("attr"), "val")
92 self.assertEqual(attrs.getValueByQName("attr"), "val")
93 self.assertEqual(attrs.getNameByQName("attr"), "attr")
94 self.assertEqual(attrs["attr"], "val")
95 self.assertEqual(attrs.getQNameByName("attr"), "attr")
Lars Gustäbel96753b32000-09-24 12:24:24 +000096
Guido van Rossumd8faa362007-04-27 19:54:29 +000097class MakeParserTest(unittest.TestCase):
98 def test_make_parser2(self):
Lars Gustäbel2fc52942000-10-24 15:35:07 +000099 # Creating parsers several times in a row should succeed.
100 # Testing this because there have been failures of this kind
101 # before.
Thomas Wouters0e3f5912006-08-11 14:57:12 +0000102 from xml.sax import make_parser
Lars Gustäbel2fc52942000-10-24 15:35:07 +0000103 p = make_parser()
Thomas Wouters0e3f5912006-08-11 14:57:12 +0000104 from xml.sax import make_parser
Lars Gustäbel2fc52942000-10-24 15:35:07 +0000105 p = make_parser()
Thomas Wouters0e3f5912006-08-11 14:57:12 +0000106 from xml.sax import make_parser
Lars Gustäbel2fc52942000-10-24 15:35:07 +0000107 p = make_parser()
Thomas Wouters0e3f5912006-08-11 14:57:12 +0000108 from xml.sax import make_parser
Lars Gustäbel2fc52942000-10-24 15:35:07 +0000109 p = make_parser()
Thomas Wouters0e3f5912006-08-11 14:57:12 +0000110 from xml.sax import make_parser
Lars Gustäbel2fc52942000-10-24 15:35:07 +0000111 p = make_parser()
Thomas Wouters0e3f5912006-08-11 14:57:12 +0000112 from xml.sax import make_parser
Lars Gustäbel2fc52942000-10-24 15:35:07 +0000113 p = make_parser()
Tim Petersd2bf3b72001-01-18 02:22:22 +0000114
115
Lars Gustäbel96753b32000-09-24 12:24:24 +0000116# ===========================================================================
117#
118# saxutils tests
119#
120# ===========================================================================
121
Guido van Rossumd8faa362007-04-27 19:54:29 +0000122class SaxutilsTest(unittest.TestCase):
123 # ===== escape
124 def test_escape_basic(self):
Ezio Melottib3aedd42010-11-20 19:04:17 +0000125 self.assertEqual(escape("Donald Duck & Co"), "Donald Duck & Co")
Lars Gustäbel96753b32000-09-24 12:24:24 +0000126
Guido van Rossumd8faa362007-04-27 19:54:29 +0000127 def test_escape_all(self):
Ezio Melottib3aedd42010-11-20 19:04:17 +0000128 self.assertEqual(escape("<Donald Duck & Co>"),
129 "&lt;Donald Duck &amp; Co&gt;")
Lars Gustäbel96753b32000-09-24 12:24:24 +0000130
Guido van Rossumd8faa362007-04-27 19:54:29 +0000131 def test_escape_extra(self):
Ezio Melottib3aedd42010-11-20 19:04:17 +0000132 self.assertEqual(escape("Hei på deg", {"å" : "&aring;"}),
133 "Hei p&aring; deg")
Lars Gustäbel96753b32000-09-24 12:24:24 +0000134
Guido van Rossumd8faa362007-04-27 19:54:29 +0000135 # ===== unescape
136 def test_unescape_basic(self):
Ezio Melottib3aedd42010-11-20 19:04:17 +0000137 self.assertEqual(unescape("Donald Duck &amp; Co"), "Donald Duck & Co")
Lars Gustäbel96753b32000-09-24 12:24:24 +0000138
Guido van Rossumd8faa362007-04-27 19:54:29 +0000139 def test_unescape_all(self):
Ezio Melottib3aedd42010-11-20 19:04:17 +0000140 self.assertEqual(unescape("&lt;Donald Duck &amp; Co&gt;"),
141 "<Donald Duck & Co>")
Martin v. Löwis74b51ac2002-10-26 14:50:45 +0000142
Guido van Rossumd8faa362007-04-27 19:54:29 +0000143 def test_unescape_extra(self):
Ezio Melottib3aedd42010-11-20 19:04:17 +0000144 self.assertEqual(unescape("Hei på deg", {"å" : "&aring;"}),
145 "Hei p&aring; deg")
Martin v. Löwis74b51ac2002-10-26 14:50:45 +0000146
Guido van Rossumd8faa362007-04-27 19:54:29 +0000147 def test_unescape_amp_extra(self):
Ezio Melottib3aedd42010-11-20 19:04:17 +0000148 self.assertEqual(unescape("&amp;foo;", {"&foo;": "splat"}), "&foo;")
Martin v. Löwis74b51ac2002-10-26 14:50:45 +0000149
Guido van Rossumd8faa362007-04-27 19:54:29 +0000150 # ===== quoteattr
151 def test_quoteattr_basic(self):
Ezio Melottib3aedd42010-11-20 19:04:17 +0000152 self.assertEqual(quoteattr("Donald Duck & Co"),
153 '"Donald Duck &amp; Co"')
Martin v. Löwis74b51ac2002-10-26 14:50:45 +0000154
Guido van Rossumd8faa362007-04-27 19:54:29 +0000155 def test_single_quoteattr(self):
Ezio Melottib3aedd42010-11-20 19:04:17 +0000156 self.assertEqual(quoteattr('Includes "double" quotes'),
157 '\'Includes "double" quotes\'')
Fred Drake32f3add2002-10-28 17:58:48 +0000158
Guido van Rossumd8faa362007-04-27 19:54:29 +0000159 def test_double_quoteattr(self):
Ezio Melottib3aedd42010-11-20 19:04:17 +0000160 self.assertEqual(quoteattr("Includes 'single' quotes"),
161 "\"Includes 'single' quotes\"")
Fred Drakeacd32d32001-07-19 16:10:15 +0000162
Guido van Rossumd8faa362007-04-27 19:54:29 +0000163 def test_single_double_quoteattr(self):
Ezio Melottib3aedd42010-11-20 19:04:17 +0000164 self.assertEqual(quoteattr("Includes 'single' and \"double\" quotes"),
165 "\"Includes 'single' and &quot;double&quot; quotes\"")
Fred Drakeacd32d32001-07-19 16:10:15 +0000166
Guido van Rossumd8faa362007-04-27 19:54:29 +0000167 # ===== make_parser
168 def test_make_parser(self):
Martin v. Löwis962c9e72000-10-06 17:41:52 +0000169 # Creating a parser should succeed - it should fall back
170 # to the expatreader
Thomas Wouters0e3f5912006-08-11 14:57:12 +0000171 p = make_parser(['xml.parsers.no_such_parser'])
Martin v. Löwis962c9e72000-10-06 17:41:52 +0000172
173
Lars Gustäbel96753b32000-09-24 12:24:24 +0000174# ===== XMLGenerator
175
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200176class XmlgenTest:
Guido van Rossumd8faa362007-04-27 19:54:29 +0000177 def test_xmlgen_basic(self):
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200178 result = self.ioclass()
Guido van Rossumd8faa362007-04-27 19:54:29 +0000179 gen = XMLGenerator(result)
180 gen.startDocument()
181 gen.startElement("doc", {})
182 gen.endElement("doc")
183 gen.endDocument()
Lars Gustäbel96753b32000-09-24 12:24:24 +0000184
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200185 self.assertEqual(result.getvalue(), self.xml("<doc></doc>"))
Lars Gustäbel96753b32000-09-24 12:24:24 +0000186
R. David Murraya90032a2010-10-17 22:46:45 +0000187 def test_xmlgen_basic_empty(self):
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200188 result = self.ioclass()
R. David Murraya90032a2010-10-17 22:46:45 +0000189 gen = XMLGenerator(result, short_empty_elements=True)
190 gen.startDocument()
191 gen.startElement("doc", {})
192 gen.endElement("doc")
193 gen.endDocument()
194
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200195 self.assertEqual(result.getvalue(), self.xml("<doc/>"))
R. David Murraya90032a2010-10-17 22:46:45 +0000196
Guido van Rossumd8faa362007-04-27 19:54:29 +0000197 def test_xmlgen_content(self):
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200198 result = self.ioclass()
Guido van Rossumd8faa362007-04-27 19:54:29 +0000199 gen = XMLGenerator(result)
Fred Drake004d5e62000-10-23 17:22:08 +0000200
Guido van Rossumd8faa362007-04-27 19:54:29 +0000201 gen.startDocument()
202 gen.startElement("doc", {})
203 gen.characters("huhei")
204 gen.endElement("doc")
205 gen.endDocument()
Lars Gustäbel96753b32000-09-24 12:24:24 +0000206
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200207 self.assertEqual(result.getvalue(), self.xml("<doc>huhei</doc>"))
Lars Gustäbel96753b32000-09-24 12:24:24 +0000208
R. David Murraya90032a2010-10-17 22:46:45 +0000209 def test_xmlgen_content_empty(self):
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200210 result = self.ioclass()
R. David Murraya90032a2010-10-17 22:46:45 +0000211 gen = XMLGenerator(result, short_empty_elements=True)
212
213 gen.startDocument()
214 gen.startElement("doc", {})
215 gen.characters("huhei")
216 gen.endElement("doc")
217 gen.endDocument()
218
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200219 self.assertEqual(result.getvalue(), self.xml("<doc>huhei</doc>"))
R. David Murraya90032a2010-10-17 22:46:45 +0000220
Guido van Rossumd8faa362007-04-27 19:54:29 +0000221 def test_xmlgen_pi(self):
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200222 result = self.ioclass()
Guido van Rossumd8faa362007-04-27 19:54:29 +0000223 gen = XMLGenerator(result)
Fred Drake004d5e62000-10-23 17:22:08 +0000224
Guido van Rossumd8faa362007-04-27 19:54:29 +0000225 gen.startDocument()
226 gen.processingInstruction("test", "data")
227 gen.startElement("doc", {})
228 gen.endElement("doc")
229 gen.endDocument()
Lars Gustäbel96753b32000-09-24 12:24:24 +0000230
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200231 self.assertEqual(result.getvalue(),
232 self.xml("<?test data?><doc></doc>"))
Lars Gustäbel96753b32000-09-24 12:24:24 +0000233
Guido van Rossumd8faa362007-04-27 19:54:29 +0000234 def test_xmlgen_content_escape(self):
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200235 result = self.ioclass()
Guido van Rossumd8faa362007-04-27 19:54:29 +0000236 gen = XMLGenerator(result)
Fred Drake004d5e62000-10-23 17:22:08 +0000237
Guido van Rossumd8faa362007-04-27 19:54:29 +0000238 gen.startDocument()
239 gen.startElement("doc", {})
240 gen.characters("<huhei&")
241 gen.endElement("doc")
242 gen.endDocument()
Lars Gustäbel96753b32000-09-24 12:24:24 +0000243
Ezio Melottib3aedd42010-11-20 19:04:17 +0000244 self.assertEqual(result.getvalue(),
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200245 self.xml("<doc>&lt;huhei&amp;</doc>"))
Lars Gustäbel96753b32000-09-24 12:24:24 +0000246
Guido van Rossumd8faa362007-04-27 19:54:29 +0000247 def test_xmlgen_attr_escape(self):
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200248 result = self.ioclass()
Guido van Rossumd8faa362007-04-27 19:54:29 +0000249 gen = XMLGenerator(result)
Fred Drakec9fadf92001-08-07 19:17:06 +0000250
Guido van Rossumd8faa362007-04-27 19:54:29 +0000251 gen.startDocument()
252 gen.startElement("doc", {"a": '"'})
253 gen.startElement("e", {"a": "'"})
254 gen.endElement("e")
255 gen.startElement("e", {"a": "'\""})
256 gen.endElement("e")
257 gen.startElement("e", {"a": "\n\r\t"})
258 gen.endElement("e")
259 gen.endElement("doc")
260 gen.endDocument()
Fred Drakec9fadf92001-08-07 19:17:06 +0000261
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200262 self.assertEqual(result.getvalue(), self.xml(
263 "<doc a='\"'><e a=\"'\"></e>"
264 "<e a=\"'&quot;\"></e>"
265 "<e a=\"&#10;&#13;&#9;\"></e></doc>"))
266
267 def test_xmlgen_encoding(self):
268 encodings = ('iso-8859-15', 'utf-8', 'utf-8-sig',
269 'utf-16', 'utf-16be', 'utf-16le',
270 'utf-32', 'utf-32be', 'utf-32le')
271 for encoding in encodings:
272 result = self.ioclass()
273 gen = XMLGenerator(result, encoding=encoding)
274
275 gen.startDocument()
276 gen.startElement("doc", {"a": '\u20ac'})
277 gen.characters("\u20ac")
278 gen.endElement("doc")
279 gen.endDocument()
280
281 self.assertEqual(result.getvalue(),
282 self.xml('<doc a="\u20ac">\u20ac</doc>', encoding=encoding))
283
284 def test_xmlgen_unencodable(self):
285 result = self.ioclass()
286 gen = XMLGenerator(result, encoding='ascii')
287
288 gen.startDocument()
289 gen.startElement("doc", {"a": '\u20ac'})
290 gen.characters("\u20ac")
291 gen.endElement("doc")
292 gen.endDocument()
293
294 self.assertEqual(result.getvalue(),
295 self.xml('<doc a="&#8364;">&#8364;</doc>', encoding='ascii'))
Fred Drakec9fadf92001-08-07 19:17:06 +0000296
Guido van Rossumd8faa362007-04-27 19:54:29 +0000297 def test_xmlgen_ignorable(self):
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200298 result = self.ioclass()
Guido van Rossumd8faa362007-04-27 19:54:29 +0000299 gen = XMLGenerator(result)
Fred Drake004d5e62000-10-23 17:22:08 +0000300
Guido van Rossumd8faa362007-04-27 19:54:29 +0000301 gen.startDocument()
302 gen.startElement("doc", {})
303 gen.ignorableWhitespace(" ")
304 gen.endElement("doc")
305 gen.endDocument()
Lars Gustäbel96753b32000-09-24 12:24:24 +0000306
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200307 self.assertEqual(result.getvalue(), self.xml("<doc> </doc>"))
Lars Gustäbel96753b32000-09-24 12:24:24 +0000308
R. David Murraya90032a2010-10-17 22:46:45 +0000309 def test_xmlgen_ignorable_empty(self):
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200310 result = self.ioclass()
R. David Murraya90032a2010-10-17 22:46:45 +0000311 gen = XMLGenerator(result, short_empty_elements=True)
312
313 gen.startDocument()
314 gen.startElement("doc", {})
315 gen.ignorableWhitespace(" ")
316 gen.endElement("doc")
317 gen.endDocument()
318
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200319 self.assertEqual(result.getvalue(), self.xml("<doc> </doc>"))
R. David Murraya90032a2010-10-17 22:46:45 +0000320
Guido van Rossumd8faa362007-04-27 19:54:29 +0000321 def test_xmlgen_ns(self):
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200322 result = self.ioclass()
Guido van Rossumd8faa362007-04-27 19:54:29 +0000323 gen = XMLGenerator(result)
Lars Gustäbel96753b32000-09-24 12:24:24 +0000324
Guido van Rossumd8faa362007-04-27 19:54:29 +0000325 gen.startDocument()
326 gen.startPrefixMapping("ns1", ns_uri)
327 gen.startElementNS((ns_uri, "doc"), "ns1:doc", {})
328 # add an unqualified name
329 gen.startElementNS((None, "udoc"), None, {})
330 gen.endElementNS((None, "udoc"), None)
331 gen.endElementNS((ns_uri, "doc"), "ns1:doc")
332 gen.endPrefixMapping("ns1")
333 gen.endDocument()
Fred Drake004d5e62000-10-23 17:22:08 +0000334
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200335 self.assertEqual(result.getvalue(), self.xml(
336 '<ns1:doc xmlns:ns1="%s"><udoc></udoc></ns1:doc>' %
Guido van Rossumd8faa362007-04-27 19:54:29 +0000337 ns_uri))
Lars Gustäbel96753b32000-09-24 12:24:24 +0000338
R. David Murraya90032a2010-10-17 22:46:45 +0000339 def test_xmlgen_ns_empty(self):
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200340 result = self.ioclass()
R. David Murraya90032a2010-10-17 22:46:45 +0000341 gen = XMLGenerator(result, short_empty_elements=True)
342
343 gen.startDocument()
344 gen.startPrefixMapping("ns1", ns_uri)
345 gen.startElementNS((ns_uri, "doc"), "ns1:doc", {})
346 # add an unqualified name
347 gen.startElementNS((None, "udoc"), None, {})
348 gen.endElementNS((None, "udoc"), None)
349 gen.endElementNS((ns_uri, "doc"), "ns1:doc")
350 gen.endPrefixMapping("ns1")
351 gen.endDocument()
352
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200353 self.assertEqual(result.getvalue(), self.xml(
354 '<ns1:doc xmlns:ns1="%s"><udoc/></ns1:doc>' %
R. David Murraya90032a2010-10-17 22:46:45 +0000355 ns_uri))
356
Guido van Rossumd8faa362007-04-27 19:54:29 +0000357 def test_1463026_1(self):
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200358 result = self.ioclass()
Guido van Rossumd8faa362007-04-27 19:54:29 +0000359 gen = XMLGenerator(result)
Thomas Wouterscf297e42007-02-23 15:07:44 +0000360
Guido van Rossumd8faa362007-04-27 19:54:29 +0000361 gen.startDocument()
362 gen.startElementNS((None, 'a'), 'a', {(None, 'b'):'c'})
363 gen.endElementNS((None, 'a'), 'a')
364 gen.endDocument()
Thomas Wouterscf297e42007-02-23 15:07:44 +0000365
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200366 self.assertEqual(result.getvalue(), self.xml('<a b="c"></a>'))
Thomas Wouterscf297e42007-02-23 15:07:44 +0000367
R. David Murraya90032a2010-10-17 22:46:45 +0000368 def test_1463026_1_empty(self):
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200369 result = self.ioclass()
R. David Murraya90032a2010-10-17 22:46:45 +0000370 gen = XMLGenerator(result, short_empty_elements=True)
371
372 gen.startDocument()
373 gen.startElementNS((None, 'a'), 'a', {(None, 'b'):'c'})
374 gen.endElementNS((None, 'a'), 'a')
375 gen.endDocument()
376
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200377 self.assertEqual(result.getvalue(), self.xml('<a b="c"/>'))
R. David Murraya90032a2010-10-17 22:46:45 +0000378
Guido van Rossumd8faa362007-04-27 19:54:29 +0000379 def test_1463026_2(self):
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200380 result = self.ioclass()
Guido van Rossumd8faa362007-04-27 19:54:29 +0000381 gen = XMLGenerator(result)
Thomas Wouterscf297e42007-02-23 15:07:44 +0000382
Guido van Rossumd8faa362007-04-27 19:54:29 +0000383 gen.startDocument()
384 gen.startPrefixMapping(None, 'qux')
385 gen.startElementNS(('qux', 'a'), 'a', {})
386 gen.endElementNS(('qux', 'a'), 'a')
387 gen.endPrefixMapping(None)
388 gen.endDocument()
Thomas Wouterscf297e42007-02-23 15:07:44 +0000389
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200390 self.assertEqual(result.getvalue(), self.xml('<a xmlns="qux"></a>'))
Thomas Wouterscf297e42007-02-23 15:07:44 +0000391
R. David Murraya90032a2010-10-17 22:46:45 +0000392 def test_1463026_2_empty(self):
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200393 result = self.ioclass()
R. David Murraya90032a2010-10-17 22:46:45 +0000394 gen = XMLGenerator(result, short_empty_elements=True)
395
396 gen.startDocument()
397 gen.startPrefixMapping(None, 'qux')
398 gen.startElementNS(('qux', 'a'), 'a', {})
399 gen.endElementNS(('qux', 'a'), 'a')
400 gen.endPrefixMapping(None)
401 gen.endDocument()
402
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200403 self.assertEqual(result.getvalue(), self.xml('<a xmlns="qux"/>'))
R. David Murraya90032a2010-10-17 22:46:45 +0000404
Guido van Rossumd8faa362007-04-27 19:54:29 +0000405 def test_1463026_3(self):
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200406 result = self.ioclass()
Guido van Rossumd8faa362007-04-27 19:54:29 +0000407 gen = XMLGenerator(result)
Thomas Wouterscf297e42007-02-23 15:07:44 +0000408
Guido van Rossumd8faa362007-04-27 19:54:29 +0000409 gen.startDocument()
410 gen.startPrefixMapping('my', 'qux')
411 gen.startElementNS(('qux', 'a'), 'a', {(None, 'b'):'c'})
412 gen.endElementNS(('qux', 'a'), 'a')
413 gen.endPrefixMapping('my')
414 gen.endDocument()
Thomas Wouterscf297e42007-02-23 15:07:44 +0000415
Ezio Melottib3aedd42010-11-20 19:04:17 +0000416 self.assertEqual(result.getvalue(),
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200417 self.xml('<my:a xmlns:my="qux" b="c"></my:a>'))
Lars Gustäbel96753b32000-09-24 12:24:24 +0000418
R. David Murraya90032a2010-10-17 22:46:45 +0000419 def test_1463026_3_empty(self):
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200420 result = self.ioclass()
R. David Murraya90032a2010-10-17 22:46:45 +0000421 gen = XMLGenerator(result, short_empty_elements=True)
422
423 gen.startDocument()
424 gen.startPrefixMapping('my', 'qux')
425 gen.startElementNS(('qux', 'a'), 'a', {(None, 'b'):'c'})
426 gen.endElementNS(('qux', 'a'), 'a')
427 gen.endPrefixMapping('my')
428 gen.endDocument()
429
Ezio Melottib3aedd42010-11-20 19:04:17 +0000430 self.assertEqual(result.getvalue(),
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200431 self.xml('<my:a xmlns:my="qux" b="c"/>'))
R. David Murraya90032a2010-10-17 22:46:45 +0000432
Antoine Pitrou6b03ee62010-10-27 18:33:30 +0000433 def test_5027_1(self):
434 # The xml prefix (as in xml:lang below) is reserved and bound by
435 # definition to http://www.w3.org/XML/1998/namespace. XMLGenerator had
Andrew Svetlov737fb892012-12-18 21:14:22 +0200436 # a bug whereby a KeyError is raised because this namespace is missing
Antoine Pitrou6b03ee62010-10-27 18:33:30 +0000437 # from a dictionary.
438 #
439 # This test demonstrates the bug by parsing a document.
440 test_xml = StringIO(
441 '<?xml version="1.0"?>'
442 '<a:g1 xmlns:a="http://example.com/ns">'
443 '<a:g2 xml:lang="en">Hello</a:g2>'
444 '</a:g1>')
445
446 parser = make_parser()
447 parser.setFeature(feature_namespaces, True)
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200448 result = self.ioclass()
Antoine Pitrou6b03ee62010-10-27 18:33:30 +0000449 gen = XMLGenerator(result)
450 parser.setContentHandler(gen)
451 parser.parse(test_xml)
452
Ezio Melottib3aedd42010-11-20 19:04:17 +0000453 self.assertEqual(result.getvalue(),
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200454 self.xml(
Ezio Melottib3aedd42010-11-20 19:04:17 +0000455 '<a:g1 xmlns:a="http://example.com/ns">'
456 '<a:g2 xml:lang="en">Hello</a:g2>'
457 '</a:g1>'))
Antoine Pitrou6b03ee62010-10-27 18:33:30 +0000458
459 def test_5027_2(self):
460 # The xml prefix (as in xml:lang below) is reserved and bound by
461 # definition to http://www.w3.org/XML/1998/namespace. XMLGenerator had
Andrew Svetlov737fb892012-12-18 21:14:22 +0200462 # a bug whereby a KeyError is raised because this namespace is missing
Antoine Pitrou6b03ee62010-10-27 18:33:30 +0000463 # from a dictionary.
464 #
465 # This test demonstrates the bug by direct manipulation of the
466 # XMLGenerator.
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200467 result = self.ioclass()
Antoine Pitrou6b03ee62010-10-27 18:33:30 +0000468 gen = XMLGenerator(result)
469
470 gen.startDocument()
471 gen.startPrefixMapping('a', 'http://example.com/ns')
472 gen.startElementNS(('http://example.com/ns', 'g1'), 'g1', {})
473 lang_attr = {('http://www.w3.org/XML/1998/namespace', 'lang'): 'en'}
474 gen.startElementNS(('http://example.com/ns', 'g2'), 'g2', lang_attr)
475 gen.characters('Hello')
476 gen.endElementNS(('http://example.com/ns', 'g2'), 'g2')
477 gen.endElementNS(('http://example.com/ns', 'g1'), 'g1')
478 gen.endPrefixMapping('a')
479 gen.endDocument()
480
Ezio Melottib3aedd42010-11-20 19:04:17 +0000481 self.assertEqual(result.getvalue(),
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200482 self.xml(
Ezio Melottib3aedd42010-11-20 19:04:17 +0000483 '<a:g1 xmlns:a="http://example.com/ns">'
484 '<a:g2 xml:lang="en">Hello</a:g2>'
485 '</a:g1>'))
Antoine Pitrou6b03ee62010-10-27 18:33:30 +0000486
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200487 def test_no_close_file(self):
488 result = self.ioclass()
489 def func(out):
490 gen = XMLGenerator(out)
491 gen.startDocument()
492 gen.startElement("doc", {})
493 func(result)
494 self.assertFalse(result.closed)
495
496class StringXmlgenTest(XmlgenTest, unittest.TestCase):
497 ioclass = StringIO
498
499 def xml(self, doc, encoding='iso-8859-1'):
500 return '<?xml version="1.0" encoding="%s"?>\n%s' % (encoding, doc)
501
502 test_xmlgen_unencodable = None
503
504class BytesXmlgenTest(XmlgenTest, unittest.TestCase):
505 ioclass = BytesIO
506
507 def xml(self, doc, encoding='iso-8859-1'):
508 return ('<?xml version="1.0" encoding="%s"?>\n%s' %
509 (encoding, doc)).encode(encoding, 'xmlcharrefreplace')
510
511class WriterXmlgenTest(BytesXmlgenTest):
512 class ioclass(list):
513 write = list.append
514 closed = False
515
516 def seekable(self):
517 return True
518
519 def tell(self):
520 # return 0 at start and not 0 after start
521 return len(self)
522
523 def getvalue(self):
524 return b''.join(self)
525
526
527start = b'<?xml version="1.0" encoding="iso-8859-1"?>\n'
528
Fred Drake004d5e62000-10-23 17:22:08 +0000529
Guido van Rossumd8faa362007-04-27 19:54:29 +0000530class XMLFilterBaseTest(unittest.TestCase):
531 def test_filter_basic(self):
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200532 result = BytesIO()
Guido van Rossumd8faa362007-04-27 19:54:29 +0000533 gen = XMLGenerator(result)
534 filter = XMLFilterBase()
535 filter.setContentHandler(gen)
Lars Gustäbel96753b32000-09-24 12:24:24 +0000536
Guido van Rossumd8faa362007-04-27 19:54:29 +0000537 filter.startDocument()
538 filter.startElement("doc", {})
539 filter.characters("content")
540 filter.ignorableWhitespace(" ")
541 filter.endElement("doc")
542 filter.endDocument()
543
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200544 self.assertEqual(result.getvalue(), start + b"<doc>content </doc>")
Lars Gustäbel96753b32000-09-24 12:24:24 +0000545
546# ===========================================================================
547#
548# expatreader tests
549#
550# ===========================================================================
551
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200552with open(TEST_XMLFILE_OUT, 'rb') as f:
Benjamin Petersond5df36d2010-10-31 18:23:23 +0000553 xml_test_out = f.read()
Lars Gustäbelb7536d52000-09-24 18:53:56 +0000554
Guido van Rossumd8faa362007-04-27 19:54:29 +0000555class ExpatReaderTest(XmlTestBase):
Lars Gustäbelb7536d52000-09-24 18:53:56 +0000556
Guido van Rossumd8faa362007-04-27 19:54:29 +0000557 # ===== XMLReader support
Lars Gustäbelb7536d52000-09-24 18:53:56 +0000558
Guido van Rossumd8faa362007-04-27 19:54:29 +0000559 def test_expat_file(self):
560 parser = create_parser()
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200561 result = BytesIO()
Guido van Rossumd8faa362007-04-27 19:54:29 +0000562 xmlgen = XMLGenerator(result)
Lars Gustäbelb7536d52000-09-24 18:53:56 +0000563
Guido van Rossumd8faa362007-04-27 19:54:29 +0000564 parser.setContentHandler(xmlgen)
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200565 with open(TEST_XMLFILE, 'rb') as f:
Benjamin Petersond5df36d2010-10-31 18:23:23 +0000566 parser.parse(f)
Lars Gustäbelb7536d52000-09-24 18:53:56 +0000567
Ezio Melottib3aedd42010-11-20 19:04:17 +0000568 self.assertEqual(result.getvalue(), xml_test_out)
Lars Gustäbelb7536d52000-09-24 18:53:56 +0000569
Serhiy Storchaka1a4ed4c2013-02-02 12:17:05 +0200570 @requires_nonascii_filenames
Serhiy Storchakad5202392013-02-02 10:31:17 +0200571 def test_expat_file_nonascii(self):
572 fname = support.TESTFN_UNICODE
573 shutil.copyfile(TEST_XMLFILE, fname)
574 self.addCleanup(support.unlink, fname)
575
576 parser = create_parser()
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200577 result = BytesIO()
Serhiy Storchakad5202392013-02-02 10:31:17 +0200578 xmlgen = XMLGenerator(result)
579
580 parser.setContentHandler(xmlgen)
581 parser.parse(open(fname))
582
583 self.assertEqual(result.getvalue(), xml_test_out)
584
Guido van Rossumd8faa362007-04-27 19:54:29 +0000585 # ===== DTDHandler support
Lars Gustäbelb7536d52000-09-24 18:53:56 +0000586
Guido van Rossumd8faa362007-04-27 19:54:29 +0000587 class TestDTDHandler:
Lars Gustäbelb7536d52000-09-24 18:53:56 +0000588
Guido van Rossumd8faa362007-04-27 19:54:29 +0000589 def __init__(self):
590 self._notations = []
591 self._entities = []
Lars Gustäbelb7536d52000-09-24 18:53:56 +0000592
Guido van Rossumd8faa362007-04-27 19:54:29 +0000593 def notationDecl(self, name, publicId, systemId):
594 self._notations.append((name, publicId, systemId))
Lars Gustäbelb7536d52000-09-24 18:53:56 +0000595
Guido van Rossumd8faa362007-04-27 19:54:29 +0000596 def unparsedEntityDecl(self, name, publicId, systemId, ndata):
597 self._entities.append((name, publicId, systemId, ndata))
Lars Gustäbel2fc52942000-10-24 15:35:07 +0000598
Guido van Rossumd8faa362007-04-27 19:54:29 +0000599 def test_expat_dtdhandler(self):
600 parser = create_parser()
601 handler = self.TestDTDHandler()
602 parser.setDTDHandler(handler)
Lars Gustäbel2fc52942000-10-24 15:35:07 +0000603
Guido van Rossumd8faa362007-04-27 19:54:29 +0000604 parser.feed('<!DOCTYPE doc [\n')
605 parser.feed(' <!ENTITY img SYSTEM "expat.gif" NDATA GIF>\n')
606 parser.feed(' <!NOTATION GIF PUBLIC "-//CompuServe//NOTATION Graphics Interchange Format 89a//EN">\n')
607 parser.feed(']>\n')
608 parser.feed('<doc></doc>')
609 parser.close()
Lars Gustäbel2fc52942000-10-24 15:35:07 +0000610
Ezio Melottib3aedd42010-11-20 19:04:17 +0000611 self.assertEqual(handler._notations,
Guido van Rossumd8faa362007-04-27 19:54:29 +0000612 [("GIF", "-//CompuServe//NOTATION Graphics Interchange Format 89a//EN", None)])
Ezio Melottib3aedd42010-11-20 19:04:17 +0000613 self.assertEqual(handler._entities, [("img", None, "expat.gif", "GIF")])
Lars Gustäbel2fc52942000-10-24 15:35:07 +0000614
Guido van Rossumd8faa362007-04-27 19:54:29 +0000615 # ===== EntityResolver support
Lars Gustäbel2fc52942000-10-24 15:35:07 +0000616
Guido van Rossumd8faa362007-04-27 19:54:29 +0000617 class TestEntityResolver:
Lars Gustäbel2fc52942000-10-24 15:35:07 +0000618
Guido van Rossumd8faa362007-04-27 19:54:29 +0000619 def resolveEntity(self, publicId, systemId):
620 inpsrc = InputSource()
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200621 inpsrc.setByteStream(BytesIO(b"<entity/>"))
Guido van Rossumd8faa362007-04-27 19:54:29 +0000622 return inpsrc
Lars Gustäbel2fc52942000-10-24 15:35:07 +0000623
Guido van Rossumd8faa362007-04-27 19:54:29 +0000624 def test_expat_entityresolver(self):
625 parser = create_parser()
626 parser.setEntityResolver(self.TestEntityResolver())
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200627 result = BytesIO()
Guido van Rossumd8faa362007-04-27 19:54:29 +0000628 parser.setContentHandler(XMLGenerator(result))
Lars Gustäbel2fc52942000-10-24 15:35:07 +0000629
Guido van Rossumd8faa362007-04-27 19:54:29 +0000630 parser.feed('<!DOCTYPE doc [\n')
631 parser.feed(' <!ENTITY test SYSTEM "whatever">\n')
632 parser.feed(']>\n')
633 parser.feed('<doc>&test;</doc>')
634 parser.close()
Lars Gustäbel2fc52942000-10-24 15:35:07 +0000635
Ezio Melottib3aedd42010-11-20 19:04:17 +0000636 self.assertEqual(result.getvalue(), start +
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200637 b"<doc><entity></entity></doc>")
Lars Gustäbel2fc52942000-10-24 15:35:07 +0000638
Guido van Rossumd8faa362007-04-27 19:54:29 +0000639 # ===== Attributes support
Lars Gustäbel2fc52942000-10-24 15:35:07 +0000640
Guido van Rossumd8faa362007-04-27 19:54:29 +0000641 class AttrGatherer(ContentHandler):
Lars Gustäbel2fc52942000-10-24 15:35:07 +0000642
Guido van Rossumd8faa362007-04-27 19:54:29 +0000643 def startElement(self, name, attrs):
644 self._attrs = attrs
Lars Gustäbel2fc52942000-10-24 15:35:07 +0000645
Guido van Rossumd8faa362007-04-27 19:54:29 +0000646 def startElementNS(self, name, qname, attrs):
647 self._attrs = attrs
Lars Gustäbel2fc52942000-10-24 15:35:07 +0000648
Guido van Rossumd8faa362007-04-27 19:54:29 +0000649 def test_expat_attrs_empty(self):
650 parser = create_parser()
651 gather = self.AttrGatherer()
652 parser.setContentHandler(gather)
653
654 parser.feed("<doc/>")
655 parser.close()
656
657 self.verify_empty_attrs(gather._attrs)
658
659 def test_expat_attrs_wattr(self):
660 parser = create_parser()
661 gather = self.AttrGatherer()
662 parser.setContentHandler(gather)
663
664 parser.feed("<doc attr='val'/>")
665 parser.close()
666
667 self.verify_attrs_wattr(gather._attrs)
668
669 def test_expat_nsattrs_empty(self):
670 parser = create_parser(1)
671 gather = self.AttrGatherer()
672 parser.setContentHandler(gather)
673
674 parser.feed("<doc/>")
675 parser.close()
676
677 self.verify_empty_nsattrs(gather._attrs)
678
679 def test_expat_nsattrs_wattr(self):
680 parser = create_parser(1)
681 gather = self.AttrGatherer()
682 parser.setContentHandler(gather)
683
684 parser.feed("<doc xmlns:ns='%s' ns:attr='val'/>" % ns_uri)
685 parser.close()
686
687 attrs = gather._attrs
688
Ezio Melottib3aedd42010-11-20 19:04:17 +0000689 self.assertEqual(attrs.getLength(), 1)
690 self.assertEqual(attrs.getNames(), [(ns_uri, "attr")])
Guido van Rossumd8faa362007-04-27 19:54:29 +0000691 self.assertTrue((attrs.getQNames() == [] or
692 attrs.getQNames() == ["ns:attr"]))
Ezio Melottib3aedd42010-11-20 19:04:17 +0000693 self.assertEqual(len(attrs), 1)
Benjamin Peterson577473f2010-01-19 00:09:57 +0000694 self.assertIn((ns_uri, "attr"), attrs)
Ezio Melottib3aedd42010-11-20 19:04:17 +0000695 self.assertEqual(attrs.get((ns_uri, "attr")), "val")
696 self.assertEqual(attrs.get((ns_uri, "attr"), 25), "val")
697 self.assertEqual(list(attrs.items()), [((ns_uri, "attr"), "val")])
698 self.assertEqual(list(attrs.values()), ["val"])
699 self.assertEqual(attrs.getValue((ns_uri, "attr")), "val")
700 self.assertEqual(attrs[(ns_uri, "attr")], "val")
Guido van Rossumd8faa362007-04-27 19:54:29 +0000701
702 # ===== InputSource support
703
Benjamin Petersona7f4f5a2008-09-04 02:22:52 +0000704 def test_expat_inpsource_filename(self):
Guido van Rossumd8faa362007-04-27 19:54:29 +0000705 parser = create_parser()
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200706 result = BytesIO()
Guido van Rossumd8faa362007-04-27 19:54:29 +0000707 xmlgen = XMLGenerator(result)
708
709 parser.setContentHandler(xmlgen)
Florent Xiclunaf15351d2010-03-13 23:24:31 +0000710 parser.parse(TEST_XMLFILE)
Guido van Rossumd8faa362007-04-27 19:54:29 +0000711
Ezio Melottib3aedd42010-11-20 19:04:17 +0000712 self.assertEqual(result.getvalue(), xml_test_out)
Guido van Rossumd8faa362007-04-27 19:54:29 +0000713
Benjamin Petersona7f4f5a2008-09-04 02:22:52 +0000714 def test_expat_inpsource_sysid(self):
Guido van Rossumd8faa362007-04-27 19:54:29 +0000715 parser = create_parser()
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200716 result = BytesIO()
Guido van Rossumd8faa362007-04-27 19:54:29 +0000717 xmlgen = XMLGenerator(result)
718
719 parser.setContentHandler(xmlgen)
Florent Xiclunaf15351d2010-03-13 23:24:31 +0000720 parser.parse(InputSource(TEST_XMLFILE))
Guido van Rossumd8faa362007-04-27 19:54:29 +0000721
Ezio Melottib3aedd42010-11-20 19:04:17 +0000722 self.assertEqual(result.getvalue(), xml_test_out)
Guido van Rossumd8faa362007-04-27 19:54:29 +0000723
Serhiy Storchaka1a4ed4c2013-02-02 12:17:05 +0200724 @requires_nonascii_filenames
Serhiy Storchakad5202392013-02-02 10:31:17 +0200725 def test_expat_inpsource_sysid_nonascii(self):
726 fname = support.TESTFN_UNICODE
727 shutil.copyfile(TEST_XMLFILE, fname)
728 self.addCleanup(support.unlink, fname)
729
730 parser = create_parser()
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200731 result = BytesIO()
Serhiy Storchakad5202392013-02-02 10:31:17 +0200732 xmlgen = XMLGenerator(result)
733
734 parser.setContentHandler(xmlgen)
735 parser.parse(InputSource(fname))
736
737 self.assertEqual(result.getvalue(), xml_test_out)
738
Guido van Rossumd8faa362007-04-27 19:54:29 +0000739 def test_expat_inpsource_stream(self):
740 parser = create_parser()
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200741 result = BytesIO()
Guido van Rossumd8faa362007-04-27 19:54:29 +0000742 xmlgen = XMLGenerator(result)
743
744 parser.setContentHandler(xmlgen)
745 inpsrc = InputSource()
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200746 with open(TEST_XMLFILE, 'rb') as f:
Benjamin Petersond5df36d2010-10-31 18:23:23 +0000747 inpsrc.setByteStream(f)
748 parser.parse(inpsrc)
Guido van Rossumd8faa362007-04-27 19:54:29 +0000749
Ezio Melottib3aedd42010-11-20 19:04:17 +0000750 self.assertEqual(result.getvalue(), xml_test_out)
Guido van Rossumd8faa362007-04-27 19:54:29 +0000751
752 # ===== IncrementalParser support
753
754 def test_expat_incremental(self):
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200755 result = BytesIO()
Guido van Rossumd8faa362007-04-27 19:54:29 +0000756 xmlgen = XMLGenerator(result)
757 parser = create_parser()
758 parser.setContentHandler(xmlgen)
759
760 parser.feed("<doc>")
761 parser.feed("</doc>")
762 parser.close()
763
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200764 self.assertEqual(result.getvalue(), start + b"<doc></doc>")
Guido van Rossumd8faa362007-04-27 19:54:29 +0000765
766 def test_expat_incremental_reset(self):
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200767 result = BytesIO()
Guido van Rossumd8faa362007-04-27 19:54:29 +0000768 xmlgen = XMLGenerator(result)
769 parser = create_parser()
770 parser.setContentHandler(xmlgen)
771
772 parser.feed("<doc>")
773 parser.feed("text")
774
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200775 result = BytesIO()
Guido van Rossumd8faa362007-04-27 19:54:29 +0000776 xmlgen = XMLGenerator(result)
777 parser.setContentHandler(xmlgen)
778 parser.reset()
779
780 parser.feed("<doc>")
781 parser.feed("text")
782 parser.feed("</doc>")
783 parser.close()
784
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200785 self.assertEqual(result.getvalue(), start + b"<doc>text</doc>")
Guido van Rossumd8faa362007-04-27 19:54:29 +0000786
787 # ===== Locator support
788
789 def test_expat_locator_noinfo(self):
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200790 result = BytesIO()
Guido van Rossumd8faa362007-04-27 19:54:29 +0000791 xmlgen = XMLGenerator(result)
792 parser = create_parser()
793 parser.setContentHandler(xmlgen)
794
795 parser.feed("<doc>")
796 parser.feed("</doc>")
797 parser.close()
798
Ezio Melottib3aedd42010-11-20 19:04:17 +0000799 self.assertEqual(parser.getSystemId(), None)
800 self.assertEqual(parser.getPublicId(), None)
801 self.assertEqual(parser.getLineNumber(), 1)
Guido van Rossumd8faa362007-04-27 19:54:29 +0000802
Benjamin Petersona7f4f5a2008-09-04 02:22:52 +0000803 def test_expat_locator_withinfo(self):
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200804 result = BytesIO()
Guido van Rossumd8faa362007-04-27 19:54:29 +0000805 xmlgen = XMLGenerator(result)
806 parser = create_parser()
807 parser.setContentHandler(xmlgen)
Florent Xiclunaf15351d2010-03-13 23:24:31 +0000808 parser.parse(TEST_XMLFILE)
Guido van Rossumd8faa362007-04-27 19:54:29 +0000809
Ezio Melottib3aedd42010-11-20 19:04:17 +0000810 self.assertEqual(parser.getSystemId(), TEST_XMLFILE)
811 self.assertEqual(parser.getPublicId(), None)
Lars Gustäbel2fc52942000-10-24 15:35:07 +0000812
Serhiy Storchaka1a4ed4c2013-02-02 12:17:05 +0200813 @requires_nonascii_filenames
Serhiy Storchakad5202392013-02-02 10:31:17 +0200814 def test_expat_locator_withinfo_nonascii(self):
815 fname = support.TESTFN_UNICODE
816 shutil.copyfile(TEST_XMLFILE, fname)
817 self.addCleanup(support.unlink, fname)
818
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200819 result = BytesIO()
Serhiy Storchakad5202392013-02-02 10:31:17 +0200820 xmlgen = XMLGenerator(result)
821 parser = create_parser()
822 parser.setContentHandler(xmlgen)
823 parser.parse(fname)
824
825 self.assertEqual(parser.getSystemId(), fname)
826 self.assertEqual(parser.getPublicId(), None)
827
Martin v. Löwis80670bc2000-10-06 21:13:23 +0000828
829# ===========================================================================
830#
831# error reporting
832#
833# ===========================================================================
834
Guido van Rossumd8faa362007-04-27 19:54:29 +0000835class ErrorReportingTest(unittest.TestCase):
836 def test_expat_inpsource_location(self):
837 parser = create_parser()
838 parser.setContentHandler(ContentHandler()) # do nothing
839 source = InputSource()
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200840 source.setByteStream(BytesIO(b"<foo bar foobar>")) #ill-formed
Guido van Rossumd8faa362007-04-27 19:54:29 +0000841 name = "a file name"
842 source.setSystemId(name)
843 try:
844 parser.parse(source)
845 self.fail()
846 except SAXException as e:
Ezio Melottib3aedd42010-11-20 19:04:17 +0000847 self.assertEqual(e.getSystemId(), name)
Martin v. Löwis80670bc2000-10-06 21:13:23 +0000848
Guido van Rossumd8faa362007-04-27 19:54:29 +0000849 def test_expat_incomplete(self):
850 parser = create_parser()
851 parser.setContentHandler(ContentHandler()) # do nothing
852 self.assertRaises(SAXParseException, parser.parse, StringIO("<foo>"))
Martin v. Löwis80670bc2000-10-06 21:13:23 +0000853
Guido van Rossumd8faa362007-04-27 19:54:29 +0000854 def test_sax_parse_exception_str(self):
855 # pass various values from a locator to the SAXParseException to
856 # make sure that the __str__() doesn't fall apart when None is
857 # passed instead of an integer line and column number
858 #
859 # use "normal" values for the locator:
860 str(SAXParseException("message", None,
861 self.DummyLocator(1, 1)))
862 # use None for the line number:
863 str(SAXParseException("message", None,
864 self.DummyLocator(None, 1)))
865 # use None for the column number:
866 str(SAXParseException("message", None,
867 self.DummyLocator(1, None)))
868 # use None for both:
869 str(SAXParseException("message", None,
870 self.DummyLocator(None, None)))
Fred Drake6fd0b0d2004-03-20 08:15:30 +0000871
Guido van Rossumd8faa362007-04-27 19:54:29 +0000872 class DummyLocator:
873 def __init__(self, lineno, colno):
874 self._lineno = lineno
875 self._colno = colno
Fred Drake6fd0b0d2004-03-20 08:15:30 +0000876
Guido van Rossumd8faa362007-04-27 19:54:29 +0000877 def getPublicId(self):
878 return "pubid"
Fred Drake6fd0b0d2004-03-20 08:15:30 +0000879
Guido van Rossumd8faa362007-04-27 19:54:29 +0000880 def getSystemId(self):
881 return "sysid"
Fred Drake6fd0b0d2004-03-20 08:15:30 +0000882
Guido van Rossumd8faa362007-04-27 19:54:29 +0000883 def getLineNumber(self):
884 return self._lineno
Fred Drake6fd0b0d2004-03-20 08:15:30 +0000885
Guido van Rossumd8faa362007-04-27 19:54:29 +0000886 def getColumnNumber(self):
887 return self._colno
Martin v. Löwis80670bc2000-10-06 21:13:23 +0000888
Lars Gustäbelab647872000-09-24 18:40:52 +0000889# ===========================================================================
890#
891# xmlreader tests
892#
893# ===========================================================================
894
Guido van Rossumd8faa362007-04-27 19:54:29 +0000895class XmlReaderTest(XmlTestBase):
Lars Gustäbelab647872000-09-24 18:40:52 +0000896
Guido van Rossumd8faa362007-04-27 19:54:29 +0000897 # ===== AttributesImpl
898 def test_attrs_empty(self):
899 self.verify_empty_attrs(AttributesImpl({}))
Lars Gustäbelab647872000-09-24 18:40:52 +0000900
Guido van Rossumd8faa362007-04-27 19:54:29 +0000901 def test_attrs_wattr(self):
902 self.verify_attrs_wattr(AttributesImpl({"attr" : "val"}))
Lars Gustäbelab647872000-09-24 18:40:52 +0000903
Guido van Rossumd8faa362007-04-27 19:54:29 +0000904 def test_nsattrs_empty(self):
905 self.verify_empty_nsattrs(AttributesNSImpl({}, {}))
Lars Gustäbelab647872000-09-24 18:40:52 +0000906
Guido van Rossumd8faa362007-04-27 19:54:29 +0000907 def test_nsattrs_wattr(self):
908 attrs = AttributesNSImpl({(ns_uri, "attr") : "val"},
909 {(ns_uri, "attr") : "ns:attr"})
Fred Drake004d5e62000-10-23 17:22:08 +0000910
Ezio Melottib3aedd42010-11-20 19:04:17 +0000911 self.assertEqual(attrs.getLength(), 1)
912 self.assertEqual(attrs.getNames(), [(ns_uri, "attr")])
913 self.assertEqual(attrs.getQNames(), ["ns:attr"])
914 self.assertEqual(len(attrs), 1)
Benjamin Peterson577473f2010-01-19 00:09:57 +0000915 self.assertIn((ns_uri, "attr"), attrs)
Ezio Melottib3aedd42010-11-20 19:04:17 +0000916 self.assertEqual(list(attrs.keys()), [(ns_uri, "attr")])
917 self.assertEqual(attrs.get((ns_uri, "attr")), "val")
918 self.assertEqual(attrs.get((ns_uri, "attr"), 25), "val")
919 self.assertEqual(list(attrs.items()), [((ns_uri, "attr"), "val")])
920 self.assertEqual(list(attrs.values()), ["val"])
921 self.assertEqual(attrs.getValue((ns_uri, "attr")), "val")
922 self.assertEqual(attrs.getValueByQName("ns:attr"), "val")
923 self.assertEqual(attrs.getNameByQName("ns:attr"), (ns_uri, "attr"))
924 self.assertEqual(attrs[(ns_uri, "attr")], "val")
925 self.assertEqual(attrs.getQNameByName((ns_uri, "attr")), "ns:attr")
Fred Drake004d5e62000-10-23 17:22:08 +0000926
Lars Gustäbelab647872000-09-24 18:40:52 +0000927
Christian Heimesbbe741d2008-03-28 10:53:29 +0000928def test_main():
Guido van Rossumd8faa362007-04-27 19:54:29 +0000929 run_unittest(MakeParserTest,
930 SaxutilsTest,
Serhiy Storchaka88efc522013-02-10 14:29:52 +0200931 StringXmlgenTest,
932 BytesXmlgenTest,
933 WriterXmlgenTest,
Guido van Rossumd8faa362007-04-27 19:54:29 +0000934 ExpatReaderTest,
935 ErrorReportingTest,
936 XmlReaderTest)
Lars Gustäbelb7536d52000-09-24 18:53:56 +0000937
Guido van Rossumd8faa362007-04-27 19:54:29 +0000938if __name__ == "__main__":
Christian Heimesbbe741d2008-03-28 10:53:29 +0000939 test_main()