"""
SAX driver for the pyexpat C module. This driver works with
pyexpat.__version__ == '2.22'.
"""

version = "0.20"

from xml.sax._exceptions import *
from xml.sax.handler import feature_validation, feature_namespaces
from xml.sax.handler import feature_namespace_prefixes
from xml.sax.handler import feature_external_ges, feature_external_pes
from xml.sax.handler import feature_string_interning
from xml.sax.handler import property_xml_string, property_interning_dict

# xml.parsers.expat does not raise ImportError in Jython, so the platform
# has to be checked explicitly before attempting the import below.
import sys
if sys.platform.startswith("java"):
    raise SAXReaderNotAvailable("expat not available in Java", None)
del sys

# Report a missing or unusable expat as SAXReaderNotAvailable rather than
# letting the ImportError escape.
try:
    from xml.parsers import expat
except ImportError:
    raise SAXReaderNotAvailable("expat not supported", None)
else:
    if not hasattr(expat, "ParserCreate"):
        raise SAXReaderNotAvailable("expat not supported", None)
from xml.sax import xmlreader, saxutils, handler

# Module-level aliases used by the element event handlers.
AttributesImpl = xmlreader.AttributesImpl
AttributesNSImpl = xmlreader.AttributesNSImpl

# If we're using a sufficiently recent version of Python, we can use
# weak references to avoid cycles between the parser and content
# handler, otherwise we'll just have to pretend.
try:
    import _weakref
except ImportError:
    def _mkproxy(o):
        """Fallback when weak references are unavailable: return o itself."""
        return o
else:
    import weakref
    _mkproxy = weakref.proxy
    del weakref, _weakref

# --- ExpatLocator

class ExpatLocator(xmlreader.Locator):
    """Locator for use with the ExpatParser class.

    This uses a weak reference to the parser object to avoid creating
    a circular reference between the parser and the content handler.

    If the referenced parser object has already been collected, the
    accessors return the same "unknown" values they return when no expat
    parser is active (None, or 1 for the line number) instead of
    letting ReferenceError escape.
    """
    def __init__(self, parser):
        # `parser` is the reader object (it must expose `_parser` and
        # `_source`); only a proxy to it is stored.
        self._ref = _mkproxy(parser)

    def getColumnNumber(self):
        """Return expat's ErrorColumnNumber, or None when unavailable."""
        parser = self._ref
        try:
            if parser._parser is None:
                return None
            return parser._parser.ErrorColumnNumber
        except ReferenceError:
            # The reader behind the weak proxy no longer exists.
            return None

    def getLineNumber(self):
        """Return expat's ErrorLineNumber, or 1 when unavailable."""
        parser = self._ref
        try:
            if parser._parser is None:
                return 1
            return parser._parser.ErrorLineNumber
        except ReferenceError:
            # The reader behind the weak proxy no longer exists.
            return 1

    def getPublicId(self):
        """Return the public id of the reader's current input source."""
        parser = self._ref
        # A weak proxy is never `None`; this guard can only apply when
        # _mkproxy is the identity fallback.  A dead proxy is handled below.
        if parser is None:
            return None
        try:
            return parser._source.getPublicId()
        except ReferenceError:
            return None

    def getSystemId(self):
        """Return the system id of the reader's current input source."""
        parser = self._ref
        # See getPublicId() for why both checks are present.
        if parser is None:
            return None
        try:
            return parser._source.getSystemId()
        except ReferenceError:
            return None


# --- ExpatParser

class ExpatParser(xmlreader.IncrementalParser, xmlreader.Locator):
    """SAX driver for the pyexpat C module."""

    def __init__(self, namespaceHandling=0, bufsize=2**16-20):
        """Create a reader.

        namespaceHandling -- initial state of the namespaces feature; when
            true, reset() wires the namespace-aware element handlers.
        bufsize -- forwarded to xmlreader.IncrementalParser.__init__.
        """
        xmlreader.IncrementalParser.__init__(self, bufsize)
        self._source = xmlreader.InputSource()
        self._parser = None
        self._namespaces = namespaceHandling
        self._lex_handler_prop = None
        self._parsing = 0
        self._entity_stack = []
        # NOTE(security): external general entities are enabled by default,
        # so external_entity_ref() will resolve and parse whatever the
        # entity resolver returns.  Callers parsing untrusted XML should
        # consider setFeature(feature_external_ges, 0).
        self._external_ges = 1
        self._interning = None

    # XMLReader methods

    def parse(self, source):
        "Parse an XML document from a URL or an InputSource."
        source = saxutils.prepare_input_source(source)

        self._source = source
        self.reset()
        self._cont_handler.setDocumentLocator(ExpatLocator(self))
        xmlreader.IncrementalParser.parse(self, source)

    def prepareParser(self, source):
        """Tell expat the base (the source's system id), if there is one."""
        if source.getSystemId() is not None:
            base = source.getSystemId()
            # Unicode system ids are handed to expat as UTF-8 bytes.
            if isinstance(base, unicode):
                base = base.encode('utf-8')
            self._parser.SetBase(base)

    # Redefined setContentHandler to allow changing handlers during parsing

    def setContentHandler(self, handler):
        """Set the content handler, rebinding expat callbacks if parsing."""
        xmlreader.IncrementalParser.setContentHandler(self, handler)
        if self._parsing:
            self._reset_cont_handler()

    def getFeature(self, name):
        """Return the state of feature `name`.

        Raises SAXNotRecognizedException for unknown feature names.
        """
        if name == feature_namespaces:
            return self._namespaces
        elif name == feature_string_interning:
            return self._interning is not None
        elif name in (feature_validation, feature_external_pes,
                      feature_namespace_prefixes):
            return 0
        elif name == feature_external_ges:
            return self._external_ges
        raise SAXNotRecognizedException("Feature '%s' not recognized" % name)

    def setFeature(self, name, state):
        """Set feature `name` to `state`.

        Raises SAXNotSupportedException while parsing or when asked to
        enable a feature this driver cannot provide, and
        SAXNotRecognizedException for unknown feature names.
        """
        if self._parsing:
            raise SAXNotSupportedException("Cannot set features while parsing")

        if name == feature_namespaces:
            self._namespaces = state
        elif name == feature_external_ges:
            self._external_ges = state
        elif name == feature_string_interning:
            if state:
                # Keep an existing interning dictionary if one is set.
                if self._interning is None:
                    self._interning = {}
            else:
                self._interning = None
        elif name == feature_validation:
            if state:
                raise SAXNotSupportedException(
                    "expat does not support validation")
        elif name == feature_external_pes:
            if state:
                raise SAXNotSupportedException(
                    "expat does not read external parameter entities")
        elif name == feature_namespace_prefixes:
            if state:
                raise SAXNotSupportedException(
                    "expat does not report namespace prefixes")
        else:
            raise SAXNotRecognizedException(
                "Feature '%s' not recognized" % name)

    def getProperty(self, name):
        """Return the value of property `name`.

        Raises SAXNotSupportedException when the XML string is requested
        while no expat parser exists, and SAXNotRecognizedException for
        unknown properties or when expat lacks GetInputContext.
        """
        if name == handler.property_lexical_handler:
            return self._lex_handler_prop
        elif name == property_interning_dict:
            return self._interning
        elif name == property_xml_string:
            if self._parser:
                if hasattr(self._parser, "GetInputContext"):
                    return self._parser.GetInputContext()
                else:
                    raise SAXNotRecognizedException(
                        "This version of expat does not support getting"
                        " the XML string")
            else:
                raise SAXNotSupportedException(
                    "XML string cannot be returned when not parsing")
        raise SAXNotRecognizedException("Property '%s' not recognized" % name)

    def setProperty(self, name, value):
        """Set property `name` to `value`.

        Raises SAXNotSupportedException for the read-only XML string
        property and SAXNotRecognizedException for unknown properties.
        """
        if name == handler.property_lexical_handler:
            self._lex_handler_prop = value
            if self._parsing:
                self._reset_lex_handler_prop()
        elif name == property_interning_dict:
            self._interning = value
        elif name == property_xml_string:
            raise SAXNotSupportedException("Property '%s' cannot be set" %
                                           name)
        else:
            raise SAXNotRecognizedException("Property '%s' not recognized" %
                                            name)

    # IncrementalParser methods

    def feed(self, data, isFinal = 0):
        """Pass a chunk of data to expat, starting a document if needed.

        expat errors are wrapped in SAXParseException and handed to the
        error handler's fatalError().
        """
        if not self._parsing:
            self.reset()
            self._parsing = 1
            self._cont_handler.startDocument()

        try:
            # The isFinal parameter is internal to the expat reader.
            # If it is set to true, expat will check validity of the entire
            # document. When feeding chunks, they are not normally final -
            # except when invoked from close.
            self._parser.Parse(data, isFinal)
        except expat.error as e:
            exc = SAXParseException(expat.ErrorString(e.code), e, self)
            # FIXME: when to invoke error()?
            self._err_handler.fatalError(exc)

    def close(self):
        """Finish the document and release the expat parser."""
        if self._entity_stack or self._parser is None:
            # If we are completing an external entity, do nothing here
            return
        try:
            self.feed("", isFinal = 1)
            self._cont_handler.endDocument()
        finally:
            self._parsing = 0
            # break cycle created by expat handlers pointing to our methods
            self._parser = None

    def _reset_cont_handler(self):
        # These two expat callbacks go straight to the content handler.
        self._parser.ProcessingInstructionHandler = \
                                    self._cont_handler.processingInstruction
        self._parser.CharacterDataHandler = self._cont_handler.characters

    def _reset_lex_handler_prop(self):
        # Bind (or unbind, when no lexical handler is set) the lexical
        # callbacks on the current expat parser.
        lex = self._lex_handler_prop
        parser = self._parser
        if lex is None:
            parser.CommentHandler = None
            parser.StartCdataSectionHandler = None
            parser.EndCdataSectionHandler = None
            parser.StartDoctypeDeclHandler = None
            parser.EndDoctypeDeclHandler = None
        else:
            parser.CommentHandler = lex.comment
            parser.StartCdataSectionHandler = lex.startCDATA
            parser.EndCdataSectionHandler = lex.endCDATA
            parser.StartDoctypeDeclHandler = self.start_doctype_decl
            parser.EndDoctypeDeclHandler = lex.endDTD

    def reset(self):
        """Create a fresh expat parser and wire all callbacks to it."""
        if self._namespaces:
            self._parser = expat.ParserCreate(self._source.getEncoding(), " ",
                                              intern=self._interning)
            self._parser.namespace_prefixes = 1
            self._parser.StartElementHandler = self.start_element_ns
            self._parser.EndElementHandler = self.end_element_ns
        else:
            self._parser = expat.ParserCreate(self._source.getEncoding(),
                                              intern = self._interning)
            self._parser.StartElementHandler = self.start_element
            self._parser.EndElementHandler = self.end_element

        self._reset_cont_handler()
        self._parser.UnparsedEntityDeclHandler = self.unparsed_entity_decl
        self._parser.NotationDeclHandler = self.notation_decl
        self._parser.StartNamespaceDeclHandler = self.start_namespace_decl
        self._parser.EndNamespaceDeclHandler = self.end_namespace_decl

        self._decl_handler_prop = None
        # Identity test, matching _reset_lex_handler_prop(): a handler
        # object that happens to be falsy must still be wired up.
        if self._lex_handler_prop is not None:
            self._reset_lex_handler_prop()
#         self._parser.DefaultHandler =
#         self._parser.DefaultHandlerExpand =
#         self._parser.NotStandaloneHandler =
        self._parser.ExternalEntityRefHandler = self.external_entity_ref
        try:
            self._parser.SkippedEntityHandler = self.skipped_entity_handler
        except AttributeError:
            # This pyexpat does not support SkippedEntity
            pass
        self._parser.SetParamEntityParsing(
            expat.XML_PARAM_ENTITY_PARSING_UNLESS_STANDALONE)

        self._parsing = 0
        self._entity_stack = []

    # Locator methods

    def getColumnNumber(self):
        if self._parser is None:
            return None
        return self._parser.ErrorColumnNumber

    def getLineNumber(self):
        if self._parser is None:
            return 1
        return self._parser.ErrorLineNumber

    def getPublicId(self):
        return self._source.getPublicId()

    def getSystemId(self):
        return self._source.getSystemId()

    # event handlers
    def start_element(self, name, attrs):
        self._cont_handler.startElement(name, AttributesImpl(attrs))

    def end_element(self, name):
        self._cont_handler.endElement(name)

    def start_element_ns(self, name, attrs):
        # reset() uses " " as expat's namespace separator, so a name splits
        # into one part (local name only), two parts, or three parts.
        pair = name.split()
        if len(pair) == 1:
            # no namespace
            pair = (None, name)
        elif len(pair) == 3:
            # the third part is dropped from the reported name
            pair = pair[0], pair[1]
        else:
            # default namespace
            pair = tuple(pair)

        newattrs = {}
        qnames = {}
        for (aname, value) in attrs.items():
            parts = aname.split()
            length = len(parts)
            if length == 1:
                # no namespace
                qname = aname
                apair = (None, aname)
            elif length == 3:
                # the third part is used as the qname prefix
                qname = "%s:%s" % (parts[2], parts[1])
                apair = parts[0], parts[1]
            else:
                # default namespace
                qname = parts[1]
                apair = tuple(parts)

            newattrs[apair] = value
            qnames[apair] = qname

        # The element qname is always reported as None.
        self._cont_handler.startElementNS(pair, None,
                                          AttributesNSImpl(newattrs, qnames))

    def end_element_ns(self, name):
        # Same name decoding as in start_element_ns().
        pair = name.split()
        if len(pair) == 1:
            pair = (None, name)
        elif len(pair) == 3:
            pair = pair[0], pair[1]
        else:
            pair = tuple(pair)

        self._cont_handler.endElementNS(pair, None)

    # this is not used (call directly to ContentHandler)
    def processing_instruction(self, target, data):
        self._cont_handler.processingInstruction(target, data)

    # this is not used (call directly to ContentHandler)
    def character_data(self, data):
        self._cont_handler.characters(data)

    def start_namespace_decl(self, prefix, uri):
        self._cont_handler.startPrefixMapping(prefix, uri)

    def end_namespace_decl(self, prefix):
        self._cont_handler.endPrefixMapping(prefix)

    def start_doctype_decl(self, name, sysid, pubid, has_internal_subset):
        # Note the argument order swap: startDTD takes pubid before sysid.
        self._lex_handler_prop.startDTD(name, pubid, sysid)

    def unparsed_entity_decl(self, name, base, sysid, pubid, notation_name):
        self._dtd_handler.unparsedEntityDecl(name, pubid, sysid, notation_name)

    def notation_decl(self, name, base, sysid, pubid):
        self._dtd_handler.notationDecl(name, pubid, sysid)

    def external_entity_ref(self, context, base, sysid, pubid):
        """Resolve and parse an external entity with a sub-parser.

        Returns 1 on success (or when external general entities are
        disabled) and 0 if parsing the entity raised an exception.
        """
        if not self._external_ges:
            return 1

        source = self._ent_handler.resolveEntity(pubid, sysid)
        source = saxutils.prepare_input_source(source,
                                               self._source.getSystemId() or
                                               "")

        # Remember the current parser/source and switch to a sub-parser
        # for the duration of the entity.
        self._entity_stack.append((self._parser, self._source))
        self._parser = self._parser.ExternalEntityParserCreate(context)
        self._source = source

        try:
            xmlreader.IncrementalParser.parse(self, source)
        except Exception:
            # Only ordinary errors are turned into a failure status;
            # KeyboardInterrupt and SystemExit are left to propagate.
            # NOTE(review): on this path the saved parser/source are not
            # restored from _entity_stack.
            return 0  # FIXME: save error info here?

        (self._parser, self._source) = self._entity_stack[-1]
        del self._entity_stack[-1]
        return 1

    def skipped_entity_handler(self, name, is_pe):
        if is_pe:
            # The SAX spec requires to report skipped PEs with a '%'
            name = '%'+name
        self._cont_handler.skippedEntity(name)

# ---

def create_parser(*args, **kwargs):
    """Return a new ExpatParser, forwarding all arguments to its constructor."""
    return ExpatParser(*args, **kwargs)

# ---

if __name__ == "__main__":
    # Demo: parse a remote document and echo it through XMLGenerator.
    # Importing xml.sax.saxutils also binds the `xml` package name used
    # for xml.sax.ErrorHandler below.
    import xml.sax.saxutils
    p = create_parser()
    p.setContentHandler(xml.sax.saxutils.XMLGenerator())
    p.setErrorHandler(xml.sax.ErrorHandler())
    p.parse("http://www.ibiblio.org/xml/examples/shakespeare/hamlet.xml")