blob: 33ad736ea81026f19d01d7fa5fbd572da80f660f [file] [log] [blame]
Fred Drake1f549022000-09-24 05:21:58 +00001"""\
Fred Drakef7cf40d2000-12-14 18:16:11 +00002minidom.py -- a lightweight DOM implementation.
Fred Drake55c38192000-06-29 19:39:57 +00003
Guido van Rossum9e1fe1e2001-02-05 19:17:50 +00004parse("foo.xml")
Paul Prescod623511b2000-07-21 22:05:49 +00005
Guido van Rossum9e1fe1e2001-02-05 19:17:50 +00006parseString("<foo><bar/></foo>")
Paul Prescod623511b2000-07-21 22:05:49 +00007
Fred Drake55c38192000-06-29 19:39:57 +00008Todo:
9=====
10 * convenience methods for getting elements and text.
11 * more testing
12 * bring some of the writer and linearizer code into conformance with this
13 interface
14 * SAX 2 namespaces
15"""
16
Fred Drake49a5d032001-11-30 22:21:58 +000017from xml.dom import HierarchyRequestErr, EMPTY_NAMESPACE
Andrew M. Kuchling291ed4f2000-12-31 03:50:23 +000018
Fred Drake4ccf4a12000-11-21 22:02:22 +000019# localize the types, and allow support for Unicode values if available:
Fred Drake1f549022000-09-24 05:21:58 +000020import types
Fred Drake4ccf4a12000-11-21 22:02:22 +000021_TupleType = types.TupleType
22try:
23 _StringTypes = (types.StringType, types.UnicodeType)
24except AttributeError:
25 _StringTypes = (types.StringType,)
26del types
27
Fred Drakef7cf40d2000-12-14 18:16:11 +000028import xml.dom
Fred Drake55c38192000-06-29 19:39:57 +000029
Fred Drake3ac6a092001-09-28 04:33:06 +000030
# NodeList is a real list subclass when the built-in ``list`` is the type of
# list objects; otherwise it is a factory that hands back a plain list.
if type([]) is not list:
    def NodeList():
        """Return a new, empty plain list used to hold nodes."""
        return []

else:
    class NodeList(list):
        """List of nodes with the DOM ``item()`` and ``length`` accessors."""

        def item(self, index):
            """Return the node at *index*, or None when it is out of range."""
            if not (0 <= index < len(self)):
                return None
            return self[index]

        length = property(lambda self: len(self),
                          doc="The number of nodes in the NodeList.")
Martin v. Löwis95700f72002-03-15 13:51:59 +000043
Fred Drake3ac6a092001-09-28 04:33:06 +000044
class Node(xml.dom.Node):
    """Common base class for the node types defined in this module.

    Maintains the ``childNodes`` list together with the ``parentNode``,
    ``previousSibling`` and ``nextSibling`` links of the children, and
    provides cloning, unlinking and the ``toxml()``/``toprettyxml()``
    entry points.  Serialization itself is delegated to the ``writexml()``
    method, and the node kind is read from the ``nodeType`` attribute;
    both are expected to be supplied by subclasses.
    """
    allnodes = {}           # debug registry; only filled while _debug is true
    _debug = 0              # set true to log node creation and unlinking
    _makeParentNodes = 1    # when true, tree edits keep parentNode up to date
    debug = None            # debug log stream, created on first use
    childNodeTypes = ()     # node types accepted as children of this node
    namespaceURI = None # this is non-null only for elements and attributes
    parentNode = None
    ownerDocument = None

    def __init__(self):
        """Give the node an empty child list (and log it in debug mode)."""
        self.childNodes = NodeList()
        if Node._debug:
            index = repr(id(self)) + repr(self.__class__)
            Node.allnodes[index] = repr(self.__dict__)
            if Node.debug is None:
                Node.debug = _get_StringIO()
                #open("debug4.out", "w")
            Node.debug.write("create %s\n" % index)

    def __nonzero__(self):
        # A node is always considered true.
        return 1

    def toxml(self, encoding = None):
        """Return the node as XML text without added indentation/newlines."""
        return self.toprettyxml("", "", encoding)

    def toprettyxml(self, indent="\t", newl="\n", encoding = None):
        """Return the node serialized through ``writexml()``.

        indent   -- the indentation string to prepend, per level
        newl     -- the newline string to append
        encoding -- when not None, the output buffer is wrapped in the
                    stream writer registered for that codec; the value is
                    forwarded to ``writexml()`` only for document nodes.
        """
        writer = _get_StringIO()
        if encoding is not None:
            import codecs
            # Can't use codecs.getwriter to preserve 2.0 compatibility
            writer = codecs.lookup(encoding)[3](writer)
        if self.nodeType == Node.DOCUMENT_NODE:
            # Can pass encoding only to document, to put it into XML header
            self.writexml(writer, "", indent, newl, encoding)
        else:
            self.writexml(writer, "", indent, newl)
        return writer.getvalue()

    def hasChildNodes(self):
        """Return 1 if the node has at least one child, else 0."""
        if self.childNodes:
            return 1
        else:
            return 0

    def _get_firstChild(self):
        # Implicitly returns None when there are no children.
        if self.childNodes:
            return self.childNodes[0]

    def _get_lastChild(self):
        # Implicitly returns None when there are no children.
        if self.childNodes:
            return self.childNodes[-1]

    try:
        property
    except NameError:
        # No ``property`` built-in: emulate computed attributes by mapping
        # ``node.foo`` to ``node._get_foo()`` and ``node._get_foo`` to a
        # callable returning ``node.foo``.  The ``inGetAttr`` instance flag
        # marks a lookup in progress so a nested miss raises instead of
        # recursing.
        def __getattr__(self, key):
            if key[0:2] == "__":
                raise AttributeError(key)
            # getattr should never call getattr!
            if self.__dict__.has_key("inGetAttr"):
                del self.inGetAttr
                raise AttributeError(key)

            prefix, attrname = key[:5], key[5:]
            if prefix == "_get_":
                self.inGetAttr = 1
                if hasattr(self, attrname):
                    del self.inGetAttr
                    return (lambda self=self, attrname=attrname:
                                    getattr(self, attrname))
                else:
                    del self.inGetAttr
                    raise AttributeError(key)
            else:
                self.inGetAttr = 1
                try:
                    func = getattr(self, "_get_" + key)
                except AttributeError:
                    raise AttributeError(key)
                del self.inGetAttr
                return func()
    else:
        firstChild = property(_get_firstChild,
                              doc="First child node, or None.")
        lastChild = property(_get_lastChild,
                             doc="Last child node, or None.")

    def insertBefore(self, newChild, refChild):
        """Insert *newChild* before *refChild* and return *newChild*.

        A *refChild* of None appends.  For a document fragment each of
        its children is inserted in order and the fragment is returned.
        *newChild* is first removed from its current parent, if any.

        Raises HierarchyRequestErr when the type of *newChild* is not in
        ``childNodeTypes``; ``childNodes.index()`` raises ValueError when
        *refChild* is not a child of this node.
        """
        if newChild.nodeType == self.DOCUMENT_FRAGMENT_NODE:
            # Iterate over a snapshot: each insertion removes the child
            # from the fragment's own child list.
            for c in tuple(newChild.childNodes):
                self.insertBefore(c, refChild)
            ### The DOM does not clearly specify what to return in this case
            return newChild
        if newChild.nodeType not in self.childNodeTypes:
            raise HierarchyRequestErr(
                  "%s cannot be child of %s" % (repr(newChild), repr(self)))
        if newChild.parentNode is not None:
            newChild.parentNode.removeChild(newChild)
        if refChild is None:
            self.appendChild(newChild)
        else:
            index = self.childNodes.index(refChild)
            self.childNodes.insert(index, newChild)
            newChild.nextSibling = refChild
            refChild.previousSibling = newChild
            if index:
                node = self.childNodes[index-1]
                node.nextSibling = newChild
                newChild.previousSibling = node
            else:
                newChild.previousSibling = None
            if self._makeParentNodes:
                newChild.parentNode = self
        return newChild

    def appendChild(self, node):
        """Append *node* as the last child and return it.

        For a document fragment each of its children is appended in order
        and the fragment is returned.  *node* is first removed from its
        current parent, if any.  Raises HierarchyRequestErr when the type
        of *node* is not in ``childNodeTypes``.
        """
        if node.nodeType == self.DOCUMENT_FRAGMENT_NODE:
            # Snapshot, because appending empties the fragment as we go.
            for c in tuple(node.childNodes):
                self.appendChild(c)
            ### The DOM does not clearly specify what to return in this case
            return node
        if node.nodeType not in self.childNodeTypes:
            raise HierarchyRequestErr(
                  "%s cannot be child of %s" % (repr(node), repr(self)))
        if node.parentNode is not None:
            node.parentNode.removeChild(node)
        if self.childNodes:
            last = self.lastChild
            node.previousSibling = last
            last.nextSibling = node
        else:
            node.previousSibling = None
        node.nextSibling = None
        self.childNodes.append(node)
        if self._makeParentNodes:
            node.parentNode = self
        return node

    def replaceChild(self, newChild, oldChild):
        """Replace *oldChild* by *newChild* and return *oldChild*.

        A document fragment is handled by removing *oldChild* and
        inserting the fragment's children in its place; the result of
        ``insertBefore()`` is returned in that case.  Replacing a child
        by itself leaves the tree untouched and returns None.

        Raises HierarchyRequestErr when the type of *newChild* is not in
        ``childNodeTypes``; ``childNodes.index()`` raises ValueError when
        *oldChild* is not a child of this node.
        """
        if newChild.nodeType == self.DOCUMENT_FRAGMENT_NODE:
            refChild = oldChild.nextSibling
            self.removeChild(oldChild)
            return self.insertBefore(newChild, refChild)
        if newChild.nodeType not in self.childNodeTypes:
            raise HierarchyRequestErr(
                  "%s cannot be child of %s" % (repr(newChild), repr(self)))
        # This test must come before newChild is detached from its parent:
        # otherwise replacing a child by itself would remove it from the
        # tree and then return without putting it back.
        if newChild is oldChild:
            return
        if newChild.parentNode is not None:
            newChild.parentNode.removeChild(newChild)
        index = self.childNodes.index(oldChild)
        self.childNodes[index] = newChild
        if self._makeParentNodes:
            newChild.parentNode = self
            oldChild.parentNode = None
        newChild.nextSibling = oldChild.nextSibling
        newChild.previousSibling = oldChild.previousSibling
        oldChild.nextSibling = None
        oldChild.previousSibling = None
        if newChild.previousSibling:
            newChild.previousSibling.nextSibling = newChild
        if newChild.nextSibling:
            newChild.nextSibling.previousSibling = newChild
        return oldChild

    def removeChild(self, oldChild):
        """Detach *oldChild* from this node and return it.

        ``childNodes.remove()`` raises ValueError when *oldChild* is not
        a child of this node.
        """
        self.childNodes.remove(oldChild)
        # Splice the neighbours together around the removed node.
        if oldChild.nextSibling is not None:
            oldChild.nextSibling.previousSibling = oldChild.previousSibling
        if oldChild.previousSibling is not None:
            oldChild.previousSibling.nextSibling = oldChild.nextSibling
        oldChild.nextSibling = oldChild.previousSibling = None

        if self._makeParentNodes:
            oldChild.parentNode = None
        return oldChild

    def normalize(self):
        """Merge adjacent text children and drop empty ones, recursively.

        Discarded text nodes are unlinked.  Element children are
        normalized in turn.
        """
        kept = []
        for child in self.childNodes:
            if child.nodeType == Node.TEXT_NODE:
                data = child.data
                if data and kept and kept[-1].nodeType == child.nodeType:
                    # collapse text node
                    # NOTE(review): a ``length`` attribute stored on the
                    # merged node is not refreshed here -- confirm whether
                    # text nodes rely on it.
                    node = kept[-1]
                    node.data = node.nodeValue = node.data + child.data
                    node.nextSibling = child.nextSibling
                    child.unlink()
                elif data:
                    if kept:
                        kept[-1].nextSibling = child
                        child.previousSibling = kept[-1]
                    else:
                        child.previousSibling = None
                    kept.append(child)
                else:
                    # empty text node; discard
                    child.unlink()
            else:
                if kept:
                    kept[-1].nextSibling = child
                    child.previousSibling = kept[-1]
                else:
                    child.previousSibling = None
                kept.append(child)
                if child.nodeType == Node.ELEMENT_NODE:
                    child.normalize()
        if kept:
            # The last surviving child may still point at a discarded
            # trailing text node; terminate the sibling chain explicitly.
            kept[-1].nextSibling = None
        self.childNodes[:] = kept

    def cloneNode(self, deep):
        """Return a copy of this node; with *deep* true, copy the subtree.

        The copy is built without calling ``__init__`` from a shallow
        copy of the instance dictionary, then given a fresh child list.
        """
        import new
        # NOTE(review): the shallow __dict__ copy also carries over any
        # previousSibling/nextSibling stored on this instance.
        clone = new.instance(self.__class__, self.__dict__.copy())
        if self._makeParentNodes:
            clone.parentNode = None
        clone.childNodes = NodeList()
        if deep:
            for child in self.childNodes:
                clone.appendChild(child.cloneNode(1))
        return clone

    # DOM Level 3 (Working Draft 2001-Jan-26)

    def isSameNode(self, other):
        """Return true when *other* is this very node object."""
        return self is other

    # minidom-specific API:

    def unlink(self):
        """Recursively drop the references this subtree holds.

        Clears the parent, owner-document and sibling links, unlinks every
        child and replaces ``childNodes`` by None, so the node must not be
        used as a tree node afterwards.
        """
        self.parentNode = self.ownerDocument = None
        for child in self.childNodes:
            child.unlink()
        self.childNodes = None
        self.previousSibling = None
        self.nextSibling = None
        if Node._debug:
            index = repr(id(self)) + repr(self.__class__)
            self.debug.write("Deleting: %s\n" % index)
            del Node.allnodes[index]
Fred Drake55c38192000-06-29 19:39:57 +0000286
Fred Drake1f549022000-09-24 05:21:58 +0000287def _write_data(writer, data):
Fred Drake55c38192000-06-29 19:39:57 +0000288 "Writes datachars to writer."
Neal Norwitzab199622002-05-31 20:46:39 +0000289 data = data.replace("&", "&amp;")
290 data = data.replace("<", "&lt;")
291 data = data.replace("\"", "&quot;")
292 data = data.replace(">", "&gt;")
Fred Drake55c38192000-06-29 19:39:57 +0000293 writer.write(data)
294
Fred Drake1f549022000-09-24 05:21:58 +0000295def _getElementsByTagNameHelper(parent, name, rc):
Fred Drake55c38192000-06-29 19:39:57 +0000296 for node in parent.childNodes:
Fred Drake1f549022000-09-24 05:21:58 +0000297 if node.nodeType == Node.ELEMENT_NODE and \
298 (name == "*" or node.tagName == name):
299 rc.append(node)
300 _getElementsByTagNameHelper(node, name, rc)
Fred Drake55c38192000-06-29 19:39:57 +0000301 return rc
302
Fred Drake1f549022000-09-24 05:21:58 +0000303def _getElementsByTagNameNSHelper(parent, nsURI, localName, rc):
Fred Drake55c38192000-06-29 19:39:57 +0000304 for node in parent.childNodes:
Fred Drake1f549022000-09-24 05:21:58 +0000305 if node.nodeType == Node.ELEMENT_NODE:
Martin v. Löwised525fb2001-06-03 14:06:42 +0000306 if ((localName == "*" or node.localName == localName) and
Fred Drake1f549022000-09-24 05:21:58 +0000307 (nsURI == "*" or node.namespaceURI == nsURI)):
308 rc.append(node)
Fred Drakef7cf40d2000-12-14 18:16:11 +0000309 _getElementsByTagNameNSHelper(node, nsURI, localName, rc)
310 return rc
Fred Drake55c38192000-06-29 19:39:57 +0000311
class DocumentFragment(Node):
    """Node class for document fragments.

    Adds no behaviour of its own; it only fixes the node's identifying
    attributes and the set of node types it accepts as children.
    """
    nodeType = Node.DOCUMENT_FRAGMENT_NODE
    nodeName = "#document-fragment"
    nodeValue = None
    attributes = None
    parentNode = None

    # Node types that may be added as children of a fragment.
    childNodeTypes = (
        Node.ELEMENT_NODE,
        Node.TEXT_NODE,
        Node.CDATA_SECTION_NODE,
        Node.ENTITY_REFERENCE_NODE,
        Node.PROCESSING_INSTRUCTION_NODE,
        Node.COMMENT_NODE,
        Node.NOTATION_NODE,
    )
325
326
class Attr(Node):
    """Attribute node.

    ``name``/``nodeName`` and ``value``/``nodeValue`` are kept as pairs of
    synonyms: assigning to either member of a pair updates both.
    """
    nodeType = Node.ATTRIBUTE_NODE
    attributes = None
    ownerElement = None
    childNodeTypes = (Node.TEXT_NODE, Node.ENTITY_REFERENCE_NODE)

    def __init__(self, qName, namespaceURI=EMPTY_NAMESPACE, localName=None, prefix=None):
        """Create an attribute named *qName*.

        *localName* falls back to *qName* when it is empty or None.
        """
        if not localName:
            localName = qName
        # skip setattr for performance
        self.__dict__.update({
            "localName": localName,
            "nodeName": qName,
            "name": qName,
            "namespaceURI": namespaceURI,
            "prefix": prefix,
        })
        Node.__init__(self)
        # nodeValue and value are set elsewhere

    def __setattr__(self, name, value):
        # Store straight into the instance dictionary, mirroring the
        # synonym pairs so both spellings always agree.
        state = self.__dict__
        if name == "value" or name == "nodeValue":
            state["value"] = value
            state["nodeValue"] = value
        elif name == "name" or name == "nodeName":
            state["name"] = value
            state["nodeName"] = value
        else:
            state[name] = value

    def cloneNode(self, deep):
        """Return a clone that carries no ``ownerElement`` of its own."""
        clone = Node.cloneNode(self, deep)
        # Drop the copied instance-level owner, if there is one, so the
        # clone falls back to the class default (None).
        try:
            del clone.__dict__["ownerElement"]
        except KeyError:
            pass
        return clone
357
Fred Drakef7cf40d2000-12-14 18:16:11 +0000358
class NamedNodeMap:
    """The attribute list is a transient interface to the underlying
    dictionaries.  Mutations here will change the underlying element's
    dictionary.

    Ordering is imposed artificially and does not reflect the order of
    attributes as found in an input document.

    Two dictionaries are shared with the owning element: one keyed by
    attribute name and one keyed by ``(namespaceURI, localName)``.
    """

    def __init__(self, attrs, attrsNS, ownerElement):
        """Wrap the given dictionaries; they are used, not copied."""
        self._attrs = attrs
        self._attrsNS = attrsNS
        self._ownerElement = ownerElement

    # ``length`` is always computed from the live dictionary and is never
    # stored on the instance.
    try:
        property
    except NameError:
        def __getattr__(self, name):
            if name == "length":
                return len(self._attrs)
            raise AttributeError(name)
    else:
        length = property(lambda self: len(self._attrs),
                          doc="Number of nodes in the NamedNodeMap.")

    def item(self, index):
        """Return the *index*-th attribute node, or None if out of range."""
        try:
            return self[self._attrs.keys()[index]]
        except IndexError:
            return None

    def items(self):
        """Return a list of ``(nodeName, value)`` pairs."""
        L = []
        for node in self._attrs.values():
            L.append((node.nodeName, node.value))
        return L

    def itemsNS(self):
        """Return a list of ``((namespaceURI, localName), value)`` pairs."""
        L = []
        for node in self._attrs.values():
            L.append(((node.namespaceURI, node.localName), node.value))
        return L

    def keys(self):
        """Return the attribute names."""
        return self._attrs.keys()

    def keysNS(self):
        """Return the ``(namespaceURI, localName)`` keys."""
        return self._attrsNS.keys()

    def values(self):
        """Return the attribute nodes."""
        return self._attrs.values()

    def get(self, name, value = None):
        """Return the attribute node called *name*, or *value* if absent."""
        return self._attrs.get(name, value)

    def __len__(self):
        return self.length

    def __cmp__(self, other):
        # Two maps compare equal when they wrap the same name dictionary;
        # anything else is ordered by object identity.
        if self._attrs is getattr(other, "_attrs", None):
            return 0
        else:
            return cmp(id(self), id(other))

    #FIXME: is it appropriate to return .value?
    def __getitem__(self, attname_or_tuple):
        # A tuple key is looked up as (namespaceURI, localName); any other
        # key is looked up as an attribute name.  Raises KeyError if absent.
        if type(attname_or_tuple) is _TupleType:
            return self._attrsNS[attname_or_tuple]
        else:
            return self._attrs[attname_or_tuple]

    # same as set
    def __setitem__(self, attname, value):
        """Store *value* under *attname*.

        A string creates a new Attr named *attname* owned by the element's
        document; an Attr instance is stored as is, under its own name.
        Raises TypeError for any other kind of value.
        """
        if type(value) in _StringTypes:
            node = Attr(attname)
            node.value = value
            node.ownerDocument = self._ownerElement.ownerDocument
        else:
            if not isinstance(value, Attr):
                raise TypeError("value must be a string or Attr object")
            node = value
        self.setNamedItem(node)

    def setNamedItem(self, node):
        """Register *node* under its name and namespace key.

        Returns the node previously registered under the same name, or
        None.  A replaced node is unlinked.  Raises HierarchyRequestErr
        when *node* is not an Attr.
        """
        if not isinstance(node, Attr):
            raise HierarchyRequestErr(
                  "%s cannot be child of %s" % (repr(node), repr(self)))
        old = self._attrs.get(node.name)
        # Only unlink a node that is really being replaced: unlinking
        # *node* itself would clear the child list and owner document of
        # the node we are about to keep.
        if old is not None and old is not node:
            old.unlink()
        self._attrs[node.name] = node
        self._attrsNS[(node.namespaceURI, node.localName)] = node
        node.ownerElement = self._ownerElement
        return old

    def setNamedItemNS(self, node):
        """Same as setNamedItem(); both indexes are always updated."""
        return self.setNamedItem(node)

    def __delitem__(self, attname_or_tuple):
        """Unlink the addressed attribute and drop it from both indexes."""
        node = self[attname_or_tuple]
        node.unlink()
        del self._attrs[node.name]
        del self._attrsNS[(node.namespaceURI, node.localName)]
        # Nothing to update for ``length``: it is derived from the
        # dictionary.  Assigning it here would either fail (read-only
        # property) or leave a stale instance attribute behind.

# Second name bound to the same class (presumably kept for backward
# compatibility -- confirm against callers).
AttributeList = NamedNodeMap
465
Fred Drake1f549022000-09-24 05:21:58 +0000466
class Element(Node):
    """Element node.

    Attributes are stored as attribute nodes in two dictionaries, one
    keyed by attribute name and one keyed by ``(namespaceURI, localName)``;
    ``attributes`` exposes them through a NamedNodeMap.
    """
    nodeType = Node.ELEMENT_NODE
    nextSibling = None
    previousSibling = None
    childNodeTypes = (Node.ELEMENT_NODE, Node.PROCESSING_INSTRUCTION_NODE,
                      Node.COMMENT_NODE, Node.TEXT_NODE,
                      Node.CDATA_SECTION_NODE, Node.ENTITY_REFERENCE_NODE)

    def __init__(self, tagName, namespaceURI=EMPTY_NAMESPACE, prefix=None,
                 localName=None):
        """Create an element; *localName* falls back to *tagName*."""
        Node.__init__(self)
        self.tagName = self.nodeName = tagName
        self.localName = localName or tagName
        self.prefix = prefix
        self.namespaceURI = namespaceURI
        self.nodeValue = None

        self._attrs = {}   # attributes are double-indexed:
        self._attrsNS = {} #    tagName -> Attribute
                           #    URI,localName -> Attribute
                           # in the future: consider lazy generation
                           # of attribute objects this is too tricky
                           # for now because of headaches with
                           # namespaces.

    def cloneNode(self, deep):
        """Return a copy of the element; attributes are always cloned."""
        clone = Node.cloneNode(self, deep)
        # The base clone shares our attribute dictionaries; give the copy
        # its own, filled with clones of the attribute nodes.
        clone._attrs = {}
        clone._attrsNS = {}
        for attr in self._attrs.values():
            node = attr.cloneNode(1)
            clone._attrs[node.name] = node
            clone._attrsNS[(node.namespaceURI, node.localName)] = node
            node.ownerElement = clone
        return clone

    def unlink(self):
        """Unlink the attribute nodes, then the element and its subtree."""
        for attr in self._attrs.values():
            attr.unlink()
        self._attrs = None
        self._attrsNS = None
        Node.unlink(self)

    def getAttribute(self, attname):
        """Return the value of attribute *attname*, or "" if absent."""
        try:
            return self._attrs[attname].value
        except KeyError:
            return ""

    def getAttributeNS(self, namespaceURI, localName):
        """Return the value of the namespaced attribute, or "" if absent."""
        try:
            return self._attrsNS[(namespaceURI, localName)].value
        except KeyError:
            return ""

    def setAttribute(self, attname, value):
        """Set attribute *attname* to *value* using a new attribute node."""
        attr = Attr(attname)
        # for performance
        d = attr.__dict__
        d["value"] = d["nodeValue"] = value
        d["ownerDocument"] = self.ownerDocument
        self.setAttributeNode(attr)

    def setAttributeNS(self, namespaceURI, qualifiedName, value):
        """Set a namespaced attribute using a new attribute node."""
        prefix, localname = _nssplit(qualifiedName)
        # for performance
        attr = Attr(qualifiedName, namespaceURI, localname, prefix)
        d = attr.__dict__
        d["value"] = d["nodeValue"] = value
        d["ownerDocument"] = self.ownerDocument
        self.setAttributeNode(attr)

    def getAttributeNode(self, attrname):
        """Return the attribute node called *attrname*, or None."""
        return self._attrs.get(attrname)

    def getAttributeNodeNS(self, namespaceURI, localName):
        """Return the namespaced attribute node, or None."""
        return self._attrsNS.get((namespaceURI, localName))

    def setAttributeNode(self, attr):
        """Attach *attr* to this element.

        Returns the attribute node it replaced, or None when there was
        none or when *attr* was already attached here.  A replaced node
        is unlinked.  Raises xml.dom.InuseAttributeErr when *attr* belongs
        to another element.
        """
        if attr.ownerElement not in (None, self):
            raise xml.dom.InuseAttributeErr("attribute node already owned")
        old = self._attrs.get(attr.name, None)
        # Only unlink a node that is really being replaced: unlinking
        # *attr* itself would clear the child list and owner document of
        # the node that stays attached.
        if old is not None and old is not attr:
            old.unlink()
        self._attrs[attr.name] = attr
        self._attrsNS[(attr.namespaceURI, attr.localName)] = attr

        # This creates a circular reference, but Element.unlink()
        # breaks the cycle since the references to the attribute
        # dictionaries are tossed.
        attr.ownerElement = self

        if old is not attr:
            # It might have already been part of this node, in which case
            # it doesn't represent a change, and should not be returned.
            return old

    setAttributeNodeNS = setAttributeNode

    def removeAttribute(self, name):
        """Remove attribute *name*; raises KeyError if it is absent."""
        attr = self._attrs[name]
        self.removeAttributeNode(attr)

    def removeAttributeNS(self, namespaceURI, localName):
        """Remove the namespaced attribute; raises KeyError if absent."""
        attr = self._attrsNS[(namespaceURI, localName)]
        self.removeAttributeNode(attr)

    def removeAttributeNode(self, node):
        """Unlink *node* and drop it from both attribute indexes."""
        node.unlink()
        del self._attrs[node.name]
        del self._attrsNS[(node.namespaceURI, node.localName)]

    removeAttributeNodeNS = removeAttributeNode

    def hasAttribute(self, name):
        """Return true if an attribute called *name* is present."""
        return self._attrs.has_key(name)

    def hasAttributeNS(self, namespaceURI, localName):
        """Return true if the namespaced attribute is present."""
        return self._attrsNS.has_key((namespaceURI, localName))

    def getElementsByTagName(self, name):
        """Return the descendant elements named *name* ("*" matches all)."""
        return _getElementsByTagNameHelper(self, name, NodeList())

    def getElementsByTagNameNS(self, namespaceURI, localName):
        """Return the descendant elements matching the namespaced name."""
        return _getElementsByTagNameNSHelper(self, namespaceURI, localName,
                                             NodeList())

    def __repr__(self):
        return "<DOM Element: %s at %s>" % (self.tagName, id(self))

    def writexml(self, writer, indent="", addindent="", newl=""):
        """Write the element, its attributes and its children to *writer*.

        Attributes are written sorted by name with escaped values; an
        element without children is written as an empty-element tag.
        """
        # indent = current indentation
        # addindent = indentation to add to higher levels
        # newl = newline string
        writer.write(indent+"<" + self.tagName)

        attrs = self._get_attributes()
        a_names = attrs.keys()
        a_names.sort()

        for a_name in a_names:
            writer.write(" %s=\"" % a_name)
            _write_data(writer, attrs[a_name].value)
            writer.write("\"")
        if self.childNodes:
            writer.write(">%s"%(newl))
            for node in self.childNodes:
                node.writexml(writer,indent+addindent,addindent,newl)
            writer.write("%s</%s>%s" % (indent,self.tagName,newl))
        else:
            writer.write("/>%s"%(newl))

    def _get_attributes(self):
        # A fresh wrapper is built on every access; it shares the
        # element's own dictionaries.
        return NamedNodeMap(self._attrs, self._attrsNS, self)

    try:
        property
    except NameError:
        pass
    else:
        attributes = property(_get_attributes,
                              doc="NamedNodeMap of attributes on the element.")

    def hasAttributes(self):
        """Return 1 if the element has any attribute, else 0."""
        if self._attrs or self._attrsNS:
            return 1
        else:
            return 0
635
class Comment(Node):
    """Comment node; its text is available as ``data`` and ``nodeValue``."""
    nodeType = Node.COMMENT_NODE
    nodeName = "#comment"
    attributes = None
    childNodeTypes = ()

    def __init__(self, data):
        """Create a comment holding *data*."""
        Node.__init__(self)
        self.data = data
        self.nodeValue = data

    def writexml(self, writer, indent="", addindent="", newl=""):
        """Write the comment to *writer*; the text is written unescaped.

        *addindent* is accepted for signature compatibility and unused.
        """
        markup = "%s<!--%s-->%s" % (indent, self.data, newl)
        writer.write(markup)
Fred Drake1f549022000-09-24 05:21:58 +0000648
class ProcessingInstruction(Node):
    """DOM processing-instruction node made of a target and its data."""

    nodeType = Node.PROCESSING_INSTRUCTION_NODE
    attributes = None
    childNodeTypes = ()

    def __init__(self, target, data):
        """Store *target* (also used as nodeName) and *data* (nodeValue)."""
        Node.__init__(self)
        self.target = target
        self.nodeName = target
        self.data = data
        self.nodeValue = data

    def writexml(self, writer, indent="", addindent="", newl=""):
        """Write ``<?target data?>`` to *writer*, framed by indent and newl.

        addindent is accepted but not used.
        """
        pieces = (indent, self.target, self.data, newl)
        writer.write("%s<?%s %s?>%s" % pieces)
Fred Drake55c38192000-06-29 19:39:57 +0000661
class CharacterData(Node):
    """Shared behaviour of nodes whose content is a string (``data``).

    ``nodeValue`` and ``length`` are plain attributes in this class, so
    every method that changes ``data`` refreshes both of them.

    Offsets follow the DOM rule: an offset equal to ``len(data)`` is
    legal (it denotes the position just past the last character); only
    negative offsets and offsets greater than the length raise
    ``xml.dom.IndexSizeErr``.
    """

    def __init__(self, data):
        """Create the node with *data* as content.

        Raises TypeError when the type of *data* is not one of
        ``_StringTypes``.
        """
        if type(data) not in _StringTypes:
            raise TypeError("node contents must be a string")
        Node.__init__(self)
        self.data = self.nodeValue = data
        self.length = len(data)

    def __repr__(self):
        # Show at most the first ten characters, flagging truncation.
        if len(self.data) > 10:
            dotdotdot = "..."
        else:
            dotdotdot = ""
        return "<DOM %s node \"%s%s\">" % (
            self.__class__.__name__, self.data[0:10], dotdotdot)

    def substringData(self, offset, count):
        """Return up to *count* characters of the data starting at *offset*.

        Raises xml.dom.IndexSizeErr for a negative offset, an offset
        greater than the data length, or a negative count.
        """
        if offset < 0:
            raise xml.dom.IndexSizeErr("offset cannot be negative")
        if offset > len(self.data):
            raise xml.dom.IndexSizeErr("offset cannot be beyond end of data")
        if count < 0:
            raise xml.dom.IndexSizeErr("count cannot be negative")
        return self.data[offset:offset+count]

    def appendData(self, arg):
        """Append *arg* to the end of the data."""
        self.data = self.data + arg
        self.nodeValue = self.data
        self.length = len(self.data)

    def insertData(self, offset, arg):
        """Insert *arg* into the data at *offset*.

        An offset equal to the data length appends.  Raises
        xml.dom.IndexSizeErr for a negative offset or one greater than
        the data length.
        """
        if offset < 0:
            raise xml.dom.IndexSizeErr("offset cannot be negative")
        if offset > len(self.data):
            raise xml.dom.IndexSizeErr("offset cannot be beyond end of data")
        if arg:
            self.data = "%s%s%s" % (
                self.data[:offset], arg, self.data[offset:])
            self.nodeValue = self.data
            self.length = len(self.data)

    def deleteData(self, offset, count):
        """Remove up to *count* characters starting at *offset*.

        Raises xml.dom.IndexSizeErr for a negative offset, an offset
        greater than the data length, or a negative count.
        """
        if offset < 0:
            raise xml.dom.IndexSizeErr("offset cannot be negative")
        if offset > len(self.data):
            raise xml.dom.IndexSizeErr("offset cannot be beyond end of data")
        if count < 0:
            raise xml.dom.IndexSizeErr("count cannot be negative")
        if count:
            self.data = self.data[:offset] + self.data[offset+count:]
            self.nodeValue = self.data
            self.length = len(self.data)

    def replaceData(self, offset, count, arg):
        """Replace up to *count* characters at *offset* with *arg*.

        A count of zero replaces nothing and therefore inserts *arg* at
        *offset*.  Raises xml.dom.IndexSizeErr for a negative offset, an
        offset greater than the data length, or a negative count.
        """
        if offset < 0:
            raise xml.dom.IndexSizeErr("offset cannot be negative")
        if offset > len(self.data):
            raise xml.dom.IndexSizeErr("offset cannot be beyond end of data")
        if count < 0:
            raise xml.dom.IndexSizeErr("count cannot be negative")
        # Splice unconditionally: skipping the splice when count == 0
        # would silently discard arg.
        self.data = "%s%s%s" % (
            self.data[:offset], arg, self.data[offset+count:])
        self.nodeValue = self.data
        self.length = len(self.data)
Fred Drake87432f42001-04-04 14:09:46 +0000727
class Text(CharacterData):
    """DOM text node."""

    nodeType = Node.TEXT_NODE
    nodeName = "#text"
    attributes = None
    childNodeTypes = ()

    def splitText(self, offset):
        """Split this node at *offset* and return the new trailing node.

        This node keeps ``data[:offset]``; the returned node holds the
        remainder, is of the same class as this node and shares its
        owner document.  When this node is found among its parent's
        children, the new node is inserted right after it.

        Raises xml.dom.IndexSizeErr when *offset* is negative or greater
        than the length of the data.
        """
        if offset < 0 or offset > len(self.data):
            raise xml.dom.IndexSizeErr("illegal offset value")
        # Build the tail with this node's own class so that splitting a
        # subclass instance (e.g. a CDATA section) yields the same kind.
        newText = self.__class__(self.data[offset:])
        # The tail belongs to the same document as the node it came from.
        newText.ownerDocument = getattr(self, "ownerDocument", None)
        following = self.nextSibling
        if self.parentNode and self in self.parentNode.childNodes:
            if following is None:
                self.parentNode.appendChild(newText)
            else:
                self.parentNode.insertBefore(newText, following)
        self.data = self.data[:offset]
        self.nodeValue = self.data
        self.length = len(self.data)
        return newText

    def writexml(self, writer, indent="", addindent="", newl=""):
        """Write indent + data + newl to *writer* through _write_data().

        addindent is accepted but not used.
        """
        _write_data(writer, "%s%s%s"%(indent, self.data, newl))
Fred Drake55c38192000-06-29 19:39:57 +0000751
Fred Drake87432f42001-04-04 14:09:46 +0000752
class CDATASection(Text):
    """DOM CDATA section node."""

    nodeType = Node.CDATA_SECTION_NODE
    nodeName = "#cdata-section"

    def writexml(self, writer, indent="", addindent="", newl=""):
        """Write the data wrapped in ``<![CDATA[`` ... ``]]>`` to *writer*.

        indent, addindent and newl are accepted but not used, and the
        data is written without escaping.
        """
        section = "<![CDATA[%s]]>" % self.data
        writer.write(section)
Fred Drake87432f42001-04-04 14:09:46 +0000759
760
Fred Drake1f549022000-09-24 05:21:58 +0000761def _nssplit(qualifiedName):
Neal Norwitzab199622002-05-31 20:46:39 +0000762 fields = qualifiedName.split(':', 1)
Paul Prescod73678da2000-07-01 04:58:47 +0000763 if len(fields) == 2:
764 return fields
765 elif len(fields) == 1:
Fred Drake49a5d032001-11-30 22:21:58 +0000766 return (None, fields[0])
Paul Prescod73678da2000-07-01 04:58:47 +0000767
Fred Drakef7cf40d2000-12-14 18:16:11 +0000768
class DocumentType(Node):
    """DOM document type node.

    Every descriptive attribute defaults to None at class level; the
    constructor only fills in ``name``.
    """

    nodeType = Node.DOCUMENT_TYPE_NODE
    nodeValue = attributes = None
    name = None
    publicId = systemId = None
    internalSubset = None
    entities = notations = None

    def __init__(self, qualifiedName):
        """Set ``name`` to the local part of *qualifiedName*.

        A false *qualifiedName* (None or "") leaves ``name`` as None.
        """
        Node.__init__(self)
        if not qualifiedName:
            return
        _prefix, local_part = _nssplit(qualifiedName)
        self.name = local_part
784 self.name = localname
785
786
class DOMImplementation:
    """Factory for Document and DocumentType objects."""

    def hasFeature(self, feature, version):
        """Report whether *feature* is available in DOM *version*.

        Only the "core" feature (compared case-insensitively) is
        reported, for versions "1.0" and "2.0".  A *version* of None or
        "" means "any version" and is accepted as well.  Returns 0 for
        an unsupported version, otherwise the result of the feature
        comparison.
        """
        if version not in (None, "", "1.0", "2.0"):
            return 0
        feature = feature.lower()
        return feature == "core"

    def createDocument(self, namespaceURI, qualifiedName, doctype):
        """Create a document with a root element named *qualifiedName*.

        When *doctype* is None a DocumentType is created from
        *qualifiedName*.  The doctype is linked to the new document via
        its parentNode and ownerDocument attributes and stored as
        ``doc.doctype``.

        Raises:
          xml.dom.WrongDocumentErr    -- *doctype* already has a parent
          xml.dom.InvalidCharacterErr -- *qualifiedName* is empty
          xml.dom.NamespaceErr        -- the "xml" prefix is used with
                                         another namespace URI, or a
                                         prefix is given without one
        """
        if doctype and doctype.parentNode is not None:
            raise xml.dom.WrongDocumentErr(
                "doctype object owned by another DOM tree")
        doc = self._createDocument()
        if doctype is None:
            doctype = self.createDocumentType(qualifiedName, None, None)
        if not qualifiedName:
            # The spec is unclear what to raise here; SyntaxErr
            # would be the other obvious candidate. Since Xerces raises
            # InvalidCharacterErr, and since SyntaxErr is not listed
            # for createDocument, that seems to be the better choice.
            # XXX: need to check for illegal characters here and in
            # createElement.
            raise xml.dom.InvalidCharacterErr("Element with no name")
        prefix, localname = _nssplit(qualifiedName)
        if prefix == "xml" \
           and namespaceURI != "http://www.w3.org/XML/1998/namespace":
            raise xml.dom.NamespaceErr("illegal use of 'xml' prefix")
        if prefix and not namespaceURI:
            raise xml.dom.NamespaceErr(
                "illegal use of prefix without namespaces")
        element = doc.createElementNS(namespaceURI, qualifiedName)
        doc.appendChild(element)
        doctype.parentNode = doctype.ownerDocument = doc
        doc.doctype = doctype
        doc.implementation = self
        return doc

    def createDocumentType(self, qualifiedName, publicId, systemId):
        """Return a new DocumentType carrying the given identifiers."""
        doctype = DocumentType(qualifiedName)
        doctype.publicId = publicId
        doctype.systemId = systemId
        return doctype

    # internal
    def _createDocument(self):
        """Return a new, empty Document."""
        return Document()
Fred Drakef7cf40d2000-12-14 18:16:11 +0000832
class Document(Node):
    """Document node: top of a DOM tree and factory for its nodes.

    Every create*() method returns a node whose ``ownerDocument`` is
    this document.
    """

    nodeType = Node.DOCUMENT_NODE
    nodeName = "#document"
    nodeValue = None
    attributes = None
    doctype = None
    parentNode = None
    previousSibling = nextSibling = None

    implementation = DOMImplementation()
    childNodeTypes = (Node.ELEMENT_NODE, Node.PROCESSING_INSTRUCTION_NODE,
                      Node.COMMENT_NODE, Node.DOCUMENT_TYPE_NODE)

    def appendChild(self, node):
        """Append *node* to the document and return the result.

        Raises HierarchyRequestErr when the node's type is not listed in
        childNodeTypes, or when *node* is an element and the document
        already has a document element.
        """
        if node.nodeType not in self.childNodeTypes:
            raise HierarchyRequestErr(
                "%s cannot be child of %s" % (repr(node), repr(self)))
        # Detach first: if node is already the document element of this
        # document, the duplicate-element test below must not see it.
        if node.parentNode is not None:
            node.parentNode.removeChild(node)

        if node.nodeType == Node.ELEMENT_NODE \
           and self._get_documentElement():
            raise xml.dom.HierarchyRequestErr(
                "two document elements disallowed")
        return Node.appendChild(self, node)

    def removeChild(self, oldChild):
        """Remove *oldChild* from the document and return it.

        The removed node's parent and sibling links are cleared and its
        former neighbours are linked to each other.  Raises ValueError
        (from list.remove) when *oldChild* is not a child.
        """
        self.childNodes.remove(oldChild)
        # Re-link the neighbours so that neither keeps pointing at the
        # node that has just been taken out of the tree.
        before = getattr(oldChild, "previousSibling", None)
        after = getattr(oldChild, "nextSibling", None)
        if before is not None:
            before.nextSibling = after
        if after is not None:
            after.previousSibling = before
        oldChild.nextSibling = oldChild.previousSibling = None
        oldChild.parentNode = None
        # NOTE(review): documentElement is computed from childNodes when
        # the property below is in effect, so this branch looks reachable
        # only if oldChild was listed more than once -- confirm.
        if self.documentElement is oldChild:
            self.documentElement = None

        return oldChild

    def _get_documentElement(self):
        """Return the first element among the children, or None."""
        for node in self.childNodes:
            if node.nodeType == Node.ELEMENT_NODE:
                return node

    # Expose the accessor as a property where the interpreter provides
    # the ``property`` builtin.
    try:
        property
    except NameError:
        pass
    else:
        documentElement = property(_get_documentElement,
                                   doc="Top-level element of this document.")

    def unlink(self):
        """Unlink the doctype, if any, and then the document itself."""
        if self.doctype is not None:
            self.doctype.unlink()
            self.doctype = None
        Node.unlink(self)

    def createDocumentFragment(self):
        """Return a new DocumentFragment owned by this document."""
        d = DocumentFragment()
        # Was stored as "ownerDoc"; every other factory method here uses
        # the ownerDocument attribute.
        d.ownerDocument = self
        return d

    def createElement(self, tagName):
        """Return a new Element named *tagName*."""
        e = Element(tagName)
        e.ownerDocument = self
        return e

    def createTextNode(self, data):
        """Return a new Text node holding *data*."""
        t = Text(data)
        t.ownerDocument = self
        return t

    def createCDATASection(self, data):
        """Return a new CDATASection holding *data*."""
        c = CDATASection(data)
        c.ownerDocument = self
        return c

    def createComment(self, data):
        """Return a new Comment holding *data*."""
        c = Comment(data)
        c.ownerDocument = self
        return c

    def createProcessingInstruction(self, target, data):
        """Return a new ProcessingInstruction for *target* and *data*."""
        p = ProcessingInstruction(target, data)
        p.ownerDocument = self
        return p

    def createAttribute(self, qName):
        """Return a new Attr named *qName* with an empty value."""
        a = Attr(qName)
        a.ownerDocument = self
        a.value = ""
        return a

    def createElementNS(self, namespaceURI, qualifiedName):
        """Return a new namespace-aware Element for *qualifiedName*."""
        prefix, localName = _nssplit(qualifiedName)
        e = Element(qualifiedName, namespaceURI, prefix, localName)
        e.ownerDocument = self
        return e

    def createAttributeNS(self, namespaceURI, qualifiedName):
        """Return a new namespace-aware Attr with an empty value."""
        prefix, localName = _nssplit(qualifiedName)
        a = Attr(qualifiedName, namespaceURI, localName, prefix)
        a.ownerDocument = self
        a.value = ""
        return a

    def getElementsByTagName(self, name):
        """Return the NodeList filled by _getElementsByTagNameHelper()."""
        return _getElementsByTagNameHelper(self, name, NodeList())

    def getElementsByTagNameNS(self, namespaceURI, localName):
        """Return the NodeList filled by _getElementsByTagNameNSHelper()."""
        return _getElementsByTagNameNSHelper(self, namespaceURI, localName,
                                             NodeList())

    def writexml(self, writer, indent="", addindent="", newl="",
                 encoding = None):
        """Write the XML declaration and then every child to *writer*.

        The declaration names *encoding* only when one is given, and it
        always ends with "\\n" regardless of *newl*.  indent, addindent
        and newl are passed on to each child's writexml().
        """
        if encoding is None:
            writer.write('<?xml version="1.0" ?>\n')
        else:
            writer.write('<?xml version="1.0" encoding="%s"?>\n' % encoding)
        for node in self.childNodes:
            node.writexml(writer, indent, addindent, newl)
Fred Drake55c38192000-06-29 19:39:57 +0000951
Fred Drake4ccf4a12000-11-21 22:02:22 +0000952def _get_StringIO():
Fred Drakef7cf40d2000-12-14 18:16:11 +0000953 # we can't use cStringIO since it doesn't support Unicode strings
954 from StringIO import StringIO
Fred Drake4ccf4a12000-11-21 22:02:22 +0000955 return StringIO()
956
Fred Drake1f549022000-09-24 05:21:58 +0000957def _doparse(func, args, kwargs):
958 events = apply(func, args, kwargs)
959 toktype, rootNode = events.getEvent()
960 events.expandNode(rootNode)
Martin v. Löwisb417be22001-02-06 01:16:06 +0000961 events.clear()
Fred Drake55c38192000-06-29 19:39:57 +0000962 return rootNode
963
def parse(*args, **kwargs):
    """Parse a file into a DOM by filename or file object.

    All arguments are handed unchanged to pulldom.parse().
    """
    from xml.dom import pulldom
    stream_factory = pulldom.parse
    return _doparse(stream_factory, args, kwargs)
Fred Drake55c38192000-06-29 19:39:57 +0000968
def parseString(*args, **kwargs):
    """Parse a file into a DOM from a string.

    All arguments are handed unchanged to pulldom.parseString().
    """
    from xml.dom import pulldom
    stream_factory = pulldom.parseString
    return _doparse(stream_factory, args, kwargs)
Martin v. Löwis7edbd4f2001-02-22 14:05:50 +0000973
def getDOMImplementation():
    """Return the DOMImplementation object stored on the Document class."""
    implementation = Document.implementation
    return implementation