blob: 18b0e270de6d33e6a800b3adaa5201172f4ce5ab [file] [log] [blame]
Fred Drake1f549022000-09-24 05:21:58 +00001"""\
Fred Drakef7cf40d2000-12-14 18:16:11 +00002minidom.py -- a lightweight DOM implementation.
Fred Drake55c38192000-06-29 19:39:57 +00003
Guido van Rossum9e1fe1e2001-02-05 19:17:50 +00004parse("foo.xml")
Paul Prescod623511b2000-07-21 22:05:49 +00005
Guido van Rossum9e1fe1e2001-02-05 19:17:50 +00006parseString("<foo><bar/></foo>")
Paul Prescod623511b2000-07-21 22:05:49 +00007
Fred Drake55c38192000-06-29 19:39:57 +00008Todo:
9=====
10 * convenience methods for getting elements and text.
11 * more testing
12 * bring some of the writer and linearizer code into conformance with this
13 interface
14 * SAX 2 namespaces
15"""
16
Fred Drake1f549022000-09-24 05:21:58 +000017import string
Fred Drake4ccf4a12000-11-21 22:02:22 +000018_string = string
19del string
20
Andrew M. Kuchling291ed4f2000-12-31 03:50:23 +000021from xml.dom import HierarchyRequestErr
22
Fred Drake4ccf4a12000-11-21 22:02:22 +000023# localize the types, and allow support for Unicode values if available:
Fred Drake1f549022000-09-24 05:21:58 +000024import types
Fred Drake4ccf4a12000-11-21 22:02:22 +000025_TupleType = types.TupleType
26try:
27 _StringTypes = (types.StringType, types.UnicodeType)
28except AttributeError:
29 _StringTypes = (types.StringType,)
30del types
31
Fred Drakef7cf40d2000-12-14 18:16:11 +000032import xml.dom
33_Node = xml.dom.Node
Fred Drake55c38192000-06-29 19:39:57 +000034
Fred Drake3ac6a092001-09-28 04:33:06 +000035
if list is type([]):
    class NodeList(list):
        """List of nodes that also offers the DOM ``item()``/``length`` API."""

        def item(self, index):
            """Return the node at *index*, or None when it is out of range."""
            if not (0 <= index < len(self)):
                return None
            return self[index]

        def __getattr__(self, name):
            # Only "length" is synthesised; it always mirrors len(self).
            if name != "length":
                raise AttributeError(name)
            return len(self)

else:
    def NodeList():
        """Fallback for interpreters where ``list`` cannot be subclassed."""
        return []
50
51
class Node(_Node):
    """Common base class for the minidom node types.

    Holds the child list and the parent/owner links and implements the
    generic tree-editing operations.  Attributes that have no stored value
    are resolved by __getattr__: ``node.foo`` falls back to calling
    ``node._get_foo()``, and ``node._get_foo`` falls back to a callable
    that returns ``node.foo``.
    """
    allnodes = {}           # debug registry: id+class -> repr of __dict__
    _debug = 0              # when true, node creation/unlinking is logged
    _makeParentNodes = 1    # when true, parentNode links are maintained
    debug = None            # lazily created log stream (debug mode only)
    childNodeTypes = ()     # node types accepted as children
    namespaceURI = None # this is non-null only for elements and attributes

    def __init__(self):
        self.childNodes = NodeList()
        self.parentNode = self.ownerDocument = None
        if Node._debug:
            index = repr(id(self)) + repr(self.__class__)
            Node.allnodes[index] = repr(self.__dict__)
            if Node.debug is None:
                Node.debug = _get_StringIO()
            Node.debug.write("create %s\n" % index)

    def __getattr__(self, key):
        """Resolve ``foo`` via ``_get_foo()`` and ``_get_foo`` via ``foo``.

        Raises AttributeError naming *key* when neither form exists.
        """
        if key[0:2] == "__":
            raise AttributeError(key)
        state = self.__dict__
        # getattr should never call getattr!  The "inGetAttr" flag marks a
        # lookup in progress; finding it set means this is the nested
        # lookup, which must fail instead of recursing.
        try:
            del state["inGetAttr"]
        except KeyError:
            pass
        else:
            raise AttributeError(key)

        prefix, attrname = key[:5], key[5:]
        state["inGetAttr"] = 1
        try:
            if prefix == "_get_":
                if hasattr(self, attrname):
                    return (lambda self=self, attrname=attrname:
                            getattr(self, attrname))
                raise AttributeError(key)
            try:
                func = getattr(self, "_get_" + key)
            except AttributeError:
                raise AttributeError(key)
        finally:
            # The nested lookup consumes the flag only when it misses, so
            # clear it tolerantly; deleting it unconditionally used to
            # raise AttributeError("inGetAttr") instead of naming key.
            try:
                del state["inGetAttr"]
            except KeyError:
                pass
        return func()

    def __nonzero__(self):
        return 1

    def toxml(self):
        """Return the XML produced by writexml() as a string."""
        writer = _get_StringIO()
        self.writexml(writer)
        return writer.getvalue()

    def toprettyxml(self, indent="\t", newl="\n"):
        """Return indented XML for this node.

        indent -- the indentation string to prepend, per level
        newl   -- the newline string to append
        """
        writer = _get_StringIO()
        self.writexml(writer, "", indent, newl)
        return writer.getvalue()

    def hasChildNodes(self):
        """Return 1 if this node has children, otherwise 0."""
        if self.childNodes:
            return 1
        else:
            return 0

    def _get_firstChild(self):
        if self.childNodes:
            return self.childNodes[0]

    def _get_lastChild(self):
        if self.childNodes:
            return self.childNodes[-1]

    def insertBefore(self, newChild, refChild):
        """Insert newChild before refChild (append when refChild is None).

        A document fragment is replaced by its children.  Raises
        HierarchyRequestErr when newChild's type is not allowed here and
        ValueError when refChild is not a child of this node.
        """
        if newChild.nodeType == self.DOCUMENT_FRAGMENT_NODE:
            # Iterate over a snapshot: every insertion removes the child
            # from the fragment, and mutating the live list while looping
            # over it skipped every other child.
            for c in tuple(newChild.childNodes):
                self.insertBefore(c, refChild)
            ### The DOM does not clearly specify what to return in this case
            return newChild
        if newChild.nodeType not in self.childNodeTypes:
            raise HierarchyRequestErr(
                "%s cannot be child of %s" % (repr(newChild), repr(self)))
        if newChild.parentNode is not None:
            newChild.parentNode.removeChild(newChild)
        if refChild is None:
            self.appendChild(newChild)
        else:
            index = self.childNodes.index(refChild)
            self.childNodes.insert(index, newChild)
            newChild.nextSibling = refChild
            refChild.previousSibling = newChild
            if index:
                node = self.childNodes[index-1]
                node.nextSibling = newChild
                newChild.previousSibling = node
            else:
                newChild.previousSibling = None
            if self._makeParentNodes:
                newChild.parentNode = self
        return newChild

    def appendChild(self, node):
        """Append node as the last child and return it.

        A document fragment is replaced by its children.  Raises
        HierarchyRequestErr when node's type is not allowed here.
        """
        if node.nodeType == self.DOCUMENT_FRAGMENT_NODE:
            # Snapshot for the same reason as in insertBefore().
            for c in tuple(node.childNodes):
                self.appendChild(c)
            ### The DOM does not clearly specify what to return in this case
            return node
        if node.nodeType not in self.childNodeTypes:
            raise HierarchyRequestErr(
                "%s cannot be child of %s" % (repr(node), repr(self)))
        if node.parentNode is not None:
            node.parentNode.removeChild(node)
        if self.childNodes:
            last = self.lastChild
            node.previousSibling = last
            last.nextSibling = node
        else:
            node.previousSibling = None
        node.nextSibling = None
        self.childNodes.append(node)
        if self._makeParentNodes:
            node.parentNode = self
        return node

    def replaceChild(self, newChild, oldChild):
        """Put newChild in oldChild's place.

        Returns oldChild, or None when both arguments are the same node.
        When newChild is a document fragment the result of insertBefore()
        is returned instead.  Raises HierarchyRequestErr when newChild's
        type is not allowed here.
        """
        if newChild.nodeType == self.DOCUMENT_FRAGMENT_NODE:
            refChild = oldChild.nextSibling
            self.removeChild(oldChild)
            return self.insertBefore(newChild, refChild)
        if newChild.nodeType not in self.childNodeTypes:
            raise HierarchyRequestErr(
                "%s cannot be child of %s" % (repr(newChild), repr(self)))
        # Must be checked before newChild is detached from its parent;
        # otherwise replacing a node with itself removed it from the tree.
        if newChild is oldChild:
            return
        if newChild.parentNode is not None:
            newChild.parentNode.removeChild(newChild)
        index = self.childNodes.index(oldChild)
        self.childNodes[index] = newChild
        if self._makeParentNodes:
            newChild.parentNode = self
            oldChild.parentNode = None
        newChild.nextSibling = oldChild.nextSibling
        newChild.previousSibling = oldChild.previousSibling
        oldChild.nextSibling = None
        oldChild.previousSibling = None
        if newChild.previousSibling:
            newChild.previousSibling.nextSibling = newChild
        if newChild.nextSibling:
            newChild.nextSibling.previousSibling = newChild
        return oldChild

    def removeChild(self, oldChild):
        """Detach oldChild from this node and return it.

        Raises ValueError when oldChild is not a child of this node.
        """
        self.childNodes.remove(oldChild)
        if oldChild.nextSibling is not None:
            oldChild.nextSibling.previousSibling = oldChild.previousSibling
        if oldChild.previousSibling is not None:
            oldChild.previousSibling.nextSibling = oldChild.nextSibling
        oldChild.nextSibling = oldChild.previousSibling = None

        if self._makeParentNodes:
            oldChild.parentNode = None
        return oldChild

    def normalize(self):
        """Merge adjacent text children and drop empty ones, recursively."""
        L = []
        for child in self.childNodes:
            if child.nodeType == Node.TEXT_NODE:
                data = child.data
                if data and L and L[-1].nodeType == child.nodeType:
                    # collapse text node
                    node = L[-1]
                    node.data = node.nodeValue = node.data + child.data
                    # CharacterData keeps a cached length next to data
                    # (see appendData/insertData); keep it in step.
                    node.length = len(node.data)
                    node.nextSibling = child.nextSibling
                    child.unlink()
                elif data:
                    if L:
                        L[-1].nextSibling = child
                        child.previousSibling = L[-1]
                    else:
                        child.previousSibling = None
                    L.append(child)
                else:
                    # empty text node; discard.  Re-point the last kept
                    # node past it first, or a trailing empty text node
                    # would remain reachable through nextSibling.
                    if L:
                        L[-1].nextSibling = child.nextSibling
                    child.unlink()
            else:
                if L:
                    L[-1].nextSibling = child
                    child.previousSibling = L[-1]
                else:
                    child.previousSibling = None
                L.append(child)
                if child.nodeType == Node.ELEMENT_NODE:
                    child.normalize()
        self.childNodes[:] = L

    def cloneNode(self, deep):
        """Return a parentless copy of this node.

        With a true *deep* the children are cloned recursively; otherwise
        the copy has no children.
        """
        import new
        clone = new.instance(self.__class__, self.__dict__.copy())
        if self._makeParentNodes:
            clone.parentNode = None
        # The copied __dict__ still carries the original's sibling links;
        # a node without a parent has no siblings.
        clone.previousSibling = clone.nextSibling = None
        clone.childNodes = NodeList()
        if deep:
            for child in self.childNodes:
                clone.appendChild(child.cloneNode(1))
        return clone

    # DOM Level 3 (Working Draft 2001-Jan-26)

    def isSameNode(self, other):
        return self is other

    # minidom-specific API:

    def unlink(self):
        """Break the links to and from this subtree so it can be collected.

        Calling it again on an already unlinked node is a no-op.
        """
        self.parentNode = self.ownerDocument = None
        # childNodes is None after a previous unlink(); don't iterate it.
        if self.childNodes:
            for child in self.childNodes:
                child.unlink()
        self.childNodes = None
        self.previousSibling = None
        self.nextSibling = None
        if Node._debug:
            index = repr(id(self)) + repr(self.__class__)
            self.debug.write("Deleting: %s\n" % index)
            try:
                del Node.allnodes[index]
            except KeyError:
                # already dropped by an earlier unlink()
                pass
Fred Drake55c38192000-06-29 19:39:57 +0000278
Fred Drake1f549022000-09-24 05:21:58 +0000279def _write_data(writer, data):
Fred Drake55c38192000-06-29 19:39:57 +0000280 "Writes datachars to writer."
Fred Drake4ccf4a12000-11-21 22:02:22 +0000281 replace = _string.replace
282 data = replace(data, "&", "&amp;")
283 data = replace(data, "<", "&lt;")
284 data = replace(data, "\"", "&quot;")
285 data = replace(data, ">", "&gt;")
Fred Drake55c38192000-06-29 19:39:57 +0000286 writer.write(data)
287
Fred Drake1f549022000-09-24 05:21:58 +0000288def _getElementsByTagNameHelper(parent, name, rc):
Fred Drake55c38192000-06-29 19:39:57 +0000289 for node in parent.childNodes:
Fred Drake1f549022000-09-24 05:21:58 +0000290 if node.nodeType == Node.ELEMENT_NODE and \
291 (name == "*" or node.tagName == name):
292 rc.append(node)
293 _getElementsByTagNameHelper(node, name, rc)
Fred Drake55c38192000-06-29 19:39:57 +0000294 return rc
295
Fred Drake1f549022000-09-24 05:21:58 +0000296def _getElementsByTagNameNSHelper(parent, nsURI, localName, rc):
Fred Drake55c38192000-06-29 19:39:57 +0000297 for node in parent.childNodes:
Fred Drake1f549022000-09-24 05:21:58 +0000298 if node.nodeType == Node.ELEMENT_NODE:
Martin v. Löwised525fb2001-06-03 14:06:42 +0000299 if ((localName == "*" or node.localName == localName) and
Fred Drake1f549022000-09-24 05:21:58 +0000300 (nsURI == "*" or node.namespaceURI == nsURI)):
301 rc.append(node)
Fred Drakef7cf40d2000-12-14 18:16:11 +0000302 _getElementsByTagNameNSHelper(node, nsURI, localName, rc)
303 return rc
Fred Drake55c38192000-06-29 19:39:57 +0000304
class DocumentFragment(Node):
    """Parentless container node; the tree-editing methods of Node splice
    in a fragment's children instead of the fragment itself."""

    nodeType = Node.DOCUMENT_FRAGMENT_NODE
    nodeName = "#document-fragment"
    nodeValue = None
    attributes = None
    parentNode = None

    # node types a fragment accepts as children
    childNodeTypes = (
        Node.ELEMENT_NODE,
        Node.TEXT_NODE,
        Node.CDATA_SECTION_NODE,
        Node.ENTITY_REFERENCE_NODE,
        Node.PROCESSING_INSTRUCTION_NODE,
        Node.COMMENT_NODE,
        Node.NOTATION_NODE,
    )
318
319
class Attr(Node):
    """Attribute node.

    ``value``/``nodeValue`` and ``name``/``nodeName`` are alias pairs:
    assigning either member of a pair updates both.
    """

    nodeType = Node.ATTRIBUTE_NODE
    attributes = None
    ownerElement = None
    childNodeTypes = (Node.TEXT_NODE, Node.ENTITY_REFERENCE_NODE)

    def __init__(self, qName, namespaceURI="", localName=None, prefix=None):
        # Fill the instance dictionary directly; going through
        # __setattr__ for every field would be slower.
        fields = self.__dict__
        fields["localName"] = localName or qName
        fields["nodeName"] = qName
        fields["name"] = qName
        fields["namespaceURI"] = namespaceURI
        fields["prefix"] = prefix
        Node.__init__(self)
        # nodeValue and value are set elsewhere

    def __setattr__(self, name, value):
        fields = self.__dict__
        if name == "value" or name == "nodeValue":
            fields["value"] = value
            fields["nodeValue"] = value
        elif name == "name" or name == "nodeName":
            fields["name"] = value
            fields["nodeName"] = value
        else:
            fields[name] = value

    def cloneNode(self, deep):
        """Clone the attribute; the copy belongs to no element."""
        clone = Node.cloneNode(self, deep)
        # Drop the copied owner so the class-level default (None) shows.
        try:
            del clone.__dict__["ownerElement"]
        except KeyError:
            pass
        return clone
350
Fred Drakef7cf40d2000-12-14 18:16:11 +0000351
class NamedNodeMap:
    """The attribute list is a transient interface to the underlying
    dictionaries.  Mutations here will change the underlying element's
    dictionary.

    Two dictionaries are shared with the element: one keyed by attribute
    name and one keyed by (namespaceURI, localName).

    Ordering is imposed artificially and does not reflect the order of
    attributes as found in an input document.
    """

    def __init__(self, attrs, attrsNS):
        self._attrs = attrs
        self._attrsNS = attrsNS

    def __getattr__(self, name):
        # "length" is always computed from the live dictionary.
        if name == "length":
            return len(self._attrs)
        raise AttributeError(name)

    def item(self, index):
        """Return the attribute node at position index, or None."""
        try:
            return self[self._attrs.keys()[index]]
        except IndexError:
            return None

    def items(self):
        """Return a list of (nodeName, value) pairs."""
        L = []
        for node in self._attrs.values():
            L.append((node.nodeName, node.value))
        return L

    def itemsNS(self):
        """Return a list of ((namespaceURI, localName), value) pairs."""
        L = []
        for node in self._attrs.values():
            # Attr stores its namespace as namespaceURI; there is no URI
            # attribute, so the old node.URI lookup always failed.
            L.append(((node.namespaceURI, node.localName), node.value))
        return L

    def keys(self):
        return self._attrs.keys()

    def keysNS(self):
        return self._attrsNS.keys()

    def values(self):
        return self._attrs.values()

    def get(self, name, value = None):
        return self._attrs.get(name, value)

    def __len__(self):
        return len(self._attrs)

    def __cmp__(self, other):
        # Maps compare equal when they wrap the same attribute dictionary.
        if self._attrs is getattr(other, "_attrs", None):
            return 0
        else:
            return cmp(id(self), id(other))

    #FIXME: is it appropriate to return .value?
    def __getitem__(self, attname_or_tuple):
        """Look up by name, or by a (namespaceURI, localName) tuple."""
        if type(attname_or_tuple) is _TupleType:
            return self._attrsNS[attname_or_tuple]
        else:
            return self._attrs[attname_or_tuple]

    # same as set
    def __setitem__(self, attname, value):
        """Store value under attname.

        value is either a string or an Attr node (which is stored under
        its own name); anything else raises TypeError.
        """
        if type(value) in _StringTypes:
            node = Attr(attname)
            node.value = value
        else:
            if not isinstance(value, Attr):
                raise TypeError("value must be a string or Attr object")
            node = value
        self.setNamedItem(node)

    def setNamedItem(self, node):
        """Store the Attr node and return the node it replaced, if any.

        Raises HierarchyRequestErr when node is not an Attr.
        """
        if not isinstance(node, Attr):
            raise HierarchyRequestErr(
                "%s cannot be child of %s" % (repr(node), repr(self)))
        old = self._attrs.get(node.name)
        if old is not None and old is not node:
            # Forget the replaced node's namespace entry too (its key may
            # differ from the new node's), then release it.  Storing a
            # node that is already present must not unlink it.
            old_key = (old.namespaceURI, old.localName)
            if self._attrsNS.get(old_key) is old:
                del self._attrsNS[old_key]
            old.unlink()
        self._attrs[node.name] = node
        self._attrsNS[(node.namespaceURI, node.localName)] = node
        return old

    def setNamedItemNS(self, node):
        return self.setNamedItem(node)

    def __delitem__(self, attname_or_tuple):
        """Remove and unlink an attribute; KeyError when it is missing."""
        node = self[attname_or_tuple]
        node.unlink()
        del self._attrs[node.name]
        del self._attrsNS[(node.namespaceURI, node.localName)]
        # No "self.length = ..." here: a stored value would shadow the
        # computed attribute and go stale on the next mutation.

AttributeList = NamedNodeMap
449
Fred Drake1f549022000-09-24 05:21:58 +0000450
class Element(Node):
    """Element node with attributes indexed both by name and by
    (namespaceURI, localName)."""

    nodeType = Node.ELEMENT_NODE
    nextSibling = None
    previousSibling = None
    childNodeTypes = (Node.ELEMENT_NODE, Node.PROCESSING_INSTRUCTION_NODE,
                      Node.COMMENT_NODE, Node.TEXT_NODE,
                      Node.CDATA_SECTION_NODE, Node.ENTITY_REFERENCE_NODE)

    def __init__(self, tagName, namespaceURI=None, prefix="",
                 localName=None):
        Node.__init__(self)
        self.tagName = self.nodeName = tagName
        self.localName = localName or tagName
        self.prefix = prefix
        self.namespaceURI = namespaceURI
        self.nodeValue = None

        self._attrs = {}   # attributes are double-indexed:
        self._attrsNS = {} #    tagName -> Attribute
                           #    URI,localName -> Attribute
                           # in the future: consider lazy generation
                           # of attribute objects this is too tricky
                           # for now because of headaches with
                           # namespaces.

    def cloneNode(self, deep):
        """Clone the element; attribute nodes are always cloned too."""
        clone = Node.cloneNode(self, deep)
        clone._attrs = {}
        clone._attrsNS = {}
        for attr in self._attrs.values():
            node = attr.cloneNode(1)
            clone._attrs[node.name] = node
            clone._attrsNS[(node.namespaceURI, node.localName)] = node
            node.ownerElement = clone
        return clone

    def unlink(self):
        """Unlink the attributes, then the subtree; safe to call twice."""
        # _attrs is None once the element has been unlinked.
        if self._attrs is not None:
            for attr in self._attrs.values():
                attr.unlink()
        self._attrs = None
        self._attrsNS = None
        Node.unlink(self)

    def getAttribute(self, attname):
        """Return the named attribute's value, or "" when it is absent."""
        try:
            return self._attrs[attname].value
        except KeyError:
            return ""

    def getAttributeNS(self, namespaceURI, localName):
        """Namespace-aware getAttribute(); "" when the attribute is absent."""
        try:
            return self._attrsNS[(namespaceURI, localName)].value
        except KeyError:
            return ""

    def setAttribute(self, attname, value):
        attr = Attr(attname)
        # for performance
        attr.__dict__["value"] = attr.__dict__["nodeValue"] = value
        self.setAttributeNode(attr)

    def setAttributeNS(self, namespaceURI, qualifiedName, value):
        prefix, localname = _nssplit(qualifiedName)
        # for performance
        attr = Attr(qualifiedName, namespaceURI, localname, prefix)
        attr.__dict__["value"] = attr.__dict__["nodeValue"] = value
        self.setAttributeNode(attr)

    def getAttributeNode(self, attrname):
        return self._attrs.get(attrname)

    def getAttributeNodeNS(self, namespaceURI, localName):
        return self._attrsNS.get((namespaceURI, localName))

    def _dropAttrEntries(self, node):
        """Remove the index entries that refer to node; leave others alone."""
        if self._attrs.get(node.name) is node:
            del self._attrs[node.name]
        key = (node.namespaceURI, node.localName)
        if self._attrsNS.get(key) is node:
            del self._attrsNS[key]

    def setAttributeNode(self, attr):
        """Attach attr to this element.

        Returns the attribute node that was replaced, or None when there
        was none or when attr was already attached here.  Raises
        InuseAttributeErr when attr belongs to another element.
        """
        if attr.ownerElement not in (None, self):
            raise xml.dom.InuseAttributeErr("attribute node already owned")
        by_name = self._attrs.get(attr.name, None)
        by_ns = self._attrsNS.get((attr.namespaceURI, attr.localName), None)
        if by_ns is by_name:
            by_ns = None
        # Evict whatever the new node displaces in either index.  A node
        # that is attr itself is left alone: re-setting an attribute must
        # not unlink it.  Evicted nodes lose both index entries so no
        # stale reference to an unlinked node survives.
        for stale in (by_name, by_ns):
            if stale is not None and stale is not attr:
                self._dropAttrEntries(stale)
                stale.unlink()
        self._attrs[attr.name] = attr
        self._attrsNS[(attr.namespaceURI, attr.localName)] = attr

        # This creates a circular reference, but Element.unlink()
        # breaks the cycle since the references to the attribute
        # dictionaries are tossed.
        attr.ownerElement = self

        # It might have already been part of this node, in which case
        # it doesn't represent a change, and should not be returned.
        for replaced in (by_name, by_ns):
            if replaced is not None and replaced is not attr:
                return replaced
        return None

    setAttributeNodeNS = setAttributeNode

    def removeAttribute(self, name):
        """Remove the named attribute; KeyError when it does not exist."""
        attr = self._attrs[name]
        self.removeAttributeNode(attr)

    def removeAttributeNS(self, namespaceURI, localName):
        """Namespace-aware removeAttribute(); KeyError when missing."""
        attr = self._attrsNS[(namespaceURI, localName)]
        self.removeAttributeNode(attr)

    def removeAttributeNode(self, node):
        """Detach and unlink the attribute node.

        Raises KeyError when no attribute of that name exists and
        NotFoundErr when the name is taken by a different node.
        """
        # Validate before touching anything: unlinking first destroyed a
        # foreign node and then deleted this element's own attribute of
        # the same name.
        if self._attrs[node.name] is not node:
            raise xml.dom.NotFoundErr(
                "attribute node does not belong to this element")
        self._dropAttrEntries(node)
        node.unlink()

    removeAttributeNodeNS = removeAttributeNode

    def hasAttribute(self, name):
        return self._attrs.has_key(name)

    def hasAttributeNS(self, namespaceURI, localName):
        return self._attrsNS.has_key((namespaceURI, localName))

    def getElementsByTagName(self, name):
        return _getElementsByTagNameHelper(self, name, [])

    def getElementsByTagNameNS(self, namespaceURI, localName):
        return _getElementsByTagNameNSHelper(self, namespaceURI, localName, [])

    def __repr__(self):
        return "<DOM Element: %s at %s>" % (self.tagName, id(self))

    def writexml(self, writer, indent="", addindent="", newl=""):
        """Write the element, its attributes (sorted by name) and children.

        indent    -- current indentation
        addindent -- indentation to add to higher levels
        newl      -- newline string
        """
        writer.write(indent+"<" + self.tagName)

        attrs = self._get_attributes()
        a_names = attrs.keys()
        a_names.sort()

        for a_name in a_names:
            writer.write(" %s=\"" % a_name)
            _write_data(writer, attrs[a_name].value)
            writer.write("\"")
        if self.childNodes:
            writer.write(">%s"%(newl))
            for node in self.childNodes:
                node.writexml(writer,indent+addindent,addindent,newl)
            writer.write("%s</%s>%s" % (indent,self.tagName,newl))
        else:
            writer.write("/>%s"%(newl))

    def _get_attributes(self):
        return AttributeList(self._attrs, self._attrsNS)

    def hasAttributes(self):
        """Return 1 if the element has any attribute, otherwise 0."""
        if self._attrs or self._attrsNS:
            return 1
        else:
            return 0
606
class Comment(Node):
    """Comment node; the text is held in both data and nodeValue."""

    nodeType = Node.COMMENT_NODE
    nodeName = "#comment"
    attributes = None
    childNodeTypes = ()     # comments never have children

    def __init__(self, data):
        Node.__init__(self)
        self.data = data
        self.nodeValue = data

    def writexml(self, writer, indent="", addindent="", newl=""):
        # addindent is unused: there are no children to indent.
        markup = "%s<!--%s-->%s" % (indent, self.data, newl)
        writer.write(markup)
Fred Drake1f549022000-09-24 05:21:58 +0000619
class ProcessingInstruction(Node):
    """Processing instruction; target doubles as nodeName and data as
    nodeValue."""

    nodeType = Node.PROCESSING_INSTRUCTION_NODE
    attributes = None
    childNodeTypes = ()     # processing instructions never have children

    def __init__(self, target, data):
        Node.__init__(self)
        self.target = target
        self.nodeName = target
        self.data = data
        self.nodeValue = data

    def writexml(self, writer, indent="", addindent="", newl=""):
        # addindent is unused: there are no children to indent.
        markup = "%s<?%s %s?>%s" % (indent, self.target, self.data, newl)
        writer.write(markup)
Fred Drake55c38192000-06-29 19:39:57 +0000632
class CharacterData(Node):
    """Base class for nodes whose content is a single string.

    The text lives in ``data``; ``nodeValue`` and ``length`` are plain
    attributes that every mutating method refreshes so that they stay in
    step with ``data``.
    """

    def __init__(self, data):
        """Create the node with initial text *data*.

        Raises TypeError if the type of *data* is not one of the string
        types listed in ``_StringTypes``.
        """
        if type(data) not in _StringTypes:
            raise TypeError("node contents must be a string")
        Node.__init__(self)
        self.data = self.nodeValue = data
        self.length = len(data)

    def __repr__(self):
        # Show at most the first ten characters, with an ellipsis when the
        # text was cut short.
        if len(self.data) > 10:
            dotdotdot = "..."
        else:
            dotdotdot = ""
        return "<DOM %s node \"%s%s\">" % (
            self.__class__.__name__, self.data[0:10], dotdotdot)

    # internal
    def _store(self, data):
        # Single place that keeps data, nodeValue and length consistent.
        self.data = self.nodeValue = data
        self.length = len(data)

    # internal
    def _check_offset(self, offset):
        # An offset equal to the length is legal (it addresses the end of
        # the data); only negative or past-the-end offsets are rejected.
        if offset < 0:
            raise xml.dom.IndexSizeErr("offset cannot be negative")
        if offset > len(self.data):
            raise xml.dom.IndexSizeErr("offset cannot be beyond end of data")

    # internal
    def _check_count(self, count):
        if count < 0:
            raise xml.dom.IndexSizeErr("count cannot be negative")

    def substringData(self, offset, count):
        """Return up to *count* characters of the data starting at *offset*.

        Raises xml.dom.IndexSizeErr if *offset* is negative or beyond the
        end of the data, or if *count* is negative.
        """
        self._check_offset(offset)
        self._check_count(count)
        return self.data[offset:offset+count]

    def appendData(self, arg):
        """Append *arg* to the end of the data."""
        self._store(self.data + arg)

    def insertData(self, offset, arg):
        """Insert *arg* into the data at position *offset*.

        Raises xml.dom.IndexSizeErr if *offset* is negative or beyond the
        end of the data.  A false *arg* leaves the data untouched.
        """
        self._check_offset(offset)
        if arg:
            self._store("%s%s%s" % (
                self.data[:offset], arg, self.data[offset:]))

    def deleteData(self, offset, count):
        """Remove *count* characters of the data starting at *offset*.

        Raises xml.dom.IndexSizeErr if *offset* is negative or beyond the
        end of the data, or if *count* is negative.
        """
        self._check_offset(offset)
        self._check_count(count)
        if count:
            self._store(self.data[:offset] + self.data[offset+count:])

    def replaceData(self, offset, count, arg):
        """Replace *count* characters starting at *offset* with *arg*.

        Raises xml.dom.IndexSizeErr if *offset* is negative or beyond the
        end of the data, or if *count* is negative.
        """
        self._check_offset(offset)
        self._check_count(count)
        # A zero count still has to splice arg in: replacing nothing with
        # arg is an insertion, not a no-op.
        self._store("%s%s%s" % (
            self.data[:offset], arg, self.data[offset+count:]))
Fred Drake87432f42001-04-04 14:09:46 +0000698
class Text(CharacterData):
    """A text node."""
    nodeType = Node.TEXT_NODE
    nodeName = "#text"
    attributes = None
    childNodeTypes = ()

    def splitText(self, offset):
        """Split this node in two at *offset* and return the new node.

        This node keeps the text before *offset*; the returned node holds
        the rest.  When this node is listed among its parent's children,
        the new node is placed in the parent right after it.

        Raises xml.dom.IndexSizeErr if *offset* is negative or greater
        than the length of the data.
        """
        if offset < 0 or offset > len(self.data):
            raise xml.dom.IndexSizeErr("illegal offset value")
        # Build a node of the same class so that splitting a subclass
        # instance (e.g. a CDATA section) does not yield a plain Text.
        newText = self.__class__(self.data[offset:])
        # The new half belongs to the same document as the original.
        newText.ownerDocument = getattr(self, "ownerDocument", None)
        next = self.nextSibling
        if self.parentNode and self in self.parentNode.childNodes:
            if next is None:
                self.parentNode.appendChild(newText)
            else:
                self.parentNode.insertBefore(newText, next)
        self.data = self.data[:offset]
        self.nodeValue = self.data
        self.length = len(self.data)
        return newText

    def writexml(self, writer, indent="", addindent="", newl=""):
        """Write the text, wrapped in *indent* and *newl*, via _write_data.

        *addindent* is accepted but not used here.
        """
        _write_data(writer, "%s%s%s"%(indent, self.data, newl))
Fred Drake55c38192000-06-29 19:39:57 +0000722
Fred Drake87432f42001-04-04 14:09:46 +0000723
class CDATASection(Text):
    """A CDATA section node."""
    nodeType = Node.CDATA_SECTION_NODE
    nodeName = "#cdata-section"

    def writexml(self, writer, indent="", addindent="", newl=""):
        """Write the data wrapped in CDATA markers to *writer*.

        *indent*, *addindent* and *newl* are accepted but not used here.
        """
        section = "<![CDATA[%s]]>" % self.data
        writer.write(section)
Fred Drake87432f42001-04-04 14:09:46 +0000730
731
def _nssplit(qualifiedName):
    """Split a qualified name into a ``(prefix, localName)`` tuple.

    The split happens at the first colon only.  A name without a colon
    yields an empty-string prefix.
    """
    fields = qualifiedName.split(':', 1)
    if len(fields) == 2:
        # Always hand back a tuple so both branches return the same type.
        return tuple(fields)
    return ('', fields[0])
Paul Prescod73678da2000-07-01 04:58:47 +0000738
Fred Drakef7cf40d2000-12-14 18:16:11 +0000739
class DocumentType(Node):
    """A document type node.

    Every descriptive attribute defaults to None at class level; only
    ``name`` is filled in by the constructor.
    """
    nodeType = Node.DOCUMENT_TYPE_NODE
    nodeValue = None
    attributes = None
    name = None
    publicId = None
    systemId = None
    internalSubset = None
    entities = None
    notations = None

    def __init__(self, qualifiedName):
        """Create the node; a non-empty *qualifiedName* sets ``name``.

        ``name`` receives the local part of *qualifiedName* as computed
        by _nssplit (the prefix is discarded).
        """
        Node.__init__(self)
        if not qualifiedName:
            return
        name_parts = _nssplit(qualifiedName)
        self.name = name_parts[1]
756
757
class DOMImplementation:
    """Factory for documents and document types."""

    def hasFeature(self, feature, version):
        """Return a true value if *feature* at *version* is supported.

        Only the "core" feature is recognized (compared without regard to
        case), in versions "1.0" and "2.0".  A *version* of None or ""
        means "any version" and therefore matches as well.
        """
        if version not in (None, "", "1.0", "2.0"):
            return 0
        return feature.lower() == "core"

    def createDocument(self, namespaceURI, qualifiedName, doctype):
        """Create a document whose root element is *qualifiedName*.

        When *doctype* is None a fresh document type is created from
        *qualifiedName*.  The document type is linked to the new document
        through its ``parentNode`` and ``ownerDocument`` attributes.

        Raises xml.dom.WrongDocumentErr if *doctype* already has a parent,
        xml.dom.InvalidCharacterErr if *qualifiedName* is empty, and
        xml.dom.NamespaceErr for an "xml" prefix with the wrong namespace
        or for a prefix given without a namespace.
        """
        if doctype and doctype.parentNode is not None:
            raise xml.dom.WrongDocumentErr(
                "doctype object owned by another DOM tree")
        doc = self._createDocument()
        if doctype is None:
            doctype = self.createDocumentType(qualifiedName, None, None)
        if not qualifiedName:
            # The spec is unclear what to raise here; SyntaxErr
            # would be the other obvious candidate. Since Xerces raises
            # InvalidCharacterErr, and since SyntaxErr is not listed
            # for createDocument, that seems to be the better choice.
            # XXX: need to check for illegal characters here and in
            # createElement.
            raise xml.dom.InvalidCharacterErr("Element with no name")
        prefix, localname = _nssplit(qualifiedName)
        if (prefix == "xml"
                and namespaceURI != "http://www.w3.org/XML/1998/namespace"):
            raise xml.dom.NamespaceErr("illegal use of 'xml' prefix")
        if prefix and not namespaceURI:
            raise xml.dom.NamespaceErr(
                "illegal use of prefix without namespaces")
        element = doc.createElementNS(namespaceURI, qualifiedName)
        doc.appendChild(element)
        doctype.parentNode = doctype.ownerDocument = doc
        doc.doctype = doctype
        doc.implementation = self
        return doc

    def createDocumentType(self, qualifiedName, publicId, systemId):
        """Create a DocumentType and record its public and system ids."""
        doctype = DocumentType(qualifiedName)
        doctype.publicId = publicId
        doctype.systemId = systemId
        return doctype

    # internal
    def _createDocument(self):
        # Separate hook so the concrete document object comes from one place.
        return Document()
Fred Drakef7cf40d2000-12-14 18:16:11 +0000803
class Document(Node):
    """The document node: root of the tree and factory for its nodes.

    Each ``create*`` method builds a node and records this document as
    the node's ``ownerDocument``.
    """
    nodeType = Node.DOCUMENT_NODE
    nodeName = "#document"
    nodeValue = None
    attributes = None
    doctype = None
    parentNode = None
    previousSibling = nextSibling = None

    implementation = DOMImplementation()
    childNodeTypes = (Node.ELEMENT_NODE, Node.PROCESSING_INSTRUCTION_NODE,
                      Node.COMMENT_NODE, Node.DOCUMENT_TYPE_NODE)

    def appendChild(self, node):
        """Append *node* as a child of the document and return the result
        of Node.appendChild.

        Raises HierarchyRequestErr if the node type is not allowed under a
        document, or if *node* is an element and the document already has
        a document element.
        """
        if node.nodeType not in self.childNodeTypes:
            raise HierarchyRequestErr(
                "%s cannot be child of %s" % (repr(node), repr(self)))
        if node.parentNode is not None:
            # Detach from the previous parent first; a node that is being
            # re-appended to this document is thereby removed before the
            # document-element check below runs.
            node.parentNode.removeChild(node)

        if (node.nodeType == Node.ELEMENT_NODE
                and self._get_documentElement()):
            raise xml.dom.HierarchyRequestErr(
                "two document elements disallowed")
        return Node.appendChild(self, node)

    def removeChild(self, oldChild):
        """Remove *oldChild* from the document's children and return it.

        The removed node's parent and sibling links are reset to None.
        """
        self.childNodes.remove(oldChild)
        oldChild.nextSibling = oldChild.previousSibling = None
        oldChild.parentNode = None
        # NOTE(review): how ``documentElement`` is resolved is not visible
        # in this part of the file -- confirm this branch is reachable.
        if self.documentElement is oldChild:
            self.documentElement = None

        return oldChild

    def _get_documentElement(self):
        # The first element child, or None (implicitly) when there is none.
        for node in self.childNodes:
            if node.nodeType == Node.ELEMENT_NODE:
                return node

    def unlink(self):
        """Unlink the document type, if any, then the document itself."""
        if self.doctype is not None:
            self.doctype.unlink()
            self.doctype = None
        Node.unlink(self)

    def createDocumentFragment(self):
        """Create a DocumentFragment owned by this document."""
        d = DocumentFragment()
        d.ownerDocument = self
        return d

    def createElement(self, tagName):
        """Create an Element named *tagName* owned by this document."""
        e = Element(tagName)
        e.ownerDocument = self
        return e

    def createTextNode(self, data):
        """Create a Text node holding *data* owned by this document."""
        t = Text(data)
        t.ownerDocument = self
        return t

    def createCDATASection(self, data):
        """Create a CDATASection holding *data* owned by this document."""
        c = CDATASection(data)
        c.ownerDocument = self
        return c

    def createComment(self, data):
        """Create a Comment holding *data* owned by this document."""
        c = Comment(data)
        c.ownerDocument = self
        return c

    def createProcessingInstruction(self, target, data):
        """Create a ProcessingInstruction owned by this document."""
        p = ProcessingInstruction(target, data)
        p.ownerDocument = self
        return p

    def createAttribute(self, qName):
        """Create an Attr named *qName* with an empty value."""
        a = Attr(qName)
        a.ownerDocument = self
        a.value = ""
        return a

    def createElementNS(self, namespaceURI, qualifiedName):
        """Create a namespaced Element owned by this document."""
        prefix, localName = _nssplit(qualifiedName)
        e = Element(qualifiedName, namespaceURI, prefix, localName)
        e.ownerDocument = self
        return e

    def createAttributeNS(self, namespaceURI, qualifiedName):
        """Create a namespaced Attr with an empty value."""
        prefix, localName = _nssplit(qualifiedName)
        a = Attr(qualifiedName, namespaceURI, localName, prefix)
        a.ownerDocument = self
        a.value = ""
        return a

    def getElementsByTagName(self, name):
        """Collect matches for *name* via _getElementsByTagNameHelper."""
        return _getElementsByTagNameHelper(self, name, NodeList())

    def getElementsByTagNameNS(self, namespaceURI, localName):
        """Collect matches via _getElementsByTagNameNSHelper."""
        return _getElementsByTagNameNSHelper(self, namespaceURI, localName,
                                             NodeList())

    def writexml(self, writer, indent="", addindent="", newl=""):
        """Write the XML declaration, then each child node, to *writer*.

        The declaration line always ends with "\\n"; the formatting
        arguments are passed through to the children unchanged.
        """
        writer.write('<?xml version="1.0" ?>\n')
        for node in self.childNodes:
            node.writexml(writer, indent, addindent, newl)
Fred Drake55c38192000-06-29 19:39:57 +0000909
def _get_StringIO():
    """Return a new, empty in-memory text buffer."""
    # we can't use cStringIO since it doesn't support Unicode strings
    try:
        from StringIO import StringIO
    except ImportError:
        # No StringIO module on this interpreter; io provides the class.
        from io import StringIO
    return StringIO()
914
def _doparse(func, args, kwargs):
    """Run a pulldom-style parser and return the expanded root node.

    *func* is called with the positional *args* and keyword *kwargs* and
    must return an event stream.  The node of the stream's first event is
    expanded and returned.  The stream's clear() is called in every case,
    including when reading or expanding raises.
    """
    events = func(*args, **kwargs)
    try:
        toktype, rootNode = events.getEvent()
        events.expandNode(rootNode)
    finally:
        events.clear()
    return rootNode
921
def parse(*args, **kwargs):
    """Parse a file into a DOM by filename or file object."""
    # Imported here rather than at module level, as in the original.
    from xml.dom.pulldom import parse as pull_parse
    return _doparse(pull_parse, args, kwargs)
Fred Drake55c38192000-06-29 19:39:57 +0000926
def parseString(*args, **kwargs):
    """Parse a file into a DOM from a string."""
    # Imported here rather than at module level, as in the original.
    from xml.dom.pulldom import parseString as pull_parse_string
    return _doparse(pull_parse_string, args, kwargs)
Martin v. Löwis7edbd4f2001-02-22 14:05:50 +0000931
def getDOMImplementation():
    """Return the implementation object stored on the Document class."""
    implementation = Document.implementation
    return implementation