blob: 2e9d866e3190c6d4fc2ce28a678b3d125f258877 [file] [log] [blame]
Fred Drake1f549022000-09-24 05:21:58 +00001"""\
Fred Drakef7cf40d2000-12-14 18:16:11 +00002minidom.py -- a lightweight DOM implementation.
Fred Drake55c38192000-06-29 19:39:57 +00003
Guido van Rossum9e1fe1e2001-02-05 19:17:50 +00004parse("foo.xml")
Paul Prescod623511b2000-07-21 22:05:49 +00005
Guido van Rossum9e1fe1e2001-02-05 19:17:50 +00006parseString("<foo><bar/></foo>")
Paul Prescod623511b2000-07-21 22:05:49 +00007
Fred Drake55c38192000-06-29 19:39:57 +00008Todo:
9=====
10 * convenience methods for getting elements and text.
11 * more testing
12 * bring some of the writer and linearizer code into conformance with this
13 interface
14 * SAX 2 namespaces
15"""
16
Fred Drake1f549022000-09-24 05:21:58 +000017import string
Fred Drake4ccf4a12000-11-21 22:02:22 +000018_string = string
19del string
20
Fred Drake49a5d032001-11-30 22:21:58 +000021from xml.dom import HierarchyRequestErr, EMPTY_NAMESPACE
Andrew M. Kuchling291ed4f2000-12-31 03:50:23 +000022
# localize the types, and allow support for Unicode values if available:
import types
# The exact tuple type, kept under a private module-level name.
_TupleType = types.TupleType
try:
    # Both string types are accepted when the types module has UnicodeType.
    _StringTypes = (types.StringType, types.UnicodeType)
except AttributeError:
    # types has no UnicodeType attribute: only plain strings are accepted.
    _StringTypes = (types.StringType,)
# The module itself is not needed once the types have been captured.
del types
31
Fred Drakef7cf40d2000-12-14 18:16:11 +000032import xml.dom
Fred Drake55c38192000-06-29 19:39:57 +000033
Fred Drake3ac6a092001-09-28 04:33:06 +000034
if list is not type([]):
    # The builtin ``list`` is not the list type here, so it cannot be
    # subclassed; hand out plain lists instead.
    def NodeList():
        """Return a new empty list to hold child nodes."""
        return []

else:
    class NodeList(list):
        """A list of nodes that also offers item() and length."""

        length = property(lambda self: len(self),
                          doc="The number of nodes in the NodeList.")

        def item(self, index):
            """Return the node at index, or None when index is out of range.

            Negative indexes are treated as out of range.
            """
            if index < 0 or index >= len(self):
                return None
            return self[index]
47
48
class Node(xml.dom.Node):
    """Common behaviour shared by the node classes in this module.

    A node keeps its children in ``childNodes`` and the tree-editing
    methods (insertBefore, appendChild, replaceChild, removeChild) keep the
    ``previousSibling`` / ``nextSibling`` links, and ``parentNode`` when
    ``_makeParentNodes`` is true, up to date.  Subclasses list the node
    types they accept as children in ``childNodeTypes``.
    """
    # Debug registry filled by __init__ while _debug is on; maps
    # repr(id(node)) + repr(class) to the repr of the instance dict.
    allnodes = {}
    _debug = 0
    # When true, the tree-editing methods maintain child.parentNode.
    _makeParentNodes = 1
    # Stream that receives the debug messages; created on first use.
    debug = None
    # Node types accepted as children; the empty tuple accepts none.
    childNodeTypes = ()
    namespaceURI = None # this is non-null only for elements and attributes
    parentNode = None
    ownerDocument = None

    def __init__(self):
        """Give the node an empty child list (and register it when debugging)."""
        self.childNodes = NodeList()
        if Node._debug:
            index = repr(id(self)) + repr(self.__class__)
            Node.allnodes[index] = repr(self.__dict__)
            if Node.debug is None:
                Node.debug = _get_StringIO()
                #open("debug4.out", "w")
            Node.debug.write("create %s\n" % index)

    def __nonzero__(self):
        # A node is always true, whatever else the class defines.
        return 1

    def toxml(self):
        """Return what writexml() writes for this node, as a string."""
        writer = _get_StringIO()
        self.writexml(writer)
        return writer.getvalue()

    def toprettyxml(self, indent="\t", newl="\n"):
        """Return the node serialized with indentation and newlines."""
        # indent = the indentation string to prepend, per level
        # newl = the newline string to append
        writer = _get_StringIO()
        self.writexml(writer, "", indent, newl)
        return writer.getvalue()

    def hasChildNodes(self):
        """Return 1 if the node has at least one child, otherwise 0."""
        if self.childNodes:
            return 1
        else:
            return 0

    def _get_firstChild(self):
        # Falls through to an implicit None when there are no children.
        if self.childNodes:
            return self.childNodes[0]

    def _get_lastChild(self):
        # Falls through to an implicit None when there are no children.
        if self.childNodes:
            return self.childNodes[-1]

    try:
        property
    except NameError:
        # No ``property`` builtin: emulate computed attributes by routing
        # ``node.x`` to ``node._get_x()`` and ``node._get_x`` to a function
        # returning ``node.x``.  The ``inGetAttr`` marker stops the two
        # lookups from calling each other forever.
        def __getattr__(self, key):
            if key[0:2] == "__":
                raise AttributeError(key)
            # getattr should never call getattr!
            if self.__dict__.has_key("inGetAttr"):
                del self.inGetAttr
                raise AttributeError(key)

            prefix, attrname = key[:5], key[5:]
            if prefix == "_get_":
                self.inGetAttr = 1
                if hasattr(self, attrname):
                    del self.inGetAttr
                    return (lambda self=self, attrname=attrname:
                                    getattr(self, attrname))
                else:
                    del self.inGetAttr
                    raise AttributeError(key)
            else:
                self.inGetAttr = 1
                try:
                    func = getattr(self, "_get_" + key)
                except AttributeError:
                    raise AttributeError(key)
                del self.inGetAttr
                return func()
    else:
        firstChild = property(_get_firstChild,
                              doc="First child node, or None.")
        lastChild = property(_get_lastChild,
                             doc="Last child node, or None.")

    def insertBefore(self, newChild, refChild):
        """Insert newChild in front of refChild and return newChild.

        A document fragment contributes its children instead of itself.
        When refChild is None the node is appended.  newChild is first
        removed from its current parent, if it has one.  Raises
        HierarchyRequestErr when newChild's type is not in childNodeTypes.
        """
        if newChild.nodeType == self.DOCUMENT_FRAGMENT_NODE:
            # Iterate over a copy: each insert removes the child from the
            # fragment's own child list.
            for c in tuple(newChild.childNodes):
                self.insertBefore(c, refChild)
            ### The DOM does not clearly specify what to return in this case
            return newChild
        if newChild.nodeType not in self.childNodeTypes:
            raise HierarchyRequestErr(
                "%s cannot be child of %s" % (repr(newChild), repr(self)))
        if newChild.parentNode is not None:
            newChild.parentNode.removeChild(newChild)
        if refChild is None:
            self.appendChild(newChild)
        else:
            index = self.childNodes.index(refChild)
            self.childNodes.insert(index, newChild)
            newChild.nextSibling = refChild
            refChild.previousSibling = newChild
            if index:
                node = self.childNodes[index-1]
                node.nextSibling = newChild
                newChild.previousSibling = node
            else:
                newChild.previousSibling = None
            if self._makeParentNodes:
                newChild.parentNode = self
        return newChild

    def appendChild(self, node):
        """Add node as the last child and return it.

        A document fragment contributes its children instead of itself.
        node is first removed from its current parent, if it has one.
        Raises HierarchyRequestErr when node's type is not in
        childNodeTypes.
        """
        if node.nodeType == self.DOCUMENT_FRAGMENT_NODE:
            # Iterate over a copy: each append removes the child from the
            # fragment's own child list.
            for c in tuple(node.childNodes):
                self.appendChild(c)
            ### The DOM does not clearly specify what to return in this case
            return node
        if node.nodeType not in self.childNodeTypes:
            raise HierarchyRequestErr(
                "%s cannot be child of %s" % (repr(node), repr(self)))
        if node.parentNode is not None:
            node.parentNode.removeChild(node)
        if self.childNodes:
            last = self.lastChild
            node.previousSibling = last
            last.nextSibling = node
        else:
            node.previousSibling = None
        node.nextSibling = None
        self.childNodes.append(node)
        if self._makeParentNodes:
            node.parentNode = self
        return node

    def replaceChild(self, newChild, oldChild):
        """Put newChild in oldChild's place and return oldChild.

        Replacing a child with itself changes nothing and returns None.
        When newChild is a document fragment, oldChild is removed, the
        fragment's children are inserted at its position, and the result
        of insertBefore() is returned.  Raises HierarchyRequestErr when
        newChild's type is not in childNodeTypes.
        """
        if newChild.nodeType == self.DOCUMENT_FRAGMENT_NODE:
            refChild = oldChild.nextSibling
            self.removeChild(oldChild)
            return self.insertBefore(newChild, refChild)
        if newChild.nodeType not in self.childNodeTypes:
            raise HierarchyRequestErr(
                "%s cannot be child of %s" % (repr(newChild), repr(self)))
        # This check has to come before newChild is detached from its
        # parent; otherwise replacing a child with itself would drop it
        # from the tree.
        if newChild is oldChild:
            return
        if newChild.parentNode is not None:
            newChild.parentNode.removeChild(newChild)
        index = self.childNodes.index(oldChild)
        self.childNodes[index] = newChild
        if self._makeParentNodes:
            newChild.parentNode = self
            oldChild.parentNode = None
        newChild.nextSibling = oldChild.nextSibling
        newChild.previousSibling = oldChild.previousSibling
        oldChild.nextSibling = None
        oldChild.previousSibling = None
        if newChild.previousSibling:
            newChild.previousSibling.nextSibling = newChild
        if newChild.nextSibling:
            newChild.nextSibling.previousSibling = newChild
        return oldChild

    def removeChild(self, oldChild):
        """Detach oldChild from this node and return it.

        list.remove() raises ValueError when oldChild is not a child.
        """
        self.childNodes.remove(oldChild)
        if oldChild.nextSibling is not None:
            oldChild.nextSibling.previousSibling = oldChild.previousSibling
        if oldChild.previousSibling is not None:
            oldChild.previousSibling.nextSibling = oldChild.nextSibling
        oldChild.nextSibling = oldChild.previousSibling = None

        if self._makeParentNodes:
            oldChild.parentNode = None
        return oldChild

    def normalize(self):
        """Merge adjacent text nodes and drop empty ones, recursively.

        Text children with empty data are unlinked and discarded; a text
        child following another text child is folded into it.  Element
        children are normalized in turn.
        """
        L = []
        for child in self.childNodes:
            if child.nodeType == Node.TEXT_NODE:
                data = child.data
                if data and L and L[-1].nodeType == child.nodeType:
                    # collapse text node
                    node = L[-1]
                    node.data = node.nodeValue = node.data + child.data
                    node.nextSibling = child.nextSibling
                    child.unlink()
                elif data:
                    if L:
                        L[-1].nextSibling = child
                        child.previousSibling = L[-1]
                    else:
                        child.previousSibling = None
                    L.append(child)
                else:
                    # empty text node; discard
                    child.unlink()
            else:
                if L:
                    L[-1].nextSibling = child
                    child.previousSibling = L[-1]
                else:
                    child.previousSibling = None
                L.append(child)
                if child.nodeType == Node.ELEMENT_NODE:
                    child.normalize()
        if L:
            # Empty text nodes discarded at the end of the list are never
            # relinked around, so terminate the sibling chain explicitly.
            L[-1].nextSibling = None
        self.childNodes[:] = L

    def cloneNode(self, deep):
        """Return a copy of this node that belongs to no tree.

        The copy starts from a shallow copy of the instance dictionary and
        gets a fresh child list; with a true ``deep`` the children are
        cloned recursively and appended to it.
        """
        import new
        clone = new.instance(self.__class__, self.__dict__.copy())
        if self._makeParentNodes:
            clone.parentNode = None
        # The copied dictionary still names the original's siblings, but
        # the clone has no parent and therefore no siblings.
        clone.previousSibling = None
        clone.nextSibling = None
        clone.childNodes = NodeList()
        if deep:
            for child in self.childNodes:
                clone.appendChild(child.cloneNode(1))
        return clone

    # DOM Level 3 (Working Draft 2001-Jan-26)

    def isSameNode(self, other):
        """Return true when other is this very object."""
        return self is other

    # minidom-specific API:

    def unlink(self):
        """Drop the references that tie this subtree together.

        Clears the parent, owner-document and sibling links, unlinks every
        child, and sets ``childNodes`` to None.  Calling it again on an
        already unlinked node does nothing further.
        """
        self.parentNode = self.ownerDocument = None
        # childNodes is None after a previous unlink(); there is nothing
        # left to walk in that case.
        if self.childNodes:
            for child in self.childNodes:
                child.unlink()
        self.childNodes = None
        self.previousSibling = None
        self.nextSibling = None
        if Node._debug:
            index = repr(id(self)) + repr(self.__class__)
            self.debug.write("Deleting: %s\n" % index)
            try:
                del Node.allnodes[index]
            except KeyError:
                # Entry already removed by an earlier unlink() of this node.
                pass
Fred Drake55c38192000-06-29 19:39:57 +0000284
Fred Drake1f549022000-09-24 05:21:58 +0000285def _write_data(writer, data):
Fred Drake55c38192000-06-29 19:39:57 +0000286 "Writes datachars to writer."
Fred Drake4ccf4a12000-11-21 22:02:22 +0000287 replace = _string.replace
288 data = replace(data, "&", "&amp;")
289 data = replace(data, "<", "&lt;")
290 data = replace(data, "\"", "&quot;")
291 data = replace(data, ">", "&gt;")
Fred Drake55c38192000-06-29 19:39:57 +0000292 writer.write(data)
293
Fred Drake1f549022000-09-24 05:21:58 +0000294def _getElementsByTagNameHelper(parent, name, rc):
Fred Drake55c38192000-06-29 19:39:57 +0000295 for node in parent.childNodes:
Fred Drake1f549022000-09-24 05:21:58 +0000296 if node.nodeType == Node.ELEMENT_NODE and \
297 (name == "*" or node.tagName == name):
298 rc.append(node)
299 _getElementsByTagNameHelper(node, name, rc)
Fred Drake55c38192000-06-29 19:39:57 +0000300 return rc
301
Fred Drake1f549022000-09-24 05:21:58 +0000302def _getElementsByTagNameNSHelper(parent, nsURI, localName, rc):
Fred Drake55c38192000-06-29 19:39:57 +0000303 for node in parent.childNodes:
Fred Drake1f549022000-09-24 05:21:58 +0000304 if node.nodeType == Node.ELEMENT_NODE:
Martin v. Löwised525fb2001-06-03 14:06:42 +0000305 if ((localName == "*" or node.localName == localName) and
Fred Drake1f549022000-09-24 05:21:58 +0000306 (nsURI == "*" or node.namespaceURI == nsURI)):
307 rc.append(node)
Fred Drakef7cf40d2000-12-14 18:16:11 +0000308 _getElementsByTagNameNSHelper(node, nsURI, localName, rc)
309 return rc
Fred Drake55c38192000-06-29 19:39:57 +0000310
class DocumentFragment(Node):
    """Container node whose children are moved into the tree in its place.

    Node.insertBefore() and Node.appendChild() insert a fragment's
    children rather than the fragment itself.
    """
    nodeName = "#document-fragment"
    nodeType = Node.DOCUMENT_FRAGMENT_NODE
    # A fragment has no value, no attributes and no parent.
    nodeValue = None
    attributes = None
    parentNode = None
    # Node types a fragment accepts as children.
    childNodeTypes = (
        Node.ELEMENT_NODE,
        Node.TEXT_NODE,
        Node.CDATA_SECTION_NODE,
        Node.ENTITY_REFERENCE_NODE,
        Node.PROCESSING_INSTRUCTION_NODE,
        Node.COMMENT_NODE,
        Node.NOTATION_NODE,
    )
324
325
class Attr(Node):
    """Attribute node.

    ``name`` and ``nodeName`` always hold the same object, as do ``value``
    and ``nodeValue``: assigning to either member of a pair updates both.
    """
    nodeType = Node.ATTRIBUTE_NODE
    attributes = None
    ownerElement = None
    childNodeTypes = (Node.TEXT_NODE, Node.ENTITY_REFERENCE_NODE)

    def __init__(self, qName, namespaceURI=EMPTY_NAMESPACE, localName=None, prefix=None):
        """Create an attribute called qName.

        localName falls back to qName when it is not given (or is false).
        """
        # Fill the instance dictionary directly; going through
        # __setattr__ for each field would be slower.
        self.__dict__.update({
            "localName": localName or qName,
            "nodeName": qName,
            "name": qName,
            "namespaceURI": namespaceURI,
            "prefix": prefix,
        })
        Node.__init__(self)
        # nodeValue and value are set elsewhere

    def __setattr__(self, name, value):
        """Store value under name, keeping the aliased pairs in step."""
        fields = self.__dict__
        if name == "value" or name == "nodeValue":
            fields["value"] = value
            fields["nodeValue"] = value
        elif name == "name" or name == "nodeName":
            fields["name"] = value
            fields["nodeName"] = value
        else:
            fields[name] = value

    def cloneNode(self, deep):
        """Return a copy of the attribute that has no owner element."""
        clone = Node.cloneNode(self, deep)
        # The copied instance dictionary may carry the original's owner;
        # removing the entry lets the class default (None) show through.
        try:
            del clone.__dict__["ownerElement"]
        except KeyError:
            pass
        return clone
356
Fred Drakef7cf40d2000-12-14 18:16:11 +0000357
class NamedNodeMap:
    """The attribute list is a transient interface to the underlying
    dictionaries.  Mutations here will change the underlying element's
    dictionary.

    Ordering is imposed artificially and does not reflect the order of
    attributes as found in an input document.
    """

    def __init__(self, attrs, attrsNS):
        """Wrap the two attribute dictionaries without copying them.

        attrs is keyed by attribute name, attrsNS by
        (namespaceURI, localName); both map to the attribute nodes.
        """
        self._attrs = attrs
        self._attrsNS = attrsNS

    try:
        property
    except NameError:
        # No ``property`` builtin: compute ``length`` on attribute lookup.
        def __getattr__(self, name):
            if name == "length":
                return len(self._attrs)
            raise AttributeError(name)
    else:
        length = property(lambda self: len(self._attrs),
                          doc="Number of nodes in the NamedNodeMap.")

    def item(self, index):
        """Return the index-th attribute node, or None when out of range.

        Negative indexes count as out of range, as in NodeList.item().
        """
        names = list(self._attrs.keys())
        if 0 <= index < len(names):
            return self[names[index]]
        return None

    def items(self):
        """Return a list of (nodeName, value) pairs."""
        L = []
        for node in self._attrs.values():
            L.append((node.nodeName, node.value))
        return L

    def itemsNS(self):
        """Return a list of ((namespaceURI, localName), value) pairs."""
        L = []
        for node in self._attrs.values():
            L.append(((node.namespaceURI, node.localName), node.value))
        return L

    def keys(self):
        """Return the attribute names."""
        return self._attrs.keys()

    def keysNS(self):
        """Return the (namespaceURI, localName) keys."""
        return self._attrsNS.keys()

    def values(self):
        """Return the attribute nodes."""
        return self._attrs.values()

    def get(self, name, value = None):
        """Return the attribute node called name, or value if there is none."""
        return self._attrs.get(name, value)

    def __len__(self):
        return self.length

    def __cmp__(self, other):
        # Two maps are equal when they wrap the very same name dictionary.
        if self._attrs is getattr(other, "_attrs", None):
            return 0
        else:
            return cmp(id(self), id(other))

    #FIXME: is it appropriate to return .value?
    def __getitem__(self, attname_or_tuple):
        """Look up a node by name, or by a (namespaceURI, localName) tuple."""
        # Exact type test: only a real tuple selects the namespace index.
        if type(attname_or_tuple) is type(()):
            return self._attrsNS[attname_or_tuple]
        else:
            return self._attrs[attname_or_tuple]

    # same as set
    def __setitem__(self, attname, value):
        """Set attribute attname from a string or an Attr node.

        Raises TypeError for any other kind of value.
        """
        if type(value) in _StringTypes:
            node = Attr(attname)
            node.value = value
        else:
            if not isinstance(value, Attr):
                raise TypeError("value must be a string or Attr object")
            node = value
        self.setNamedItem(node)

    def setNamedItem(self, node):
        """Store node in both indexes and return the node it replaced.

        An existing attribute with the same name, or with the same
        (namespaceURI, localName) key, is unlinked and removed from both
        indexes.  Returns the attribute previously stored under the
        node's name (node itself if it was already there), otherwise the
        one displaced from the namespace index, otherwise None.  Raises
        HierarchyRequestErr when node is not an Attr.
        """
        if not isinstance(node, Attr):
            raise HierarchyRequestErr(
                "%s cannot be child of %s" % (repr(node), repr(self)))
        ns_key = (node.namespaceURI, node.localName)
        old = self._attrs.get(node.name)
        old_ns = self._attrsNS.get(ns_key)
        # Never unlink the node being stored: it may already be in the map.
        if old is not None and old is not node:
            stale_key = (old.namespaceURI, old.localName)
            if self._attrsNS.get(stale_key) is old:
                del self._attrsNS[stale_key]
            old.unlink()
        if old_ns is not None and old_ns is not node and old_ns is not old:
            if self._attrs.get(old_ns.name) is old_ns:
                del self._attrs[old_ns.name]
            old_ns.unlink()
        self._attrs[node.name] = node
        self._attrsNS[ns_key] = node
        if old is None and old_ns is not node:
            return old_ns
        return old

    def setNamedItemNS(self, node):
        """Same as setNamedItem()."""
        return self.setNamedItem(node)

    def __delitem__(self, attname_or_tuple):
        """Unlink the addressed attribute and remove it from both indexes."""
        node = self[attname_or_tuple]
        node.unlink()
        del self._attrs[node.name]
        del self._attrsNS[(node.namespaceURI, node.localName)]
        # ``length`` is computed from _attrs on every access, so there is
        # nothing to update here.

AttributeList = NamedNodeMap
461
Fred Drake1f549022000-09-24 05:21:58 +0000462
class Element(Node):
    """Element node: a tag name, a set of attributes, and child nodes.

    Attributes are indexed twice: ``_attrs`` maps the attribute name and
    ``_attrsNS`` maps (namespaceURI, localName) to the same attribute
    nodes.  The two dictionaries must always be changed together.
    """
    nodeType = Node.ELEMENT_NODE
    nextSibling = None
    previousSibling = None
    childNodeTypes = (Node.ELEMENT_NODE, Node.PROCESSING_INSTRUCTION_NODE,
                      Node.COMMENT_NODE, Node.TEXT_NODE,
                      Node.CDATA_SECTION_NODE, Node.ENTITY_REFERENCE_NODE)

    def __init__(self, tagName, namespaceURI=EMPTY_NAMESPACE, prefix=None,
                 localName=None):
        """Create an element called tagName with no attributes.

        localName falls back to tagName when it is not given (or is false).
        """
        Node.__init__(self)
        self.tagName = self.nodeName = tagName
        self.localName = localName or tagName
        self.prefix = prefix
        self.namespaceURI = namespaceURI
        self.nodeValue = None

        self._attrs = {}   # attributes are double-indexed:
        self._attrsNS = {} #    tagName -> Attribute
                           #    URI,localName -> Attribute
                           # in the future: consider lazy generation
                           # of attribute objects this is too tricky
                           # for now because of headaches with
                           # namespaces.

    def cloneNode(self, deep):
        """Return a copy of the element with its own copies of the attributes."""
        clone = Node.cloneNode(self, deep)
        # The base-class clone shares our dictionaries; give it fresh ones.
        clone._attrs = {}
        clone._attrsNS = {}
        for attr in self._attrs.values():
            node = attr.cloneNode(1)
            clone._attrs[node.name] = node
            clone._attrsNS[(node.namespaceURI, node.localName)] = node
            node.ownerElement = clone
        return clone

    def unlink(self):
        """Unlink every attribute, drop both indexes, then unlink the node."""
        for attr in self._attrs.values():
            attr.unlink()
        self._attrs = None
        self._attrsNS = None
        Node.unlink(self)

    def getAttribute(self, attname):
        """Return the value of attribute attname, or "" if it is not set."""
        try:
            return self._attrs[attname].value
        except KeyError:
            return ""

    def getAttributeNS(self, namespaceURI, localName):
        """Return the value of the addressed attribute, or "" if not set."""
        try:
            return self._attrsNS[(namespaceURI, localName)].value
        except KeyError:
            return ""

    def setAttribute(self, attname, value):
        """Set attribute attname to value, replacing any existing one."""
        attr = Attr(attname)
        # for performance
        attr.__dict__["value"] = attr.__dict__["nodeValue"] = value
        self.setAttributeNode(attr)

    def setAttributeNS(self, namespaceURI, qualifiedName, value):
        """Set the namespaced attribute qualifiedName to value."""
        prefix, localname = _nssplit(qualifiedName)
        # for performance
        attr = Attr(qualifiedName, namespaceURI, localname, prefix)
        attr.__dict__["value"] = attr.__dict__["nodeValue"] = value
        self.setAttributeNode(attr)

    def getAttributeNode(self, attrname):
        """Return the attribute node called attrname, or None."""
        return self._attrs.get(attrname)

    def getAttributeNodeNS(self, namespaceURI, localName):
        """Return the addressed attribute node, or None."""
        return self._attrsNS.get((namespaceURI, localName))

    def setAttributeNode(self, attr):
        """Attach attr to this element and return the attribute it replaced.

        An existing attribute with the same name, or with the same
        (namespaceURI, localName) key, is unlinked and removed from both
        indexes.  Returns None when nothing was replaced or when attr was
        already attached to this element.  Raises xml.dom.InuseAttributeErr
        when attr belongs to a different element.
        """
        if attr.ownerElement not in (None, self):
            raise xml.dom.InuseAttributeErr("attribute node already owned")
        ns_key = (attr.namespaceURI, attr.localName)
        old = self._attrs.get(attr.name, None)
        old_ns = self._attrsNS.get(ns_key, None)
        # Never unlink attr itself: it may already be attached here.
        if old is not None and old is not attr:
            stale_key = (old.namespaceURI, old.localName)
            if self._attrsNS.get(stale_key) is old:
                del self._attrsNS[stale_key]
            old.unlink()
        if old_ns is not None and old_ns is not attr and old_ns is not old:
            if self._attrs.get(old_ns.name) is old_ns:
                del self._attrs[old_ns.name]
            old_ns.unlink()
        self._attrs[attr.name] = attr
        self._attrsNS[ns_key] = attr

        # This creates a circular reference, but Element.unlink()
        # breaks the cycle since the references to the attribute
        # dictionaries are tossed.
        attr.ownerElement = self

        replaced = old
        if replaced is None:
            replaced = old_ns
        if replaced is not attr:
            # It might have already been part of this node, in which case
            # it doesn't represent a change, and should not be returned.
            return replaced

    setAttributeNodeNS = setAttributeNode

    def removeAttribute(self, name):
        """Remove attribute name; raises KeyError if it is not set."""
        attr = self._attrs[name]
        self.removeAttributeNode(attr)

    def removeAttributeNS(self, namespaceURI, localName):
        """Remove the addressed attribute; raises KeyError if it is not set."""
        attr = self._attrsNS[(namespaceURI, localName)]
        self.removeAttributeNode(attr)

    def removeAttributeNode(self, node):
        """Unlink node and delete its entries from both indexes."""
        node.unlink()
        del self._attrs[node.name]
        del self._attrsNS[(node.namespaceURI, node.localName)]

    removeAttributeNodeNS = removeAttributeNode

    def hasAttribute(self, name):
        """Return true if attribute name is set."""
        return self._attrs.has_key(name)

    def hasAttributeNS(self, namespaceURI, localName):
        """Return true if the addressed attribute is set."""
        return self._attrsNS.has_key((namespaceURI, localName))

    def getElementsByTagName(self, name):
        """Return a list of descendant elements whose tagName matches name."""
        return _getElementsByTagNameHelper(self, name, [])

    def getElementsByTagNameNS(self, namespaceURI, localName):
        """Return a list of descendant elements matching the namespaced name."""
        return _getElementsByTagNameNSHelper(self, namespaceURI, localName, [])

    def __repr__(self):
        return "<DOM Element: %s at %s>" % (self.tagName, id(self))

    def writexml(self, writer, indent="", addindent="", newl=""):
        """Write the element, its attributes and its children to writer.

        Attributes are written sorted by name.  An element without
        children is written as an empty-element tag.
        """
        # indent = current indentation
        # addindent = indentation to add to higher levels
        # newl = newline string
        writer.write(indent+"<" + self.tagName)

        attrs = self._get_attributes()
        a_names = attrs.keys()
        a_names.sort()

        for a_name in a_names:
            writer.write(" %s=\"" % a_name)
            _write_data(writer, attrs[a_name].value)
            writer.write("\"")
        if self.childNodes:
            writer.write(">%s"%(newl))
            for node in self.childNodes:
                node.writexml(writer,indent+addindent,addindent,newl)
            writer.write("%s</%s>%s" % (indent,self.tagName,newl))
        else:
            writer.write("/>%s"%(newl))

    def _get_attributes(self):
        # A new wrapper object on every call, over the live dictionaries.
        return AttributeList(self._attrs, self._attrsNS)

    try:
        property
    except NameError:
        pass
    else:
        attributes = property(_get_attributes,
                              doc="NamedNodeMap of attributes on the element.")

    def hasAttributes(self):
        """Return 1 if the element has any attribute, otherwise 0."""
        if self._attrs or self._attrsNS:
            return 1
        else:
            return 0
626
class Comment(Node):
    """Comment node; the text is held in both ``data`` and ``nodeValue``."""
    nodeName = "#comment"
    nodeType = Node.COMMENT_NODE
    attributes = None
    # Comments accept no children.
    childNodeTypes = ()

    def __init__(self, data):
        """Create a comment holding data."""
        Node.__init__(self)
        self.nodeValue = data
        self.data = data

    def writexml(self, writer, indent="", addindent="", newl=""):
        """Write the comment, prefixed by indent and followed by newl.

        addindent is accepted for signature compatibility and not used.
        """
        markup = "%s<!--%s-->%s" % (indent, self.data, newl)
        writer.write(markup)
Fred Drake1f549022000-09-24 05:21:58 +0000639
class ProcessingInstruction(Node):
    """Processing instruction node.

    The target is held in both ``target`` and ``nodeName``; the content
    is held in both ``data`` and ``nodeValue``.
    """
    nodeType = Node.PROCESSING_INSTRUCTION_NODE
    attributes = None
    # Processing instructions accept no children.
    childNodeTypes = ()

    def __init__(self, target, data):
        """Create a processing instruction for target with content data."""
        Node.__init__(self)
        self.nodeName = target
        self.target = target
        self.nodeValue = data
        self.data = data

    def writexml(self, writer, indent="", addindent="", newl=""):
        """Write the instruction, prefixed by indent and followed by newl.

        addindent is accepted for signature compatibility and not used.
        """
        markup = "%s<?%s %s?>%s" % (indent, self.target, self.data, newl)
        writer.write(markup)
Fred Drake55c38192000-06-29 19:39:57 +0000652
class CharacterData(Node):
    """Shared implementation of the DOM CharacterData editing methods.

    Every method that changes the text keeps ``data``, ``nodeValue`` and
    ``length`` in step with each other.
    """

    def __init__(self, data):
        """Create the node with *data* as its text.

        Raises TypeError when the type of *data* is not one of the
        accepted string types.
        """
        if type(data) not in _StringTypes:
            raise TypeError("node contents must be a string")
        Node.__init__(self)
        self.data = self.nodeValue = data
        self.length = len(data)

    def __repr__(self):
        """Show the class name and at most the first ten characters of the
        text, followed by "..." when the text was truncated."""
        if len(self.data) > 10:
            dotdotdot = "..."
        else:
            dotdotdot = ""
        return "<DOM %s node \"%s%s\">" % (
            self.__class__.__name__, self.data[0:10], dotdotdot)

    # internal
    def _check_offset(self, offset):
        """Raise IndexSizeErr unless 0 <= offset < len(self.data)."""
        if offset < 0:
            raise xml.dom.IndexSizeErr("offset cannot be negative")
        if offset >= len(self.data):
            raise xml.dom.IndexSizeErr("offset cannot be beyond end of data")

    # internal
    def _check_count(self, count):
        """Raise IndexSizeErr when *count* is negative."""
        if count < 0:
            raise xml.dom.IndexSizeErr("count cannot be negative")

    # internal
    def _store_data(self, data):
        """Install *data* as the text and refresh nodeValue and length."""
        self.data = data
        self.nodeValue = self.data
        self.length = len(self.data)

    def substringData(self, offset, count):
        """Return up to *count* characters of the text starting at *offset*.

        Raises xml.dom.IndexSizeErr for a negative or out-of-range offset
        or a negative count.
        """
        self._check_offset(offset)
        self._check_count(count)
        return self.data[offset:offset+count]

    def appendData(self, arg):
        """Append *arg* to the end of the text."""
        self._store_data(self.data + arg)

    def insertData(self, offset, arg):
        """Insert *arg* into the text at *offset*.

        Raises xml.dom.IndexSizeErr for a negative or out-of-range offset.
        An empty *arg* leaves the node untouched.
        """
        self._check_offset(offset)
        if arg:
            self._store_data("%s%s%s" % (
                self.data[:offset], arg, self.data[offset:]))

    def deleteData(self, offset, count):
        """Remove *count* characters of the text starting at *offset*.

        Raises xml.dom.IndexSizeErr for a negative or out-of-range offset
        or a negative count.  A zero count leaves the node untouched.
        """
        self._check_offset(offset)
        self._check_count(count)
        if count:
            self._store_data(self.data[:offset] + self.data[offset+count:])

    def replaceData(self, offset, count, arg):
        """Replace *count* characters starting at *offset* with *arg*.

        Raises xml.dom.IndexSizeErr for a negative or out-of-range offset
        or a negative count.
        """
        self._check_offset(offset)
        self._check_count(count)
        # A zero count still has to insert arg (replacing nothing); only
        # the combination "nothing removed, nothing added" is a no-op.
        if count or arg:
            self._store_data("%s%s%s" % (
                self.data[:offset], arg, self.data[offset+count:]))
Fred Drake87432f42001-04-04 14:09:46 +0000718
class Text(CharacterData):
    """DOM text node."""

    nodeType = Node.TEXT_NODE
    nodeName = "#text"
    attributes = None
    childNodeTypes = ()

    def splitText(self, offset):
        """Cut the text at *offset* and return the tail as a new Text node.

        This node keeps the characters before *offset*.  When this node is
        listed among its parent's children, the new node is placed right
        after it.  Raises xml.dom.IndexSizeErr when *offset* is negative or
        greater than the length of the text.
        """
        size = len(self.data)
        if offset < 0 or offset > size:
            raise xml.dom.IndexSizeErr("illegal offset value")
        tail = Text(self.data[offset:])
        follower = self.nextSibling
        parent = self.parentNode
        if parent and self in parent.childNodes:
            if follower is not None:
                parent.insertBefore(tail, follower)
            else:
                parent.appendChild(tail)
        # Truncate this node and keep its mirrored fields consistent.
        self.data = self.data[:offset]
        self.nodeValue = self.data
        self.length = len(self.data)
        return tail

    def writexml(self, writer, indent="", addindent="", newl=""):
        """Hand ``indent + data + newl`` to _write_data for output on
        *writer*.  *addindent* is accepted but not used here."""
        text = "%s%s%s" % (indent, self.data, newl)
        _write_data(writer, text)
Fred Drake55c38192000-06-29 19:39:57 +0000742
Fred Drake87432f42001-04-04 14:09:46 +0000743
class CDATASection(Text):
    """DOM CDATA section node; serialised as ``<![CDATA[...]]>``."""

    nodeType = Node.CDATA_SECTION_NODE
    nodeName = "#cdata-section"

    def writexml(self, writer, indent="", addindent="", newl=""):
        """Write the text to *writer* wrapped in a CDATA section.

        *indent*, *addindent* and *newl* are accepted but not used, so the
        section content is written without added whitespace.
        """
        # "]]>" inside the text would end the section early and leave the
        # output malformed.  Close the section after "]]" and reopen it
        # before ">" so the same characters are emitted as two adjacent
        # sections.
        data = self.data.replace("]]>", "]]]]><![CDATA[>")
        writer.write("<![CDATA[%s]]>" % data)
Fred Drake87432f42001-04-04 14:09:46 +0000750
751
Fred Drake1f549022000-09-24 05:21:58 +0000752def _nssplit(qualifiedName):
Fred Drake4ccf4a12000-11-21 22:02:22 +0000753 fields = _string.split(qualifiedName, ':', 1)
Paul Prescod73678da2000-07-01 04:58:47 +0000754 if len(fields) == 2:
755 return fields
756 elif len(fields) == 1:
Fred Drake49a5d032001-11-30 22:21:58 +0000757 return (None, fields[0])
Paul Prescod73678da2000-07-01 04:58:47 +0000758
Fred Drakef7cf40d2000-12-14 18:16:11 +0000759
class DocumentType(Node):
    """DOM document type node.

    All descriptive fields default to None at class level; only ``name``
    is filled in by the constructor.
    """

    nodeType = Node.DOCUMENT_TYPE_NODE
    nodeValue = None
    attributes = None
    name = None
    publicId = None
    systemId = None
    internalSubset = None
    entities = None
    notations = None

    def __init__(self, qualifiedName):
        """Initialise the base node and, when *qualifiedName* is non-empty,
        store its local part (the text after the first colon) as ``name``."""
        Node.__init__(self)
        if not qualifiedName:
            return
        self.name = _nssplit(qualifiedName)[1]
775 self.name = localname
776
777
class DOMImplementation:
    """Factory for Document and DocumentType objects."""

    def hasFeature(self, feature, version):
        """Report whether *feature* at *version* is supported.

        Only the "core" feature (matched case-insensitively) at version
        "1.0" or "2.0" is reported as supported.
        """
        if version in ("1.0", "2.0"):
            return _string.lower(feature) == "core"
        return 0

    def createDocument(self, namespaceURI, qualifiedName, doctype):
        """Create a Document whose root element is *qualifiedName*.

        A DocumentType is created from *qualifiedName* when *doctype* is
        None.  Raises xml.dom.WrongDocumentErr when *doctype* already has a
        parent, xml.dom.InvalidCharacterErr when *qualifiedName* is empty,
        and xml.dom.NamespaceErr for an "xml" prefix bound to the wrong
        namespace or any prefix used without a namespace.
        """
        if doctype and doctype.parentNode is not None:
            raise xml.dom.WrongDocumentErr(
                "doctype object owned by another DOM tree")
        document = self._createDocument()
        if doctype is None:
            doctype = self.createDocumentType(qualifiedName, None, None)
        if not qualifiedName:
            # The spec does not say clearly which exception belongs here;
            # SyntaxErr is the other obvious candidate.  Xerces raises
            # InvalidCharacterErr, and SyntaxErr is not listed for
            # createDocument, so InvalidCharacterErr looks like the better
            # choice.
            # XXX: illegal characters still need to be checked here and in
            # createElement.
            raise xml.dom.InvalidCharacterErr("Element with no name")
        prefix = _nssplit(qualifiedName)[0]
        if prefix == "xml":
            if namespaceURI != "http://www.w3.org/XML/1998/namespace":
                raise xml.dom.NamespaceErr("illegal use of 'xml' prefix")
        if prefix and not namespaceURI:
            raise xml.dom.NamespaceErr(
                "illegal use of prefix without namespaces")
        root = document.createElementNS(namespaceURI, qualifiedName)
        document.appendChild(root)
        # Tie the doctype and this implementation to the new document.
        doctype.parentNode = document
        doctype.ownerDocument = document
        document.doctype = doctype
        document.implementation = self
        return document

    def createDocumentType(self, qualifiedName, publicId, systemId):
        """Return a DocumentType for *qualifiedName* carrying the given
        public and system identifiers."""
        dtd = DocumentType(qualifiedName)
        dtd.publicId = publicId
        dtd.systemId = systemId
        return dtd

    # internal
    def _createDocument(self):
        """Return a new, empty Document instance."""
        return Document()
Fred Drakef7cf40d2000-12-14 18:16:11 +0000823
class Document(Node):
    """The root node of a DOM tree and the factory for the nodes it owns."""

    nodeType = Node.DOCUMENT_NODE
    nodeName = "#document"
    nodeValue = None
    attributes = None
    doctype = None
    parentNode = None
    previousSibling = nextSibling = None

    implementation = DOMImplementation()
    childNodeTypes = (Node.ELEMENT_NODE, Node.PROCESSING_INSTRUCTION_NODE,
                      Node.COMMENT_NODE, Node.DOCUMENT_TYPE_NODE)

    def appendChild(self, node):
        """Append *node* as the last child of the document.

        Raises HierarchyRequestErr when the node type is not allowed as a
        document child, or when *node* is an element and the document
        already has a document element.
        """
        if node.nodeType not in self.childNodeTypes:
            raise HierarchyRequestErr(
                "%s cannot be child of %s" % (repr(node), repr(self)))
        if node.parentNode is not None:
            # Detach first: the node is removed from its current parent
            # before the document-element check below is made.
            node.parentNode.removeChild(node)

        if node.nodeType == Node.ELEMENT_NODE \
           and self._get_documentElement():
            raise xml.dom.HierarchyRequestErr(
                "two document elements disallowed")
        return Node.appendChild(self, node)

    def removeChild(self, oldChild):
        """Detach *oldChild* from the document and return it."""
        self.childNodes.remove(oldChild)
        # Close the gap in the sibling chain so that the former neighbours
        # no longer point at the removed node.
        previous = oldChild.previousSibling
        following = oldChild.nextSibling
        if previous is not None:
            previous.nextSibling = following
        if following is not None:
            following.previousSibling = previous
        oldChild.nextSibling = oldChild.previousSibling = None
        oldChild.parentNode = None
        if self.documentElement is oldChild:
            self.documentElement = None

        return oldChild

    def _get_documentElement(self):
        """Return the first child that is an element, or None if the
        document has no element child."""
        for node in self.childNodes:
            if node.nodeType == Node.ELEMENT_NODE:
                return node

    # Expose ``documentElement`` through the ``property`` builtin when the
    # running interpreter provides it.
    try:
        property
    except NameError:
        pass
    else:
        documentElement = property(_get_documentElement,
                                   doc="Top-level element of this document.")

    def unlink(self):
        """Unlink the doctype, if any, and then the document itself."""
        if self.doctype is not None:
            self.doctype.unlink()
            self.doctype = None
        Node.unlink(self)

    def createDocumentFragment(self):
        """Return a new DocumentFragment owned by this document."""
        d = DocumentFragment()
        # Every other factory method here records the owner under
        # ``ownerDocument``; the fragment must use the same attribute.
        d.ownerDocument = self
        return d

    def createElement(self, tagName):
        """Return a new Element named *tagName* owned by this document."""
        e = Element(tagName)
        e.ownerDocument = self
        return e

    def createTextNode(self, data):
        """Return a new Text node holding *data*, owned by this document."""
        t = Text(data)
        t.ownerDocument = self
        return t

    def createCDATASection(self, data):
        """Return a new CDATASection holding *data*, owned by this
        document."""
        c = CDATASection(data)
        c.ownerDocument = self
        return c

    def createComment(self, data):
        """Return a new Comment holding *data*, owned by this document."""
        c = Comment(data)
        c.ownerDocument = self
        return c

    def createProcessingInstruction(self, target, data):
        """Return a new ProcessingInstruction for *target* and *data*, owned
        by this document."""
        p = ProcessingInstruction(target, data)
        p.ownerDocument = self
        return p

    def createAttribute(self, qName):
        """Return a new Attr named *qName* with an empty value, owned by
        this document."""
        a = Attr(qName)
        a.ownerDocument = self
        a.value = ""
        return a

    def createElementNS(self, namespaceURI, qualifiedName):
        """Return a new namespaced Element owned by this document; the
        prefix and local name are split out of *qualifiedName*."""
        prefix, localName = _nssplit(qualifiedName)
        e = Element(qualifiedName, namespaceURI, prefix, localName)
        e.ownerDocument = self
        return e

    def createAttributeNS(self, namespaceURI, qualifiedName):
        """Return a new namespaced Attr with an empty value, owned by this
        document; the prefix and local name are split out of
        *qualifiedName*."""
        prefix, localName = _nssplit(qualifiedName)
        a = Attr(qualifiedName, namespaceURI, localName, prefix)
        a.ownerDocument = self
        a.value = ""
        return a

    def getElementsByTagName(self, name):
        """Return the result of _getElementsByTagNameHelper for *name*,
        started with an empty result list."""
        return _getElementsByTagNameHelper(self, name, [])

    def getElementsByTagNameNS(self, namespaceURI, localName):
        """Return the result of _getElementsByTagNameNSHelper for the given
        namespace and local name, started with an empty result list."""
        return _getElementsByTagNameNSHelper(self, namespaceURI, localName, [])

    def writexml(self, writer, indent="", addindent="", newl=""):
        """Write the XML declaration and then every child node to *writer*,
        passing the formatting arguments through to each child."""
        writer.write('<?xml version="1.0" ?>\n')
        for node in self.childNodes:
            node.writexml(writer, indent, addindent, newl)
Fred Drake55c38192000-06-29 19:39:57 +0000937
Fred Drake4ccf4a12000-11-21 22:02:22 +0000938def _get_StringIO():
Fred Drakef7cf40d2000-12-14 18:16:11 +0000939 # we can't use cStringIO since it doesn't support Unicode strings
940 from StringIO import StringIO
Fred Drake4ccf4a12000-11-21 22:02:22 +0000941 return StringIO()
942
Fred Drake1f549022000-09-24 05:21:58 +0000943def _doparse(func, args, kwargs):
944 events = apply(func, args, kwargs)
945 toktype, rootNode = events.getEvent()
946 events.expandNode(rootNode)
Martin v. Löwisb417be22001-02-06 01:16:06 +0000947 events.clear()
Fred Drake55c38192000-06-29 19:39:57 +0000948 return rootNode
949
def parse(*args, **kwargs):
    """Build a DOM from a file, given by name or as a file object.

    All arguments are forwarded unchanged to pulldom.parse.
    """
    import xml.dom.pulldom as pulldom
    factory = pulldom.parse
    return _doparse(factory, args, kwargs)
Fred Drake55c38192000-06-29 19:39:57 +0000954
def parseString(*args, **kwargs):
    """Build a DOM from XML held in a string.

    All arguments are forwarded unchanged to pulldom.parseString.
    """
    import xml.dom.pulldom as pulldom
    factory = pulldom.parseString
    return _doparse(factory, args, kwargs)
Martin v. Löwis7edbd4f2001-02-22 14:05:50 +0000959
def getDOMImplementation():
    """Return the DOMImplementation instance stored on the Document class."""
    implementation = Document.implementation
    return implementation