commit | 9f1ffb2ae932f5eef1bcf1317a0e3d8f4bad0e0c | [log] [tgz] |
---|---|---|
author | Ezio Melotti <none@none> | Tue Apr 05 20:40:52 2011 +0300 |
committer | Ezio Melotti <none@none> | Tue Apr 05 20:40:52 2011 +0300 |
tree | 934c7dffb54ca6e5d3e30b611cba8ddae4a56fef | |
parent | 104c3f1020213fc2d0a5da6b23d72dd042d6c413 [diff] [blame] |
#7311: fix HTMLParser to accept non-ASCII attribute values.
```diff
diff --git a/Lib/HTMLParser.py b/Lib/HTMLParser.py
index 4fdc09a..e018901 100644
--- a/Lib/HTMLParser.py
+++ b/Lib/HTMLParser.py
@@ -26,7 +26,7 @@
 tagfind = re.compile('[a-zA-Z][-.a-zA-Z0-9:_]*')
 attrfind = re.compile(
     r'\s*([a-zA-Z_][-.:a-zA-Z_0-9]*)(\s*=\s*'
-    r'(\'[^\']*\'|"[^"]*"|[-a-zA-Z0-9./,:;+*%?!&$\(\)_#=~@]*))?')
+    r'(\'[^\']*\'|"[^"]*"|[^\s"\'=<>`]*))?')
 
 locatestarttagend = re.compile(r"""
   <[a-zA-Z][-.a-zA-Z0-9:_]*          # tag name
```