Issue2987 - Added an additional invalid URL test case and improved the invalid URL checking code.

commit: 241a04371bb3b1f09d91e1f5877655c54627071c [log] [tgz]
author: Senthil Kumaran <orsenthil@gmail.com> Tue Apr 20 20:37:59 2010 +0000
committer: Senthil Kumaran <orsenthil@gmail.com> Tue Apr 20 20:37:59 2010 +0000
tree: e0f74b37144efe8e5768f9e992eeb67f5b6383bd
parent: c166b4021facb0cac9e54bfb1b8c48cc0e6cba6f [diff]
diff --git a/Lib/test/test_urlparse.py b/Lib/test/test_urlparse.py
index 4085de7..c25b6e0 100644
--- a/Lib/test/test_urlparse.py
+++ b/Lib/test/test_urlparse.py

@@ -272,6 +272,7 @@
         for invalid_url in [
                 'http://::12.34.56.78]/',
                 'http://[::1/foo/',
+                'http://[::1/foo/bad]/bad',
                 'http://[::ffff:12.34.56.78']:
             self.assertRaises(ValueError, lambda : urlparse.urlparse(invalid_url).hostname)
             self.assertRaises(ValueError, lambda : urlparse.urlparse(invalid_url))

diff --git a/Lib/urlparse.py b/Lib/urlparse.py
index 8c37dff..1a81518 100644
--- a/Lib/urlparse.py
+++ b/Lib/urlparse.py

@@ -90,8 +90,6 @@
         netloc = self.netloc.split('@')[-1]
         if '[' in netloc and ']' in netloc:
             return netloc.split(']')[0][1:].lower()
-        elif '[' in netloc or ']' in netloc:
-            raise ValueError("Invalid IPv6 hostname")
         elif ':' in netloc:
             return netloc.split(':')[0].lower()
         elif netloc == '':
@@ -151,10 +149,6 @@
 
 def _splitnetloc(url, start=0):
     delim = len(url)   # position of end of domain part of url, default is end
-    if '[' in url:     # check for invalid IPv6 URL
-        if not ']' in url: raise ValueError("Invalid IPv6 URL")
-    elif ']' in url:
-        if not '[' in url: raise ValueError("Invalid IPv6 URL")
     for c in '/?#':    # look for delimiters; the order is NOT important
         wdelim = url.find(c, start)        # find first of this delim
         if wdelim >= 0:                    # if found
@@ -182,6 +176,10 @@
             url = url[i+1:]
             if url[:2] == '//':
                 netloc, url = _splitnetloc(url, 2)
+                if '[' in netloc :
+                    if not ']' in netloc: raise ValueError("Invalid IPv6 URL")
+                if ']' in netloc:
+                    if not '[' in netloc: raise ValueError("Invalid IPv6 URL")
             if allow_fragments and '#' in url:
                 url, fragment = url.split('#', 1)
             if '?' in url:
@@ -197,6 +195,10 @@
 
     if url[:2] == '//':
         netloc, url = _splitnetloc(url, 2)
+        if '[' in netloc:
+            if not ']' in netloc: raise ValueError("Invalid IPv6 URL")
+        if ']' in netloc:
+            if not '[' in netloc: raise ValueError("Invalid IPv6 URL")
     if allow_fragments and scheme in uses_fragment and '#' in url:
         url, fragment = url.split('#', 1)
     if scheme in uses_query and '?' in url:
commit	241a04371bb3b1f09d91e1f5877655c54627071c	[log] [tgz]
author	Senthil Kumaran <orsenthil@gmail.com>	Tue Apr 20 20:37:59 2010 +0000
committer	Senthil Kumaran <orsenthil@gmail.com>	Tue Apr 20 20:37:59 2010 +0000
tree	e0f74b37144efe8e5768f9e992eeb67f5b6383bd
parent	c166b4021facb0cac9e54bfb1b8c48cc0e6cba6f [diff]