Blame - Lib/urlparse.py - platform/external/python/cpython2

2010-04-17 14:30:53 +0000

[diff] [blame]

3

urlparse module is based upon the following RFC specifications.

4

5

RFC 3986 (STD66): "Uniform Resource Identifiers" by T. Berners-Lee, R. Fielding

6

and L. Masinter, January 2005.

7

8

RFC 2732 : "Format for Literal IPv6 Addresses in URL's" by R. Hinden, B. Carpenter

9

and L.Masinter, December 1999.

10

Andrew M. Kuchling

2010-04-30 00:49:09 +0000

[diff] [blame]

11

RFC 2396: "Uniform Resource Identifiers (URI): Generic Syntax" by T.

Senthil Kumaran

2010-04-17 14:30:53 +0000

[diff] [blame]

12

Berners-Lee, R. Fielding, and L. Masinter, August 1998.

13

Andrew M. Kuchling

2010-04-30 00:49:09 +0000

[diff] [blame]

14

RFC 2368: "The mailto URL scheme", by P.Hoffman , L Masinter, J. Zwinski, July 1998.

Senthil Kumaran

2010-04-17 14:30:53 +0000

[diff] [blame]

15

16

RFC 1808: "Relative Uniform Resource Locators", by R. Fielding, UC Irvine, June

17

1995.

18

Andrew M. Kuchling

2010-04-30 00:49:09 +0000

[diff] [blame]

19

RFC 1738: "Uniform Resource Locators (URL)" by T. Berners-Lee, L. Masinter, M.

Senthil Kumaran

2010-04-17 14:30:53 +0000

[diff] [blame]

20

McCahill, December 1994

21

Andrew M. Kuchling

2010-04-30 00:49:09 +0000

[diff] [blame]

22

RFC 3986 is considered the current standard and any future changes to

23

urlparse module should conform with it. The urlparse module is

24

currently not entirely compliant with this RFC due to de facto

25

scenarios for parsing, and for backward compatibility purposes, some

26

parsing quirks from older RFCs are retained. The testcases in

Senthil Kumaran

2010-04-17 14:30:53 +0000

[diff] [blame]

27

test_urlparse.py provide a good indicator of parsing behavior.

28

Guido van Rossum

e7b146f

2000-02-04 15:28:42 +0000

[diff] [blame]

29

"""

Guido van Rossum

1994-09-12 10:36:35 +0000

[diff] [blame]

30

Serhiy Storchaka

2013-03-14 21:31:09 +0200

[diff] [blame]

31

import re

32

Fred Drake

f606e8d

2002-10-16 21:21:39 +0000

[diff] [blame]

33

# Names exported by "from urlparse import *".
__all__ = ["urlparse", "urlunparse", "urljoin", "urldefrag",
           "urlsplit", "urlunsplit", "parse_qs", "parse_qsl"]

# A classification of schemes ('' means apply by default)

# Schemes for which urljoin() resolves a relative reference against the base;
# for any other scheme urljoin() returns the second argument unchanged.
uses_relative = ['ftp', 'http', 'gopher', 'nntp', 'imap',
                 'wais', 'file', 'https', 'shttp', 'mms',
                 'prospero', 'rtsp', 'rtspu', '', 'sftp',
                 'svn', 'svn+ssh']
# Schemes that take a "//netloc" part; consulted by urlunsplit() and urljoin().
uses_netloc = ['ftp', 'http', 'gopher', 'nntp', 'telnet',
               'imap', 'wais', 'file', 'mms', 'https', 'shttp',
               'snews', 'prospero', 'rtsp', 'rtspu', 'rsync', '',
               'svn', 'svn+ssh', 'sftp','nfs','git', 'git+ssh']
# Schemes whose path may carry ";params"; consulted by urlparse().
uses_params = ['ftp', 'hdl', 'prospero', 'http', 'imap',
               'https', 'shttp', 'rtsp', 'rtspu', 'sip', 'sips',
               'mms', '', 'sftp', 'tel']

# These are not actually used anymore, but should stay for backwards
# compatibility.  (They are undocumented, but have a public-looking name.)
non_hierarchical = ['gopher', 'hdl', 'mailto', 'news',
                    'telnet', 'wais', 'imap', 'snews', 'sip', 'sips']
uses_query = ['http', 'wais', 'imap', 'https', 'shttp', 'mms',
              'gopher', 'rtsp', 'rtspu', 'sip', 'sips', '']
uses_fragment = ['ftp', 'hdl', 'http', 'gopher', 'news',
                 'nntp', 'wais', 'https', 'shttp', 'snews',
                 'file', 'prospero', '']

# Characters valid in scheme names
scheme_chars = ('abcdefghijklmnopqrstuvwxyz'
                'ABCDEFGHIJKLMNOPQRSTUVWXYZ'
                '0123456789'
                '+-.')

# urlsplit() empties the whole cache once it holds this many entries.
MAX_CACHE_SIZE = 20
# Memoised urlsplit() results, keyed on the arguments and their types.
_parse_cache = {}

67

68

def clear_cache():
    """Discard every memoised urlsplit() result.

    The module-level cache dictionary is emptied in place, so existing
    references to it remain valid.
    """
    _parse_cache.clear()

Guido van Rossum

1996-05-28 23:54:24 +0000

[diff] [blame]

71

72

Raymond Hettinger

2008-01-11 18:04:55 +0000

[diff] [blame]

73

class ResultMixin(object):
    """Shared methods for the parsed result objects.

    The host class must expose a ``netloc`` string attribute; every property
    below is derived from it on each access.
    """

    @property
    def username(self):
        """User name from the netloc's userinfo, or None if there is no '@'."""
        netloc = self.netloc
        if "@" in netloc:
            # rsplit: only the last '@' separates userinfo from the host.
            userinfo = netloc.rsplit("@", 1)[0]
            if ":" in userinfo:
                userinfo = userinfo.split(":", 1)[0]
            return userinfo
        return None

    @property
    def password(self):
        """Password from the netloc's userinfo, or None if none is given."""
        netloc = self.netloc
        if "@" in netloc:
            userinfo = netloc.rsplit("@", 1)[0]
            if ":" in userinfo:
                # Everything after the first ':' is the password.
                return userinfo.split(":", 1)[1]
        return None

    @property
    def hostname(self):
        """Lower-cased host name, or None when the netloc has no host part.

        For a bracketed (IPv6 literal) host the brackets are stripped.
        """
        netloc = self.netloc.split('@')[-1]
        if '[' in netloc and ']' in netloc:
            return netloc.split(']')[0][1:].lower()
        elif ':' in netloc:
            return netloc.split(':')[0].lower()
        elif netloc == '':
            return None
        else:
            return netloc.lower()

    @property
    def port(self):
        """Port number as an int, or None.

        None is returned when no port is present, when the port is empty
        (e.g. ``host:``, which RFC 3986 permits), or when the number lies
        outside 0..65535.  A non-numeric port raises ValueError.
        """
        # Drop userinfo and any bracketed IPv6 literal before looking for ':'.
        netloc = self.netloc.split('@')[-1].split(']')[-1]
        if ':' in netloc:
            port = netloc.split(':')[1]
            # An empty port string must not reach int(), which would raise.
            if port:
                port = int(port, 10)
                # verify legal port
                if 0 <= port <= 65535:
                    return port
        return None

Fred Drake

2006-04-01 22:14:43 +0000

[diff] [blame]

117

Raymond Hettinger

2008-01-11 18:04:55 +0000

[diff] [blame]

118

from collections import namedtuple

Fred Drake

2006-04-01 22:14:43 +0000

[diff] [blame]

119

Raymond Hettinger

2008-01-11 18:04:55 +0000

[diff] [blame]

120

class SplitResult(namedtuple('SplitResult',
                             ['scheme', 'netloc', 'path', 'query',
                              'fragment']),
                  ResultMixin):
    """5-tuple produced by urlsplit(), with the ResultMixin accessors."""

    __slots__ = ()

    def geturl(self):
        """Reassemble this result into a URL string via urlunsplit()."""
        return urlunsplit(self)

126

127

Raymond Hettinger

2008-01-11 18:04:55 +0000

[diff] [blame]

128

class ParseResult(namedtuple('ParseResult',
                             ['scheme', 'netloc', 'path', 'params', 'query',
                              'fragment']),
                  ResultMixin):
    """6-tuple produced by urlparse(), with the ResultMixin accessors."""

    __slots__ = ()

    def geturl(self):
        """Reassemble this result into a URL string via urlunparse()."""
        return urlunparse(self)

134

135

136

def urlparse(url, scheme='', allow_fragments=True):
    """Parse a URL into 6 components.

    Return a ParseResult 6-tuple: (scheme, netloc, path, params, query,
    fragment).  The components are not broken up into smaller bits (e.g.
    netloc is a single string) and % escapes are not expanded.

    The splitting itself is done by urlsplit(); this function only
    separates ";params" from the path when the scheme is listed in
    uses_params.
    """
    scheme, netloc, path, query, fragment = urlsplit(url, scheme,
                                                     allow_fragments)
    params = ''
    if scheme in uses_params and ';' in path:
        path, params = _splitparams(path)
    return ParseResult(scheme, netloc, path, params, query, fragment)

Fred Drake

2001-11-16 02:52:57 +0000

[diff] [blame]

149

150

def _splitparams(url):

151

if '/' in url:

152

i = url.find(';', url.rfind('/'))

if i < 0:

return url, ''

else:

i = url.find(';')

return url[:i], url[i+1:]

158

Johannes Gijsbers

2005-01-09 15:29:10 +0000

[diff] [blame]

159

def _splitnetloc(url, start=0):

Guido van Rossum

c6a04c2

2008-01-05 22:19:06 +0000

[diff] [blame]

160

delim = len(url) # position of end of domain part of url, default is end

161

for c in '/?#': # look for delimiters; the order is NOT important

162

wdelim = url.find(c, start) # find first of this delim

163

if wdelim >= 0: # if found

164

delim = min(delim, wdelim) # use earliest delim position

165

return url[start:delim], url[delim:] # return (domain, rest)

Johannes Gijsbers

2005-01-09 15:29:10 +0000

[diff] [blame]

166

Fred Drake

2006-04-01 22:14:43 +0000

[diff] [blame]

167

def urlsplit(url, scheme='', allow_fragments=True):
    """Parse a URL into 5 components.

    Return a SplitResult 5-tuple: (scheme, netloc, path, query, fragment).
    The components are not broken up into smaller bits (e.g. netloc is a
    single string) and % escapes are not expanded.

    *scheme* is the default used when the URL carries none.  When
    *allow_fragments* is false, '#' is not treated as a fragment delimiter.
    Results are memoised in the module-level parse cache.

    Raises ValueError("Invalid IPv6 URL") when the netloc contains only one
    of '[' and ']'.
    """
    allow_fragments = bool(allow_fragments)
    key = url, scheme, allow_fragments, type(url), type(scheme)
    cached = _parse_cache.get(key, None)
    if cached:
        return cached
    if len(_parse_cache) >= MAX_CACHE_SIZE:  # avoid runaway growth
        clear_cache()

    netloc = query = fragment = ''
    colon = url.find(':')
    if colon > 0:
        prefix, rest = url[:colon], url[colon + 1:]
        if prefix == 'http':
            # Common case: accepted without the port-number check below.
            scheme, url = prefix.lower(), rest
        elif all(ch in scheme_chars for ch in prefix):
            # Make sure "rest" is not actually a port number (in which case
            # "prefix" is really part of the path).
            if not rest or any(ch not in '0123456789' for ch in rest):
                scheme, url = prefix.lower(), rest

    if url[:2] == '//':
        netloc, url = _splitnetloc(url, 2)
        # Exactly one of the two brackets present means a malformed literal.
        if ('[' in netloc) != (']' in netloc):
            raise ValueError("Invalid IPv6 URL")
    if allow_fragments and '#' in url:
        url, fragment = url.split('#', 1)
    if '?' in url:
        url, query = url.split('?', 1)
    result = SplitResult(scheme, netloc, url, query, fragment)
    _parse_cache[key] = result
    return result

Guido van Rossum

1994-09-12 10:36:35 +0000

[diff] [blame]

221

Brett Cannon

2008-08-03 00:51:02 +0000

[diff] [blame]

222

def urlunparse(data):
    """Put a parsed URL back together again.

    *data* is any six-item iterable of (scheme, netloc, path, params,
    query, fragment).  The result may be a slightly different, but
    equivalent URL, if the URL that was parsed originally had redundant
    delimiters, e.g. a ? with an empty query.
    """
    scheme, netloc, path, params, query, fragment = data
    if params:
        # Fold the params back onto the path before delegating.
        path = "%s;%s" % (path, params)
    return urlunsplit((scheme, netloc, path, query, fragment))

231

Brett Cannon

2008-08-03 00:51:02 +0000

[diff] [blame]

232

def urlunsplit(data):
    """Combine the elements of a tuple as returned by urlsplit() into a
    complete URL as a string.

    *data* can be any five-item iterable of (scheme, netloc, path, query,
    fragment).  The result may be a slightly different, but equivalent URL,
    if the URL that was parsed originally had unnecessary delimiters (for
    example, a ? with an empty query).
    """
    scheme, netloc, path, query, fragment = data
    wants_authority = netloc or (
        scheme and scheme in uses_netloc and path[:2] != '//')
    if wants_authority:
        # A non-empty path following an authority must start with '/'.
        if path and path[:1] != '/':
            path = '/' + path
        path = '//' + (netloc or '') + path
    result = path
    if scheme:
        result = scheme + ':' + result
    if query:
        result = result + '?' + query
    if fragment:
        result = result + '#' + fragment
    return result

Guido van Rossum

1994-09-12 10:36:35 +0000

[diff] [blame]

249

Fred Drake

2006-04-01 22:14:43 +0000

[diff] [blame]

250

def urljoin(base, url, allow_fragments=True):
    """Join a base URL and a possibly relative URL to form an absolute
    interpretation of the latter.

    An empty *base* yields *url* unchanged and an empty *url* yields
    *base*.  *url* is also returned unchanged when its scheme differs from
    the base's or is not listed in uses_relative.  *allow_fragments* is
    passed through to urlparse() for both arguments.
    """
    if not base:
        return url
    if not url:
        return base
    bscheme, bnetloc, bpath, bparams, bquery, bfragment = \
            urlparse(base, '', allow_fragments)
    # The base's scheme is the default when url carries no scheme.
    scheme, netloc, path, params, query, fragment = \
            urlparse(url, bscheme, allow_fragments)
    if scheme != bscheme or scheme not in uses_relative:
        return url
    if scheme in uses_netloc:
        if netloc:
            # url has its own netloc: nothing is inherited from the base.
            return urlunparse((scheme, netloc, path,
                               params, query, fragment))
        netloc = bnetloc
    if path[:1] == '/':
        # Absolute path: keep it, with the netloc chosen above.
        return urlunparse((scheme, netloc, path,
                           params, query, fragment))
    if not path and not params:
        # No path or params: inherit both from the base, and the query too
        # when url has none.
        path = bpath
        params = bparams
        if not query:
            query = bquery
        return urlunparse((scheme, netloc, path,
                           params, query, fragment))
    # Relative path: drop the base's last segment, then append url's segments.
    segments = bpath.split('/')[:-1] + path.split('/')
    # XXX The stuff below is bogus in various ways...
    if segments[-1] == '.':
        # A trailing '.' becomes an empty final segment.
        segments[-1] = ''
    while '.' in segments:
        segments.remove('.')
    # Repeatedly delete one "<name>/.." pair, rescanning from the start after
    # each deletion, until a full scan finds none.  The scan starts at
    # index 1 and stops before the final segment.
    while 1:
        i = 1
        n = len(segments) - 1
        while i < n:
            if (segments[i] == '..'
                and segments[i-1] not in ('', '..')):
                del segments[i-1:i+1]
                break
            i = i+1
        else:
            break
    # The scan above never examines the final segment, so a trailing '..'
    # is resolved here.
    if segments == ['', '..']:
        segments[-1] = ''
    elif len(segments) >= 2 and segments[-1] == '..':
        segments[-2:] = ['']
    return urlunparse((scheme, netloc, '/'.join(segments),
                       params, query, fragment))

Guido van Rossum

1994-09-12 10:36:35 +0000

[diff] [blame]

301

Guido van Rossum

1996-05-28 23:54:24 +0000

[diff] [blame]

302

def urldefrag(url):
    """Remove any existing fragment from *url*.

    Return a 2-tuple of the defragmented URL and the fragment.  If the URL
    contains no '#', it is returned unchanged together with an empty
    string.
    """
    if '#' not in url:
        return url, ''
    parts = urlparse(url)
    fragment = parts[5]
    # Rebuild from the first five components with the fragment blanked.
    stripped = urlunparse(tuple(parts[:5]) + ('',))
    return stripped, fragment

Guido van Rossum

1996-05-28 23:54:24 +0000

[diff] [blame]

315

Serhiy Storchaka

2013-03-14 21:31:09 +0200

[diff] [blame]

# Define _is_unicode() according to whether the interpreter provides the
# builtin name "unicode".
try:
    unicode
except NameError:
    # No unicode type available: nothing can be a unicode string.
    def _is_unicode(x):
        return 0
else:
    def _is_unicode(x):
        return isinstance(x, unicode)

324

Facundo Batista

2008-09-03 22:35:50 +0000

[diff] [blame]

325

# unquote method for parse_qs and parse_qsl

R. David Murray

2010-05-25 15:20:46 +0000

[diff] [blame]

326

# Cannot use directly from urllib as it would create a circular reference

327

# because urllib uses urlparse methods (urljoin). If you update this function,

328

# update it also in urllib.  This code duplication does not exist in Python3.

Senthil Kumaran

f3e9b2a

2010-03-18 12:14:15 +0000

[diff] [blame]

329

330

# Hex digits in both cases, so mixed-case escapes are covered too.
_hexdig = '0123456789ABCDEFabcdef'
# Lookup table from every two-hex-digit string to the character with that
# code; unquote() uses it to decode the two characters following a '%'.
_hextochr = dict((a+b, chr(int(a+b,16)))
                 for a in _hexdig for b in _hexdig)
# Captures runs of characters in the range \x00-\x7f; unquote() splits
# unicode input with it so that only those runs are percent-decoded.
_asciire = re.compile('([\x00-\x7f]+)')

Facundo Batista

2008-09-03 22:35:50 +0000

[diff] [blame]

334

335

def unquote(s):
    """unquote('abc%20def') -> 'abc def'.

    Each '%' followed by two hex digits is replaced by the character with
    that code.  A '%' not followed by two hex digits is left as it is.
    For unicode input only the runs matched by _asciire are decoded, and
    the decoded bytes are interpreted as latin1.
    """
    if _is_unicode(s):
        if '%' not in s:
            return s
        # With a capturing group, split() puts the matched runs at the odd
        # indices and the text between them at the even indices.
        chunks = _asciire.split(s)
        out = [chunks[0]]
        for idx in range(1, len(chunks), 2):
            out.append(unquote(str(chunks[idx])).decode('latin1'))
            out.append(chunks[idx + 1])
        return ''.join(out)

    pieces = s.split('%')
    # fastpath: no '%' at all
    if len(pieces) == 1:
        return s
    out = [pieces[0]]
    for piece in pieces[1:]:
        decoded = _hextochr.get(piece[:2])
        if decoded is None:
            # Not a valid escape: put the '%' back untouched.
            out.append('%')
            out.append(piece)
        else:
            out.append(decoded)
            out.append(piece[2:])
    return ''.join(out)

Facundo Batista

2008-09-03 22:35:50 +0000

[diff] [blame]

362

363

def parse_qs(qs, keep_blank_values=0, strict_parsing=0):
    """Parse a query string into a dictionary of value lists.

        Arguments:

        qs: percent-encoded query string to be parsed

        keep_blank_values: flag indicating whether blank values in
            percent-encoded queries should be treated as blank strings.
            A true value indicates that blanks should be retained as
            blank strings.  The default false value indicates that
            blank values are to be ignored and treated as if they were
            not included.

        strict_parsing: flag indicating what to do with parsing errors.
            If false (the default), errors are silently ignored.
            If true, errors raise a ValueError exception.

        Returns a dict mapping each name to the list of its values, in the
        order parse_qsl() yields them.
    """
    grouped = {}
    for name, value in parse_qsl(qs, keep_blank_values, strict_parsing):
        grouped.setdefault(name, []).append(value)
    return grouped

def parse_qsl(qs, keep_blank_values=0, strict_parsing=0):

390

"""Parse a query given as a string argument.

Arguments:

Senthil Kumaran

2010-08-09 20:18:04 +0000

[diff] [blame]

394

qs: percent-encoded query string to be parsed

Facundo Batista

2008-09-03 22:35:50 +0000

[diff] [blame]

395

396

keep_blank_values: flag indicating whether blank values in

Senthil Kumaran

a5ba05c

2010-08-09 20:18:04 +0000

[diff] [blame]

397

percent-encoded queries should be treated as blank strings. A

Facundo Batista