Blame - Lib/urlparse.py - platform/external/python/cpython2

2010-04-17 14:30:53 +0000

[diff] [blame]

3

urlparse module is based upon the following RFC specifications.

4

5

RFC 3986 (STD66): "Uniform Resource Identifiers" by T. Berners-Lee, R. Fielding

6

and L. Masinter, January 2005.

7

8

RFC 2732: "Format for Literal IPv6 Addresses in URL's" by R. Hinden, B. Carpenter

9

and L.Masinter, December 1999.

10

Andrew M. Kuchling

2010-04-30 00:49:09 +0000

[diff] [blame]

11

RFC 2396: "Uniform Resource Identifiers (URI): Generic Syntax" by T.

Senthil Kumaran

2010-04-17 14:30:53 +0000

[diff] [blame]

12

Berners-Lee, R. Fielding, and L. Masinter, August 1998.

13

Andrew M. Kuchling

2010-04-30 00:49:09 +0000

[diff] [blame]

14

RFC 2368: "The mailto URL scheme", by P. Hoffman, L. Masinter, J. Zawinski, July 1998.

Senthil Kumaran

2010-04-17 14:30:53 +0000

[diff] [blame]

15

16

RFC 1808: "Relative Uniform Resource Locators", by R. Fielding, UC Irvine, June

17

1995.

18

Andrew M. Kuchling

2010-04-30 00:49:09 +0000

[diff] [blame]

19

RFC 1738: "Uniform Resource Locators (URL)" by T. Berners-Lee, L. Masinter, M.

Senthil Kumaran

2010-04-17 14:30:53 +0000

[diff] [blame]

20

McCahill, December 1994

21

Andrew M. Kuchling

2010-04-30 00:49:09 +0000

[diff] [blame]

22

RFC 3986 is considered the current standard and any future changes to

23

urlparse module should conform with it. The urlparse module is

24

currently not entirely compliant with this RFC due to de facto

25

scenarios for parsing, and for backward compatibility purposes, some

26

parsing quirks from older RFCs are retained. The testcases in

Senthil Kumaran

2010-04-17 14:30:53 +0000

[diff] [blame]

27

test_urlparse.py provide a good indicator of parsing behavior.

28

Guido van Rossum

e7b146f

2000-02-04 15:28:42 +0000

[diff] [blame]

29

"""

Guido van Rossum

1994-09-12 10:36:35 +0000

[diff] [blame]

30

Serhiy Storchaka

2013-03-14 21:31:09 +0200

[diff] [blame]

31

import re

32

Fred Drake

f606e8d

2002-10-16 21:21:39 +0000

[diff] [blame]

33

__all__ = ["urlparse", "urlunparse", "urljoin", "urldefrag",

Facundo Batista

2008-09-03 22:35:50 +0000

[diff] [blame]

34

"urlsplit", "urlunsplit", "parse_qs", "parse_qsl"]

Skip Montanaro

40fc160

2001-03-01 04:27:19 +0000

[diff] [blame]

35

Guido van Rossum

1994-09-12 10:36:35 +0000

[diff] [blame]

36

# Scheme classification tables.  The empty string entry means "also apply
# when the URL has no scheme".  These are plain lists on purpose: callers
# may extend them at runtime to register additional schemes.
uses_relative = [
    'ftp', 'http', 'gopher', 'nntp', 'imap', 'wais', 'file', 'https',
    'shttp', 'mms', 'prospero', 'rtsp', 'rtspu', '', 'sftp', 'svn',
    'svn+ssh',
]
uses_netloc = [
    'ftp', 'http', 'gopher', 'nntp', 'telnet', 'imap', 'wais', 'file',
    'mms', 'https', 'shttp', 'snews', 'prospero', 'rtsp', 'rtspu',
    'rsync', '', 'svn', 'svn+ssh', 'sftp', 'nfs', 'git', 'git+ssh',
]
uses_params = [
    'ftp', 'hdl', 'prospero', 'http', 'imap', 'https', 'shttp', 'rtsp',
    'rtspu', 'sip', 'sips', 'mms', '', 'sftp', 'tel',
]

# The three tables below are no longer consulted by this module.  They are
# undocumented but carry public-looking names, so they are kept for
# backwards compatibility.
non_hierarchical = [
    'gopher', 'hdl', 'mailto', 'news', 'telnet', 'wais', 'imap', 'snews',
    'sip', 'sips',
]
uses_query = [
    'http', 'wais', 'imap', 'https', 'shttp', 'mms', 'gopher', 'rtsp',
    'rtspu', 'sip', 'sips', '',
]
uses_fragment = [
    'ftp', 'hdl', 'http', 'gopher', 'news', 'nntp', 'wais', 'https',
    'shttp', 'snews', 'file', 'prospero', '',
]

# Every character that may appear in a scheme name.
scheme_chars = (
    'abcdefghijklmnopqrstuvwxyz'
    'ABCDEFGHIJKLMNOPQRSTUVWXYZ'
    '0123456789'
    '+-.'
)

Guido van Rossum

1994-09-12 10:36:35 +0000

[diff] [blame]

64

Guido van Rossum

7449540

1997-07-14 19:08:15 +0000

[diff] [blame]

65

# Upper bound on the number of memoized urlsplit() results; once reached,
# the whole cache is dropped rather than evicting individual entries.
MAX_CACHE_SIZE = 20
_parse_cache = {}


def clear_cache():
    """Discard every memoized result held in the module-level parse cache."""
    _parse_cache.clear()

Guido van Rossum

1996-05-28 23:54:24 +0000

[diff] [blame]

71

72

Raymond Hettinger

2008-01-11 18:04:55 +0000

[diff] [blame]

73

class ResultMixin(object):
    """Accessors that pick apart the ``netloc`` field of a parse result.

    The host class must expose a ``netloc`` string attribute; each property
    below derives its value from that string alone.
    """

    @property
    def username(self):
        """User name from the ``user[:password]@`` prefix, or None."""
        userinfo, at_sign, _ = self.netloc.rpartition("@")
        if not at_sign:
            return None
        # Everything before the first ':' is the user name.
        return userinfo.partition(":")[0]

    @property
    def password(self):
        """Password from the ``user:password@`` prefix, or None."""
        userinfo, at_sign, _ = self.netloc.rpartition("@")
        if at_sign:
            _, colon, secret = userinfo.partition(":")
            if colon:
                return secret
        return None

    @property
    def hostname(self):
        """Lower-cased host name, or None when netloc has no host part."""
        hostinfo = self.netloc.rpartition('@')[2]
        if '[' in hostinfo and ']' in hostinfo:
            # Bracketed literal: keep what lies between the leading
            # character and the first ']'.
            return hostinfo.partition(']')[0][1:].lower()
        if ':' in hostinfo:
            return hostinfo.partition(':')[0].lower()
        if hostinfo == '':
            return None
        return hostinfo.lower()

    @property
    def port(self):
        """Port as an int when present and within 0..65535, else None.

        A non-numeric port makes int() raise ValueError.
        """
        # Drop userinfo and any bracketed host so only ":port" can remain.
        tail = self.netloc.rpartition('@')[2].rpartition(']')[2]
        if ':' not in tail:
            return None
        digits = tail.split(':')[1]
        if not digits:
            return None
        number = int(digits, 10)
        # verify legal port
        if 0 <= number <= 65535:
            return number
        return None

Fred Drake

2006-04-01 22:14:43 +0000

[diff] [blame]

118

Raymond Hettinger

2008-01-11 18:04:55 +0000

[diff] [blame]

119

from collections import namedtuple

Fred Drake

2006-04-01 22:14:43 +0000

[diff] [blame]

120

Raymond Hettinger

2008-01-11 18:04:55 +0000

[diff] [blame]

121

class SplitResult(namedtuple('SplitResult',
                             'scheme netloc path query fragment'),
                  ResultMixin):
    """Five-field named tuple plus the ResultMixin netloc accessors."""

    __slots__ = ()

    def geturl(self):
        """Reassemble this result into a URL string via urlunsplit()."""
        return urlunsplit(self)

127

128

Raymond Hettinger

2008-01-11 18:04:55 +0000

[diff] [blame]

129

class ParseResult(namedtuple('ParseResult',
                             'scheme netloc path params query fragment'),
                  ResultMixin):
    """Six-field named tuple plus the ResultMixin netloc accessors."""

    __slots__ = ()

    def geturl(self):
        """Reassemble this result into a URL string via urlunparse()."""
        return urlunparse(self)

135

136

137

def urlparse(url, scheme='', allow_fragments=True):
    """Parse a URL into 6 components:
    <scheme>://<netloc>/<path>;<params>?<query>#<fragment>
    Return a 6-tuple: (scheme, netloc, path, params, query, fragment).
    Note that we don't break the components up in smaller bits
    (e.g. netloc is a single string) and we don't expand % escapes."""
    scheme, netloc, path, query, fragment = urlsplit(url, scheme,
                                                     allow_fragments)
    params = ''
    # Only schemes listed in uses_params get ";params" split off the path.
    if scheme in uses_params and ';' in path:
        path, params = _splitparams(path)
    return ParseResult(scheme, netloc, path, params, query, fragment)

Fred Drake

2001-11-16 02:52:57 +0000

[diff] [blame]

150

151

def _splitparams(url):
    """Split ``path;params`` into ``(path, params)``.

    Only a ';' located in the last path segment (at or after the final '/')
    counts as the params delimiter.  When there is no such ';' the input is
    returned unchanged with empty params.
    """
    # Start the search at the last '/', or at the beginning when there is
    # none, so a ';' in an earlier segment is never mistaken for params.
    semi = url.find(';', max(url.rfind('/'), 0))
    if semi < 0:
        # No delimiter: slicing with -1 would silently drop the final
        # character of the path, so bail out explicitly.
        return url, ''
    return url[:semi], url[semi + 1:]

159

Johannes Gijsbers

2005-01-09 15:29:10 +0000

[diff] [blame]

160

def _splitnetloc(url, start=0):
    """Return ``(netloc, rest)`` where netloc is ``url[start:end]``.

    ``end`` is the position of the earliest '/', '?' or '#' found at or
    after ``start``; when none occurs the netloc runs to the end of ``url``
    and ``rest`` is empty.
    """
    found = [pos for pos in (url.find(mark, start) for mark in '/?#')
             if pos >= 0]
    # The string length acts as the fallback end when no delimiter exists.
    end = min(found + [len(url)])
    return url[start:end], url[end:]

Johannes Gijsbers

2005-01-09 15:29:10 +0000

[diff] [blame]

167

Fred Drake

2006-04-01 22:14:43 +0000

[diff] [blame]

168

def urlsplit(url, scheme='', allow_fragments=True):
    """Parse a URL into 5 components:
    <scheme>://<netloc>/<path>?<query>#<fragment>
    Return a 5-tuple: (scheme, netloc, path, query, fragment).
    Note that we don't break the components up in smaller bits
    (e.g. netloc is a single string) and we don't expand % escapes.

    Results are memoized in the module-level parse cache.  Raises
    ValueError("Invalid IPv6 URL") when the netloc contains only one of
    '[' and ']'.
    """
    allow_fragments = bool(allow_fragments)
    # The argument types are part of the key so that equal-comparing
    # values of different string types do not share a cache entry.
    key = url, scheme, allow_fragments, type(url), type(scheme)
    cached = _parse_cache.get(key)
    if cached is not None:
        return cached
    if len(_parse_cache) >= MAX_CACHE_SIZE:  # avoid runaway growth
        clear_cache()

    netloc = query = fragment = ''
    colon = url.find(':')
    if colon > 0:
        prefix = url[:colon]
        if prefix == 'http':
            # Common case: accepted without the scheme-character and
            # port-number checks applied to other prefixes.
            scheme, url = prefix.lower(), url[colon + 1:]
        elif all(ch in scheme_chars for ch in prefix):
            # make sure "url" is not actually a port number (in which case
            # "scheme" is really part of the path)
            rest = url[colon + 1:]
            if not rest or any(ch not in '0123456789' for ch in rest):
                # not a port number
                scheme, url = prefix.lower(), rest

    if url[:2] == '//':
        netloc, url = _splitnetloc(url, 2)
        # Exactly one of the two brackets present means a malformed
        # IPv6 literal.
        if ('[' in netloc) != (']' in netloc):
            raise ValueError("Invalid IPv6 URL")
    if allow_fragments and '#' in url:
        url, fragment = url.split('#', 1)
    if '?' in url:
        url, query = url.split('?', 1)
    result = SplitResult(scheme, netloc, url, query, fragment)
    _parse_cache[key] = result
    return result

Guido van Rossum

1994-09-12 10:36:35 +0000

[diff] [blame]

222

Brett Cannon

2008-08-03 00:51:02 +0000

[diff] [blame]

223

def urlunparse(data):
    """Put a parsed URL back together again.  This may result in a
    slightly different, but equivalent URL, if the URL that was parsed
    originally had redundant delimiters, e.g. a ? with an empty query
    (the draft states that these are equivalent).

    ``data`` is any six-item iterable:
    (scheme, netloc, path, params, query, fragment).
    """
    scheme, netloc, path, params, query, fragment = data
    # Fold non-empty params back into the path, then defer to urlunsplit().
    path_with_params = "%s;%s" % (path, params) if params else path
    return urlunsplit((scheme, netloc, path_with_params, query, fragment))

232

Brett Cannon

2008-08-03 00:51:02 +0000

[diff] [blame]

233

def urlunsplit(data):
    """Combine the elements of a tuple as returned by urlsplit() into a
    complete URL as a string. The data argument can be any five-item iterable.
    This may result in a slightly different, but equivalent URL, if the URL that
    was parsed originally had unnecessary delimiters (for example, a ? with an
    empty query; the RFC states that these are equivalent)."""
    scheme, netloc, url, query, fragment = data
    # Emit "//netloc" when there is a netloc, or when the scheme is one of
    # uses_netloc and the path does not already start with "//".
    wants_authority = netloc or (
        scheme and scheme in uses_netloc and url[:2] != '//')
    if wants_authority:
        if url and url[:1] != '/':
            # A non-empty path following a netloc must be rooted.
            url = '/' + url
        url = '//' + (netloc or '') + url
    if scheme:
        url = scheme + ':' + url
    if query:
        url = url + '?' + query
    if fragment:
        url = url + '#' + fragment
    return url

Guido van Rossum

1994-09-12 10:36:35 +0000

[diff] [blame]

250

Fred Drake

2006-04-01 22:14:43 +0000

[diff] [blame]

251

def urljoin(base, url, allow_fragments=True):
    """Join a base URL and a possibly relative URL to form an absolute
    interpretation of the latter."""
    if not base:
        return url
    if not url:
        return base

    bscheme, bnetloc, bpath, bparams, bquery = \
        urlparse(base, '', allow_fragments)[:5]
    scheme, netloc, path, params, query, fragment = \
        urlparse(url, bscheme, allow_fragments)

    # A different scheme, or one that has no relative form: url stands alone.
    if scheme != bscheme or scheme not in uses_relative:
        return url
    if scheme in uses_netloc:
        if netloc:
            return urlunparse((scheme, netloc, path,
                               params, query, fragment))
        netloc = bnetloc
    if path[:1] == '/':
        # Absolute path: nothing from the base path is used.
        return urlunparse((scheme, netloc, path,
                           params, query, fragment))
    if not path and not params:
        # Only a query and/or fragment was given: reuse base path/params.
        if not query:
            query = bquery
        return urlunparse((scheme, netloc, bpath,
                           bparams, query, fragment))

    # Replace the last segment of the base path with the relative path.
    segments = bpath.split('/')[:-1] + path.split('/')
    # XXX The stuff below is bogus in various ways...
    if segments[-1] == '.':
        segments[-1] = ''
    segments = [seg for seg in segments if seg != '.']
    # Collapse "name/.." pairs one at a time, rescanning from the start
    # after each removal, until a full scan finds nothing to collapse.
    collapsed = True
    while collapsed:
        collapsed = False
        for idx in range(1, len(segments) - 1):
            if (segments[idx] == '..'
                    and segments[idx - 1] not in ('', '..')):
                del segments[idx - 1:idx + 1]
                collapsed = True
                break
    if segments == ['', '..']:
        segments[-1] = ''
    elif len(segments) >= 2 and segments[-1] == '..':
        segments[-2:] = ['']
    return urlunparse((scheme, netloc, '/'.join(segments),
                       params, query, fragment))

Guido van Rossum

1994-09-12 10:36:35 +0000

[diff] [blame]

302

Guido van Rossum

1996-05-28 23:54:24 +0000

[diff] [blame]

303

def urldefrag(url):
    """Removes any existing fragment from URL.

    Returns a tuple of the defragmented URL and the fragment.  If
    the URL contained no fragments, the second element is the
    empty string.
    """
    if '#' not in url:
        # Nothing to strip; hand the input back untouched.
        return url, ''
    scheme, netloc, path, params, query, fragment = urlparse(url)
    without_fragment = urlunparse((scheme, netloc, path, params, query, ''))
    return without_fragment, fragment

Guido van Rossum

1996-05-28 23:54:24 +0000

[diff] [blame]

316

Serhiy Storchaka

2013-03-14 21:31:09 +0200

[diff] [blame]

# Define _is_unicode() according to whether the running interpreter has a
# built-in ``unicode`` type.
try:
    unicode
except NameError:
    def _is_unicode(x):
        """Always false: there is no ``unicode`` type to test against."""
        return 0
else:
    def _is_unicode(x):
        """Tell whether x is an instance of the built-in ``unicode`` type."""
        return isinstance(x, unicode)

325

Facundo Batista

2008-09-03 22:35:50 +0000

[diff] [blame]

326

# unquote method for parse_qs and parse_qsl

R. David Murray

2010-05-25 15:20:46 +0000

[diff] [blame]

327

# Cannot use directly from urllib as it would create a circular reference

328

# because urllib uses urlparse methods (urljoin). If you update this function,

329

# update it also in urllib. This code duplication does not exist in Python 3.

Senthil Kumaran

f3e9b2a

2010-03-18 12:14:15 +0000

[diff] [blame]

330

331

# Lookup tables used by unquote().
_hexdig = '0123456789ABCDEFabcdef'
# Maps every two-hex-digit string (any mix of cases) to its character.
_hextochr = {
    hi + lo: chr(int(hi + lo, 16))
    for hi in _hexdig
    for lo in _hexdig
}
# Captures maximal runs of ASCII characters.
_asciire = re.compile('([\x00-\x7f]+)')

Facundo Batista

2008-09-03 22:35:50 +0000

[diff] [blame]

335

336

def unquote(s):
    """unquote('abc%20def') -> 'abc def'."""
    if _is_unicode(s):
        if '%' not in s:
            return s
        # _asciire.split() alternates non-ASCII text (even indexes) with
        # ASCII runs (odd indexes); only the ASCII runs can hold escapes.
        chunks = _asciire.split(s)
        out = [chunks[0]]
        for idx in range(1, len(chunks), 2):
            out.append(unquote(str(chunks[idx])).decode('latin1'))
            out.append(chunks[idx + 1])
        return ''.join(out)

    pieces = s.split('%')
    # fastpath
    if len(pieces) == 1:
        return s
    out = [pieces[0]]
    for piece in pieces[1:]:
        decoded = _hextochr.get(piece[:2])
        if decoded is None:
            # Not followed by two hex digits: keep the '%' literally.
            out.extend(('%', piece))
        else:
            out.extend((decoded, piece[2:]))
    return ''.join(out)

Facundo Batista

2008-09-03 22:35:50 +0000

[diff] [blame]

363

364

def parse_qs(qs, keep_blank_values=0, strict_parsing=0):
    """Parse a query given as a string argument.

        Arguments:

        qs: percent-encoded query string to be parsed

        keep_blank_values: flag indicating whether blank values in
            percent-encoded queries should be treated as blank strings.
            A true value indicates that blanks should be retained as
            blank strings.  The default false value indicates that
            blank values are to be ignored and treated as if they were
            not included.

        strict_parsing: flag indicating what to do with parsing errors.
            If false (the default), errors are silently ignored.
            If true, errors raise a ValueError exception.

        Returns a dictionary mapping each name to the list of its values,
        in the order parse_qsl() yields them.
    """
    values_by_name = {}
    for name, value in parse_qsl(qs, keep_blank_values, strict_parsing):
        values_by_name.setdefault(name, []).append(value)
    return values_by_name

def parse_qsl(qs, keep_blank_values=0, strict_parsing=0):

391

"""Parse a query given as a string argument.

Arguments:

Senthil Kumaran

2010-08-09 20:18:04 +0000

[diff] [blame]

395

qs: percent-encoded query string to be parsed

Facundo Batista

2008-09-03 22:35:50 +0000

[diff] [blame]

396

397

keep_blank_values: flag indicating whether blank values in

Senthil Kumaran

a5ba05c

2010-08-09 20:18:04 +0000

[diff] [blame]

398

percent-encoded queries should be treated as blank strings. A

Facundo Batista