Edit File by line
/home/barbar84/www/wp-conte.../plugins/sujqvwi/ExeBy/exe_root.../opt/alt/python27/lib64/python2....
File: urlparse.py
"""Parse (absolute and relative) URLs.
[0] Fix | Delete
[1] Fix | Delete
urlparse module is based upon the following RFC specifications.
[2] Fix | Delete
[3] Fix | Delete
RFC 3986 (STD66): "Uniform Resource Identifiers" by T. Berners-Lee, R. Fielding
[4] Fix | Delete
and L. Masinter, January 2005.
[5] Fix | Delete
[6] Fix | Delete
RFC 2732 : "Format for Literal IPv6 Addresses in URL's" by R.Hinden, B.Carpenter
[7] Fix | Delete
and L.Masinter, December 1999.
[8] Fix | Delete
[9] Fix | Delete
RFC 2396: "Uniform Resource Identifiers (URI)": Generic Syntax by T.
[10] Fix | Delete
Berners-Lee, R. Fielding, and L. Masinter, August 1998.
[11] Fix | Delete
[12] Fix | Delete
RFC 2368: "The mailto URL scheme", by P. Hoffman, L. Masinter, J. Zawinski, July 1998.
[13] Fix | Delete
[14] Fix | Delete
RFC 1808: "Relative Uniform Resource Locators", by R. Fielding, UC Irvine, June
[15] Fix | Delete
1995.
[16] Fix | Delete
[17] Fix | Delete
RFC 1738: "Uniform Resource Locators (URL)" by T. Berners-Lee, L. Masinter, M.
[18] Fix | Delete
McCahill, December 1994
[19] Fix | Delete
[20] Fix | Delete
RFC 3986 is considered the current standard and any future changes to
[21] Fix | Delete
urlparse module should conform with it. The urlparse module is
[22] Fix | Delete
currently not entirely compliant with this RFC due to de facto
[23] Fix | Delete
scenarios for parsing, and for backward compatibility purposes, some
[24] Fix | Delete
parsing quirks from older RFCs are retained. The testcases in
[25] Fix | Delete
test_urlparse.py provide a good indicator of parsing behavior.
[26] Fix | Delete
[27] Fix | Delete
"""
[28] Fix | Delete
[29] Fix | Delete
import re
[30] Fix | Delete
[31] Fix | Delete
# Public names exported by ``from urlparse import *``.
__all__ = [
    "urlparse",
    "urlunparse",
    "urljoin",
    "urldefrag",
    "urlsplit",
    "urlunsplit",
    "parse_qs",
    "parse_qsl",
]
[33] Fix | Delete
[34] Fix | Delete
# Scheme classification tables.  The empty string '' stands for "no scheme
# given", i.e. the behaviour applied by default.

# Schemes for which urljoin() resolves relative references.
uses_relative = [
    'ftp', 'http', 'gopher', 'nntp', 'imap', 'wais', 'file', 'https',
    'shttp', 'mms', 'prospero', 'rtsp', 'rtspu', '', 'sftp', 'svn',
    'svn+ssh',
]

# Schemes whose URLs carry a '//netloc' part.
uses_netloc = [
    'ftp', 'http', 'gopher', 'nntp', 'telnet', 'imap', 'wais', 'file',
    'mms', 'https', 'shttp', 'snews', 'prospero', 'rtsp', 'rtspu',
    'rsync', '', 'svn', 'svn+ssh', 'sftp', 'nfs', 'git', 'git+ssh',
]

# Schemes for which urlparse() splits ';params' off the path.
uses_params = [
    'ftp', 'hdl', 'prospero', 'http', 'imap', 'https', 'shttp', 'rtsp',
    'rtspu', 'sip', 'sips', 'mms', '', 'sftp', 'tel',
]

# The next three lists are no longer consulted by this module.  They are
# undocumented, but their names look public, so they are kept for
# backwards compatibility.
non_hierarchical = [
    'gopher', 'hdl', 'mailto', 'news', 'telnet', 'wais', 'imap', 'snews',
    'sip', 'sips',
]
uses_query = [
    'http', 'wais', 'imap', 'https', 'shttp', 'mms', 'gopher', 'rtsp',
    'rtspu', 'sip', 'sips', '',
]
uses_fragment = [
    'ftp', 'hdl', 'http', 'gopher', 'news', 'nntp', 'wais', 'https',
    'shttp', 'snews', 'file', 'prospero', '',
]

# Every character that may appear in a scheme name.
scheme_chars = ('abcdefghijklmnopqrstuvwxyz' +
                'ABCDEFGHIJKLMNOPQRSTUVWXYZ' +
                '0123456789' +
                '+-.')

# urlsplit() empties _parse_cache once it holds this many entries.
MAX_CACHE_SIZE = 20
_parse_cache = {}
[65] Fix | Delete
[66] Fix | Delete
def clear_cache():
    """Empty the module-level _parse_cache dictionary in place."""
    _parse_cache.clear()
[69] Fix | Delete
[70] Fix | Delete
[71] Fix | Delete
class ResultMixin(object):
    """Mixin that derives user, password, host and port from ``self.netloc``.

    The host class only has to expose a ``netloc`` string attribute.
    """

    @property
    def username(self):
        """Text before the first ':' of the userinfo, or None without '@'."""
        location = self.netloc
        if "@" not in location:
            return None
        credentials = location.rsplit("@", 1)[0]
        # split() hands back the whole string when there is no ':'.
        return credentials.split(":", 1)[0]

    @property
    def password(self):
        """Text after the first ':' of the userinfo, or None if absent."""
        location = self.netloc
        if "@" in location:
            pieces = location.rsplit("@", 1)[0].split(":", 1)
            if len(pieces) == 2:
                return pieces[1]
        return None

    @property
    def hostname(self):
        """Lower-cased host name (brackets stripped), or None if empty."""
        host = self.netloc.split('@')[-1]
        if '[' in host and ']' in host:
            # Bracketed literal: keep what sits between '[' and ']'.
            return host.split(']')[0][1:].lower()
        if ':' in host:
            return host.split(':')[0].lower()
        if host == '':
            return None
        return host.lower()

    @property
    def port(self):
        """Port as an int in 0..65535, or None if missing or out of range.

        int() raises ValueError when the port text is not a decimal number.
        """
        tail = self.netloc.split('@')[-1].split(']')[-1]
        if ':' not in tail:
            return None
        digits = tail.split(':')[1]
        if not digits:
            return None
        number = int(digits, 10)
        # Only hand back legal port numbers.
        if 0 <= number <= 65535:
            return number
        return None
[116] Fix | Delete
[117] Fix | Delete
from collections import namedtuple
[118] Fix | Delete
[119] Fix | Delete
class SplitResult(namedtuple('SplitResult', 'scheme netloc path query fragment'), ResultMixin):
    """Five-field named tuple combined with the ResultMixin accessors."""

    # No per-instance __dict__: the tuple fields are the only state.
    __slots__ = ()

    def geturl(self):
        """Reassemble this result into a URL string with urlunsplit()."""
        return urlunsplit(self)
[125] Fix | Delete
[126] Fix | Delete
[127] Fix | Delete
class ParseResult(namedtuple('ParseResult', 'scheme netloc path params query fragment'), ResultMixin):
    """Six-field named tuple combined with the ResultMixin accessors."""

    # No per-instance __dict__: the tuple fields are the only state.
    __slots__ = ()

    def geturl(self):
        """Reassemble this result into a URL string with urlunparse()."""
        return urlunparse(self)
[133] Fix | Delete
[134] Fix | Delete
[135] Fix | Delete
def urlparse(url, scheme='', allow_fragments=True):
    """Split a URL into six components.

    The layout recognised is
    <scheme>://<netloc>/<path>;<params>?<query>#<fragment>
    and the result is a ParseResult
    (scheme, netloc, path, params, query, fragment).
    Components are not broken down further (netloc stays a single
    string) and % escapes are not expanded.
    """
    scheme, netloc, url, query, fragment = urlsplit(url, scheme,
                                                    allow_fragments)
    params = ''
    # Only schemes listed in uses_params get ';params' peeled off the path.
    if scheme in uses_params and ';' in url:
        url, params = _splitparams(url)
    return ParseResult(scheme, netloc, url, params, query, fragment)
[148] Fix | Delete
[149] Fix | Delete
def _splitparams(url):
    """Return (path, params), splitting at the first ';' of the last segment.

    When *url* contains a '/', only a ';' at or after the last '/' counts;
    if there is none, (url, '') is returned.  Without any '/', the split
    happens at the first ';' and no check for a missing ';' is made.
    """
    last_slash = url.rfind('/')
    if last_slash >= 0:
        semi = url.find(';', last_slash)
        if semi < 0:
            return url, ''
    else:
        semi = url.find(';')
    return url[:semi], url[semi+1:]
[157] Fix | Delete
[158] Fix | Delete
def _splitnetloc(url, start=0):
    """Return (netloc, rest) for *url*, scanning from index *start*.

    The netloc ends at the earliest '/', '?' or '#' found at or after
    *start*, or at the end of the string when none of them occurs.
    """
    found = [pos for pos in (url.find(ch, start) for ch in '/?#')
             if pos >= 0]
    # The earliest delimiter wins; the order they are searched in is
    # irrelevant.
    end = min(found) if found else len(url)
    return url[start:end], url[end:]
[165] Fix | Delete
[166] Fix | Delete
def _checknetloc(netloc):
    """Reject unicode netlocs that gain URL delimiters under NFKC.

    Empty and non-unicode values are accepted without inspection.
    Raises ValueError when NFKC normalization of the netloc (ignoring the
    '@', ':', '#' and '?' it already contains) changes it and the
    normalized text contains any of '/', '?', '#', '@' or ':'.
    """
    if not netloc or not isinstance(netloc, unicode):
        return
    # Looking for characters like \u2100 that expand to 'a/c'.
    # IDNA uses NFKC equivalence, so normalize for this check.
    import unicodedata
    # Drop the delimiters that are already present, but keep the text
    # around them.
    stripped = netloc
    for present in (u'@', u':', u'#', u'?'):
        stripped = stripped.replace(present, u'')
    normalized = unicodedata.normalize('NFKC', stripped)
    if stripped == normalized:
        return
    if any(c in normalized for c in '/?#@:'):
        raise ValueError("netloc %r contains invalid characters "
                         "under NFKC normalization"
                         % netloc)
[184] Fix | Delete
[185] Fix | Delete
def urlsplit(url, scheme='', allow_fragments=True):
    """Split a URL into five components.

    The layout recognised is
    <scheme>://<netloc>/<path>?<query>#<fragment>
    and the result is a SplitResult
    (scheme, netloc, path, query, fragment).
    Components are not broken down further (netloc stays a single
    string) and % escapes are not expanded.

    Results are remembered in _parse_cache, which is emptied once it
    holds MAX_CACHE_SIZE entries.  ValueError is raised when the netloc
    contains only one of '[' and ']', and propagates from _checknetloc().
    """
    allow_fragments = bool(allow_fragments)
    key = url, scheme, allow_fragments, type(url), type(scheme)
    hit = _parse_cache.get(key, None)
    if hit:
        return hit
    if len(_parse_cache) >= MAX_CACHE_SIZE:  # avoid runaway growth
        clear_cache()
    netloc = query = fragment = ''
    colon = url.find(':')
    if colon > 0:
        prefix, rest = url[:colon], url[colon+1:]
        if prefix == 'http':
            # Common case: accepted without inspecting what follows the
            # colon, so even 'http:80' yields scheme 'http'.
            scheme, url = prefix.lower(), rest
        elif all(c in scheme_chars for c in prefix):
            # Make sure "rest" is not actually a port number, in which
            # case the would-be scheme is really part of the path.
            if not rest or any(c not in '0123456789' for c in rest):
                scheme, url = prefix.lower(), rest

    if url[:2] == '//':
        netloc, url = _splitnetloc(url, 2)
        has_open = '[' in netloc
        has_close = ']' in netloc
        if (has_open and not has_close) or (has_close and not has_open):
            raise ValueError("Invalid IPv6 URL")
    if allow_fragments and '#' in url:
        url, fragment = url.split('#', 1)
    if '?' in url:
        url, query = url.split('?', 1)
    _checknetloc(netloc)
    result = SplitResult(scheme, netloc, url, query, fragment)
    _parse_cache[key] = result
    return result
[241] Fix | Delete
[242] Fix | Delete
def urlunparse(data):
    """Rebuild a URL string from a six-item (scheme, netloc, path, params,
    query, fragment) sequence.

    The result may differ slightly from, while being equivalent to, the
    URL that was originally parsed if that URL had redundant delimiters,
    e.g. a '?' with an empty query.
    """
    scheme, netloc, path, params, query, fragment = data
    if params:
        # Fold the params back onto the path before delegating.
        path = "%s;%s" % (path, params)
    return urlunsplit((scheme, netloc, path, query, fragment))
[251] Fix | Delete
[252] Fix | Delete
def urlunsplit(data):
    """Rebuild a URL string from the five items urlsplit() returns.

    *data* may be any five-item iterable of (scheme, netloc, path, query,
    fragment).  The result may differ slightly from, while being
    equivalent to, the URL that was originally parsed if that URL had
    unnecessary delimiters (for example, a '?' with an empty query).
    """
    scheme, netloc, result, query, fragment = data
    needs_authority = netloc or (
        scheme and scheme in uses_netloc and result[:2] != '//')
    if needs_authority:
        # A non-empty path must start with '/' once it follows a netloc.
        if result and result[:1] != '/':
            result = '/' + result
        result = '//' + (netloc or '') + result
    if scheme:
        result = scheme + ':' + result
    if query:
        result = result + '?' + query
    if fragment:
        result = result + '#' + fragment
    return result
[269] Fix | Delete
[270] Fix | Delete
def urljoin(base, url, allow_fragments=True):
    """Resolve *url*, which may be relative, against the base URL *base*.

    A false *base* returns *url* unchanged, and a false *url* returns
    *base*.  *url* is also returned unchanged when its scheme differs from
    the base's scheme or is not listed in uses_relative.
    """
    if not base:
        return url
    if not url:
        return base
    (bscheme, bnetloc, bpath,
     bparams, bquery, bfragment) = urlparse(base, '', allow_fragments)
    (scheme, netloc, path,
     params, query, fragment) = urlparse(url, bscheme, allow_fragments)
    if scheme != bscheme or scheme not in uses_relative:
        return url
    if scheme in uses_netloc:
        if netloc:
            # The reference carries its own authority: nothing to merge.
            return urlunparse((scheme, netloc, path,
                               params, query, fragment))
        netloc = bnetloc
    if path[:1] == '/':
        # An absolute path replaces the base path entirely.
        return urlunparse((scheme, netloc, path,
                           params, query, fragment))
    if not path and not params:
        # Nothing but query and/or fragment given: reuse the base path.
        path = bpath
        params = bparams
        if not query:
            query = bquery
        return urlunparse((scheme, netloc, path,
                           params, query, fragment))
    # Relative path: swap the base's last segment for the reference.
    segments = bpath.split('/')[:-1] + path.split('/')
    # XXX The stuff below is bogus in various ways...
    if segments[-1] == '.':
        segments[-1] = ''
    segments = [seg for seg in segments if seg != '.']
    # Collapse "<name>/.." pairs one at a time, rescanning from the start
    # after each removal; the first and last segments are never the '..'
    # being examined.
    collapsed = True
    while collapsed:
        collapsed = False
        for idx in range(1, len(segments) - 1):
            if (segments[idx] == '..'
                    and segments[idx - 1] not in ('', '..')):
                del segments[idx - 1:idx + 1]
                collapsed = True
                break
    if segments == ['', '..']:
        segments[-1] = ''
    elif len(segments) >= 2 and segments[-1] == '..':
        segments[-2:] = ['']
    return urlunparse((scheme, netloc, '/'.join(segments),
                       params, query, fragment))
[321] Fix | Delete
[322] Fix | Delete
def urldefrag(url):
    """Strip the fragment from *url*.

    Returns a (defragmented_url, fragment) tuple.  A URL without any '#'
    is returned unchanged, paired with the empty string.
    """
    if '#' not in url:
        return url, ''
    scheme, netloc, path, params, query, fragment = urlparse(url)
    stripped = urlunparse((scheme, netloc, path, params, query, ''))
    return stripped, fragment
[335] Fix | Delete
[336] Fix | Delete
# Choose the _is_unicode() implementation once, at import time, depending
# on whether the interpreter provides a ``unicode`` builtin.
try:
    unicode
except NameError:
    def _is_unicode(x):
        """Without a unicode type nothing qualifies: always 0."""
        return 0
else:
    def _is_unicode(x):
        """Tell whether *x* is an instance of ``unicode``."""
        return isinstance(x, unicode)
[344] Fix | Delete
[345] Fix | Delete
# unquote method for parse_qs and parse_qsl
[346] Fix | Delete
# Cannot use directly from urllib as it would create a circular reference
[347] Fix | Delete
# because urllib uses urlparse methods (urljoin). If you update this function,
[348] Fix | Delete
# update it also in urllib. This code duplication does not exist in Python 3.
[349] Fix | Delete
[350] Fix | Delete
# Every hexadecimal digit, in both letter cases.
_hexdig = '0123456789ABCDEFabcdef'
# Two-hex-digit text (any mix of cases) -> the character with that code.
_hextochr = {
    hi + lo: chr(int(hi + lo, 16))
    for hi in _hexdig
    for lo in _hexdig
}
# Captures runs of ASCII characters so that split() keeps them.
_asciire = re.compile('([\x00-\x7f]+)')
[354] Fix | Delete
[355] Fix | Delete
def unquote(s):
    """Replace %xx escapes by the character they encode.

    unquote('abc%20def') -> 'abc def'.

    A '%' that is not followed by two hexadecimal digits is left in place.
    For unicode input only the ASCII runs are unescaped; the result of
    each run is decoded as latin1 and the non-ASCII text between runs is
    copied through unchanged.
    """
    if _is_unicode(s):
        if '%' not in s:
            return s
        # Odd indexes hold the captured ASCII runs, even indexes the text
        # in between.
        pieces = _asciire.split(s)
        out = [pieces[0]]
        for idx in range(1, len(pieces), 2):
            out.append(unquote(str(pieces[idx])).decode('latin1'))
            out.append(pieces[idx + 1])
        return ''.join(out)

    chunks = s.split('%')
    # Fast path: no '%' at all.
    if len(chunks) == 1:
        return s
    out = [chunks[0]]
    for chunk in chunks[1:]:
        decoded = _hextochr.get(chunk[:2])
        if decoded is None:
            # Not a valid escape: put the '%' back untouched.
            out.extend(('%', chunk))
        else:
            out.extend((decoded, chunk[2:]))
    return ''.join(out)
[382] Fix | Delete
[383] Fix | Delete
def parse_qs(qs, keep_blank_values=0, strict_parsing=0, max_num_fields=None):
    """Parse a query string into a dictionary of value lists.

    Arguments:

    qs: percent-encoded query string to be parsed

    keep_blank_values: flag indicating whether blank values in
        percent-encoded queries should be treated as blank strings.
        A true value keeps them as blank strings.  The default false
        value ignores them, as if they were not included.

    strict_parsing: flag indicating what to do with parsing errors.
        If false (the default), errors are silently ignored.
        If true, errors raise a ValueError exception.

    max_num_fields: int. If set, a ValueError is raised when
        parse_qsl() would read more than this many fields.

    Returns a dict mapping each name to the list of its values, in the
    order parse_qsl() produced them.
    """
    grouped = {}
    fields = parse_qsl(qs, keep_blank_values, strict_parsing,
                       max_num_fields)
    for name, value in fields:
        grouped.setdefault(name, []).append(value)
    return grouped
[412] Fix | Delete
[413] Fix | Delete
def parse_qsl(qs, keep_blank_values=0, strict_parsing=0, max_num_fields=None):
    """Parse a query string into a list of (name, value) pairs.

    Arguments:

    qs: percent-encoded query string to be parsed

    keep_blank_values: flag indicating whether blank values in
        percent-encoded queries should be treated as blank strings.  A
        true value keeps them as blank strings.  The default false value
        ignores them, as if they were not included.

    strict_parsing: flag indicating what to do with parsing errors.  If
        false (the default), errors are silently ignored.  If true,
        errors raise a ValueError exception.

    max_num_fields: int. If set, a ValueError is raised when the query
        holds more than this many fields.

    Fields are separated by '&' or ';'.  In both name and value, '+' is
    turned into a space before %xx escapes are expanded with unquote().

    Returns a list of (name, value) tuples in the order they appear.
    """
    # If max_num_fields is defined then check that the number of fields
    # does not exceed it.  This prevents a memory exhaustion DOS attack
    # via post bodies with many fields.
    if max_num_fields is not None:
        num_fields = 1 + qs.count('&') + qs.count(';')
        if max_num_fields < num_fields:
            raise ValueError('Max number of fields exceeded')

    pairs = [s2 for s1 in qs.split('&') for s2 in s1.split(';')]
    r = []
    for name_value in pairs:
        if not name_value and not strict_parsing:
            continue
        nv = name_value.split('=', 1)
        if len(nv) != 2:
            if strict_parsing:
                # Call form of raise: valid syntax on Python 2 and 3 alike.
                raise ValueError("bad query field: %r" % (name_value,))
            # Handle case of a control-name with no equal sign
            if keep_blank_values:
                nv.append('')
            else:
                continue
        if len(nv[1]) or keep_blank_values:
            name = unquote(nv[0].replace('+', ' '))
            value = unquote(nv[1].replace('+', ' '))
            r.append((name, value))

    return r
[463] Fix | Delete
[464] Fix | Delete
It is recommended that you Edit text format, this type of Fix handles quite a lot in one request
Function