Compare commits
No commits in common. "271ac8f80f5761da43f5345bec6a923b25677cf1" and "a2c4691090c5a8a6302a4234aad1d867b0f8c4a6" have entirely different histories.
271ac8f80f
...
a2c4691090
|
@ -123,21 +123,15 @@ def is_ascii(string):
|
|||
|
||||
|
||||
def sanitize_url(url):
|
||||
# make sure the url is unicode, i.e. not bytes
|
||||
if isinstance(url, bytes):
|
||||
url = url.decode()
|
||||
|
||||
# make sure there's a protocol (http://)
|
||||
if url.split(':', 1)[0] not in PROTOCOL:
|
||||
url = 'http://' + url
|
||||
|
||||
# turns out some websites have really badly fomatted urls (fix http:/badurl)
|
||||
url = re.sub('^(https?):/([^/])', r'\1://\2', url)
|
||||
|
||||
# escape spaces
|
||||
url = url.replace(' ', '%20')
|
||||
|
||||
# escape non-ascii unicode characters
|
||||
# Escape non-ascii unicode characters
|
||||
# https://stackoverflow.com/a/4391299
|
||||
parts = list(urlparse(url))
|
||||
|
||||
|
|
Loading…
Reference in New Issue