diff --git a/requests/models.py b/requests/models.py index 97237e77..8d33c32b 100644 --- a/requests/models.py +++ b/requests/models.py @@ -27,7 +27,7 @@ from .exceptions import ( Timeout, URLRequired, TooManyRedirects, HTTPError, ConnectionError) from .utils import ( get_unicode_from_response, stream_decode_response_unicode, - decode_gzip, stream_decode_gzip, guess_filename) + decode_gzip, stream_decode_gzip, guess_filename, requote_path) REDIRECT_STATI = (codes.moved, codes.found, codes.other, codes.temporary_moved) @@ -214,7 +214,7 @@ class Request(object): # Facilitate non-RFC2616-compliant 'location' headers # (e.g. '/path/to/resource' instead of 'http://domain.tld/path/to/resource') if not urlparse(url).netloc: - url = urljoin(r.url, urllib.quote(urllib.unquote(url))) + url = urljoin(r.url, url) # http://www.w3.org/Protocols/rfc2616/rfc2616-sec10.html#sec10.3.4 if r.status_code is codes.see_other: @@ -299,7 +299,7 @@ class Request(object): if isinstance(path, unicode): path = path.encode('utf-8') - path = urllib.quote(urllib.unquote(path)) + path = requote_path(path) url = str(urlunparse([ scheme, netloc, path, params, query, fragment ])) diff --git a/requests/utils.py b/requests/utils.py index 0249e9d6..a24327e9 100644 --- a/requests/utils.py +++ b/requests/utils.py @@ -16,6 +16,7 @@ import os import random import re import zlib +import urllib from urllib2 import parse_http_list as _parse_list_header @@ -367,3 +368,14 @@ def stream_decode_gzip(iterator): yield rv except zlib.error: pass + + +def requote_path(path): + """Re-quote the given URL path component. + + This function passes the given path through an unquote/quote cycle to + ensure that it is fully and consistenty quoted. + """ + parts = path.split("/") + parts = (urllib.quote(urllib.unquote(part), safe="") for part in parts) + return "/".join(parts)