Timeout, URLRequired, TooManyRedirects, HTTPError, ConnectionError)
from .utils import (
get_unicode_from_response, stream_decode_response_unicode,
- decode_gzip, stream_decode_gzip, guess_filename)
+ decode_gzip, stream_decode_gzip, guess_filename, requote_path)
REDIRECT_STATI = (codes.moved, codes.found, codes.other, codes.temporary_moved)
# Facilitate non-RFC2616-compliant 'location' headers
# (e.g. '/path/to/resource' instead of 'http://domain.tld/path/to/resource')
if not urlparse(url).netloc:
- url = urljoin(r.url, urllib.quote(urllib.unquote(url)))
+ url = urljoin(r.url, requote_path(url))
# http://www.w3.org/Protocols/rfc2616/rfc2616-sec10.html#sec10.3.4
if r.status_code is codes.see_other:
if isinstance(path, unicode):
path = path.encode('utf-8')
- path = urllib.quote(urllib.unquote(path))
+ path = requote_path(path)
url = str(urlunparse([ scheme, netloc, path, params, query, fragment ]))
import random
import re
import zlib
+import urllib
from urllib2 import parse_http_list as _parse_list_header
yield rv
except zlib.error:
pass
+
+
+def requote_path(path):
+ """Re-quote the given URL path component.
+
+ This function passes the given path through an unquote/quote cycle to
+ ensure that it is fully and consistently quoted.
+ """
+ parts = path.split("/")
+ parts = (urllib.quote(urllib.unquote(part), safe="") for part in parts)
+ return "/".join(parts)