diff -r f9763c363cc3 -r dd852a0f92d6 Lib/urllib.py --- a/Lib/urllib.py Mon Mar 21 10:30:07 2011 +0100 +++ b/Lib/urllib.py Thu Mar 24 08:07:45 2011 -0700 @@ -638,10 +638,19 @@ newurl = headers['uri'] else: return + + # In case the server sent a relative URL, join with original: + newurl = basejoin(self.type + ":" + url, newurl) + + # For security reasons we do not allow redirects to protocols + # other than HTTP or HTTPS. + newurl_lower = newurl.lower() + if not (newurl_lower.startswith('http://') or + newurl_lower.startswith('https://')): + return + void = fp.read() fp.close() - # In case the server sent a relative URL, join with original: - newurl = basejoin(self.type + ":" + url, newurl) return self.open(newurl) def http_error_301(self, url, fp, errcode, errmsg, headers, data=None): diff -r f9763c363cc3 -r dd852a0f92d6 Lib/urllib2.py --- a/Lib/urllib2.py Mon Mar 21 10:30:07 2011 +0100 +++ b/Lib/urllib2.py Thu Mar 24 08:07:45 2011 -0700 @@ -555,6 +555,13 @@ return newurl = urlparse.urljoin(req.get_full_url(), newurl) + # For security reasons we do not allow redirects to protocols + # other than HTTP or HTTPS. + newurl_lower = newurl.lower() + if not (newurl_lower.startswith('http://') or + newurl_lower.startswith('https://')): + return + # XXX Probably want to forget about the state of the current # request, although that might interact poorly with other # handlers that also use handler-specific request attributes