Skip to content

Commit

Permalink
[core] Remove Cookie header on redirect to prevent leaks
Browse files Browse the repository at this point in the history
Adated from yt-dlp/yt-dlp-GHSA-v8mc-9377-rwjj/pull/1/commits/101caac
Thx coletdjnz
  • Loading branch information
dirkf committed Jul 18, 2023
1 parent 46fde7c commit b383be9
Show file tree
Hide file tree
Showing 2 changed files with 36 additions and 4 deletions.
32 changes: 30 additions & 2 deletions test/test_http.py
Original file line number Diff line number Diff line change
Expand Up @@ -183,6 +183,11 @@ def gzip_compress(p):
self._method('GET')
elif self.path.startswith('/headers'):
self._headers()
elif self.path.startswith('/308-to-headers'):
self.send_response(308)
self.send_header('Location', '/headers')
self.send_header('Content-Length', '0')
self.end_headers()
elif self.path == '/trailing_garbage':
payload = b'<html><video src="/vid.mp4" /></html>'
compressed = gzip_compress(payload) + b'trailing garbage'
Expand Down Expand Up @@ -385,8 +390,31 @@ def test_cookiejar(self):
ydl.cookiejar.set_cookie(compat_http_cookiejar_Cookie(
0, 'test', 'ytdl', None, False, '127.0.0.1', True,
False, '/headers', True, False, None, False, None, None, {}))
data = ydl.urlopen(sanitized_Request(self._test_url('headers'))).read()
self.assertIn(b'Cookie: test=ytdl', data)
data = ydl.urlopen(sanitized_Request(
self._test_url('headers'))).read().decode('utf-8')
self.assertIn('Cookie: test=ytdl', data)

def test_passed_cookie_header(self):
# We should accept a Cookie header being passed as in normal headers and handle it appropriately.
with FakeYDL() as ydl:
# Specified Cookie header should be used
res = ydl.urlopen(sanitized_Request(
self._test_url('headers'), headers={'Cookie': 'test=test'})).read().decode('utf-8')
self.assertIn('Cookie: test=test', res)

# Specified Cookie header should be removed on any redirect
res = ydl.urlopen(sanitized_Request(
self._test_url('308-to-headers'), headers={'Cookie': 'test=test'})).read().decode('utf-8')
self.assertNotIn('Cookie: test=test', res)

# Specified Cookie header should override global cookiejar for that request
ydl.cookiejar.set_cookie(compat_http_cookiejar_Cookie(
0, 'test', 'ytdlp', None, False, '127.0.0.1', True,
False, '/headers', True, False, None, False, None, None, {}))
data = ydl.urlopen(sanitized_Request(
self._test_url('headers'), headers={'Cookie': 'test=test'})).read().decode('utf-8')
self.assertNotIn('Cookie: test=ytdlp', data)
self.assertIn('Cookie: test=test', data)

def test_no_compression_compat_header(self):
with FakeYDL() as ydl:
Expand Down
8 changes: 6 additions & 2 deletions youtube_dl/utils.py
Original file line number Diff line number Diff line change
Expand Up @@ -2968,7 +2968,6 @@ def redirect_request(self, req, fp, code, msg, headers, newurl):

new_method = req.get_method()
new_data = req.data
remove_headers = []

# On python 2 urlh.geturl() may sometimes return redirect URL
# as a byte string instead of unicode. This workaround forces
Expand All @@ -2981,6 +2980,11 @@ def redirect_request(self, req, fp, code, msg, headers, newurl):
# but it is kept for compatibility with other callers.
newurl = newurl.replace(' ', '%20')

# Technically the Cookie header should be in unredirected_hdrs;
# however in practice some may set it in normal headers anyway.
# We will remove it here to prevent any leaks.
remove_headers = ['Cookie']

# A 303 must either use GET or HEAD for subsequent request
# https://datatracker.ietf.org/doc/html/rfc7231#section-6.4.4
if code == 303 and req.get_method() != 'HEAD':
Expand All @@ -2999,7 +3003,7 @@ def redirect_request(self, req, fp, code, msg, headers, newurl):

# NB: don't use dict comprehension for python 2.6 compatibility
new_headers = dict((k, v) for k, v in req.header_items()
if k.lower() not in remove_headers)
if k.title() not in remove_headers)

return compat_urllib_request.Request(
newurl, headers=new_headers, origin_req_host=req.origin_req_host,
Expand Down

0 comments on commit b383be9

Please sign in to comment.