Skip to content

Commit

Permalink
[googledrive] Use redirected URLs for source format (closes #18877, closes #23919, closes #24689, closes #26565)
Browse files Browse the repository at this point in the history
  • Loading branch information
dstftw committed Sep 13, 2020
1 parent 95c9810 commit e71763a
Showing 1 changed file with 19 additions and 8 deletions.
27 changes: 19 additions & 8 deletions youtube_dl/extractor/googledrive.py
Original file line number Diff line number Diff line change
Expand Up @@ -220,19 +220,27 @@ def _real_extract(self, url):
'id': video_id,
'export': 'download',
})
urlh = self._request_webpage(
source_url, video_id, note='Requesting source file',
errnote='Unable to request source file', fatal=False)

def request_source_file(source_url, kind):
return self._request_webpage(
source_url, video_id, note='Requesting %s file' % kind,
errnote='Unable to request %s file' % kind, fatal=False)
urlh = request_source_file(source_url, 'source')
if urlh:
def add_source_format(src_url):
def add_source_format(urlh):
formats.append({
'url': src_url,
# Use redirect URLs as download URLs in order to calculate
# correct cookies in _calc_cookies.
# Using original URLs may result in a redirect loop because
# google.com cookies are mistakenly used for googleusercontent.com
# redirect URLs (see #23919).
'url': urlh.geturl(),
'ext': determine_ext(title, 'mp4').lower(),
'format_id': 'source',
'quality': 1,
})
if urlh.headers.get('Content-Disposition'):
add_source_format(source_url)
add_source_format(urlh)
else:
confirmation_webpage = self._webpage_read_content(
urlh, url, video_id, note='Downloading confirmation page',
Expand All @@ -242,9 +250,12 @@ def add_source_format(src_url):
r'confirm=([^&"\']+)', confirmation_webpage,
'confirmation code', fatal=False)
if confirm:
add_source_format(update_url_query(source_url, {
confirmed_source_url = update_url_query(source_url, {
'confirm': confirm,
}))
})
urlh = request_source_file(confirmed_source_url, 'confirmed source')
if urlh and urlh.headers.get('Content-Disposition'):
add_source_format(urlh)

if not formats:
reason = self._search_regex(
Expand Down

0 comments on commit e71763a

Please sign in to comment.