[ie/vimeo] Support browser impersonation (#10327)

Closes #10325
Authored by: bashonly
pull/10075/head
bashonly 6 months ago committed by GitHub
parent 1d6ab17d07
commit d4b99a2333
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

@ -316,7 +316,8 @@ class PatreonIE(PatreonBaseIE):
r'(https(?:%3A%2F%2F|://)player\.vimeo\.com.+app_id(?:=|%3D)+\d+)', r'(https(?:%3A%2F%2F|://)player\.vimeo\.com.+app_id(?:=|%3D)+\d+)',
traverse_obj(attributes, ('embed', 'html', {str})), 'vimeo url', fatal=False) or '') traverse_obj(attributes, ('embed', 'html', {str})), 'vimeo url', fatal=False) or '')
if url_or_none(v_url) and self._request_webpage( if url_or_none(v_url) and self._request_webpage(
v_url, video_id, 'Checking Vimeo embed URL', headers=headers, fatal=False, errnote=False): v_url, video_id, 'Checking Vimeo embed URL', headers=headers,
fatal=False, errnote=False, expected_status=429): # 429 is TLS fingerprint rejection
entries.append(self.url_result( entries.append(self.url_result(
VimeoIE._smuggle_referrer(v_url, 'https://patreon.com/'), VimeoIE._smuggle_referrer(v_url, 'https://patreon.com/'),
VimeoIE, url_transparent=True)) VimeoIE, url_transparent=True))

@ -829,21 +829,33 @@ class VimeoIE(VimeoBaseInfoExtractor):
url = 'https://vimeo.com/' + video_id url = 'https://vimeo.com/' + video_id
self._try_album_password(url) self._try_album_password(url)
is_secure = urllib.parse.urlparse(url).scheme == 'https'
try: try:
# Retrieve video webpage to extract further information # Retrieve video webpage to extract further information
webpage, urlh = self._download_webpage_handle( webpage, urlh = self._download_webpage_handle(
url, video_id, headers=headers) url, video_id, headers=headers, impersonate=is_secure)
redirect_url = urlh.url redirect_url = urlh.url
except ExtractorError as ee: except ExtractorError as error:
if isinstance(ee.cause, HTTPError) and ee.cause.status == 403: if not isinstance(error.cause, HTTPError) or error.cause.status not in (403, 429):
errmsg = ee.cause.response.read() raise
errmsg = error.cause.response.read()
if b'Because of its privacy settings, this video cannot be played here' in errmsg: if b'Because of its privacy settings, this video cannot be played here' in errmsg:
raise ExtractorError( raise ExtractorError(
'Cannot download embed-only video without embedding ' 'Cannot download embed-only video without embedding URL. Please call yt-dlp '
'URL. Please call yt-dlp with the URL of the page ' 'with the URL of the page that embeds this video.', expected=True)
'that embeds this video.', # 403 == vimeo.com TLS fingerprint or DC IP block; 429 == player.vimeo.com TLS FP block
expected=True) status = error.cause.status
raise dcip_msg = 'If you are using a data center IP or VPN/proxy, your IP may be blocked'
if target := error.cause.response.extensions.get('impersonate'):
raise ExtractorError(
f'Got HTTP Error {status} when using impersonate target "{target}". {dcip_msg}')
elif not is_secure:
raise ExtractorError(f'Got HTTP Error {status}. {dcip_msg}', expected=True)
raise ExtractorError(
'This request has been blocked due to its TLS fingerprint. Install a '
'required impersonation dependency if possible, or else if you are okay with '
f'{self._downloader._format_err("compromising your security/cookies", "light red")}, '
f'try replacing "https:" with "http:" in the input URL. {dcip_msg}.', expected=True)
if '://player.vimeo.com/video/' in url: if '://player.vimeo.com/video/' in url:
config = self._search_json( config = self._search_json(

Loading…
Cancel
Save