# yt-dlp/yt_dlp/extractor/vimeo.py

# coding: utf-8
from __future__ import unicode_literals

import base64
import functools
import re
import itertools

from .common import InfoExtractor
from ..compat import (
    compat_kwargs,
    compat_HTTPError,
    compat_str,
    compat_urlparse,
)
from ..utils import (
    clean_html,
    determine_ext,
    ExtractorError,
    get_element_by_class,
    HEADRequest,
    js_to_json,
    int_or_none,
    merge_dicts,
    OnDemandPagedList,
    parse_filesize,
    parse_iso8601,
    parse_qs,
    sanitized_Request,
    smuggle_url,
    str_or_none,
    try_get,
    unified_timestamp,
    unsmuggle_url,
    urlencode_postdata,
    urljoin,
    unescapeHTML,
    urlhandle_detect_ext,
)


class VimeoBaseInfoExtractor(InfoExtractor):
    _NETRC_MACHINE = 'vimeo'
    _LOGIN_REQUIRED = False
    _LOGIN_URL = 'https://vimeo.com/log_in'

    def _login(self):
        """Log in to Vimeo with the credentials from `_get_login_info`.

        Returns without doing anything when no username is available, unless
        `_LOGIN_REQUIRED` is set, in which case an expected ExtractorError is
        raised. An HTTP 418 answer to the login request is reported as bad
        credentials; any other ExtractorError raised by the request is
        reported as a generic login failure.
        """
        username, password = self._get_login_info()
        if username is None:
            if not self._LOGIN_REQUIRED:
                return
            raise ExtractorError('No login info available, needed for using %s.' % self.IE_NAME, expected=True)

        login_page = self._download_webpage(
            self._LOGIN_URL, None, 'Downloading login page')
        token, vuid = self._extract_xsrft_and_vuid(login_page)
        login_form = {
            'action': 'login',
            'email': username,
            'password': password,
            'service': 'vimeo',
            'token': token,
        }
        request_headers = {
            'Content-Type': 'application/x-www-form-urlencoded',
            'Referer': self._LOGIN_URL,
        }
        # Set the vuid cookie taken from the login page before posting the form
        self._set_vimeo_cookie('vuid', vuid)
        try:
            self._download_webpage(
                self._LOGIN_URL, None, 'Logging in',
                data=urlencode_postdata(login_form), headers=request_headers)
        except ExtractorError as e:
            bad_credentials = isinstance(e.cause, compat_HTTPError) and e.cause.code == 418
            if bad_credentials:
                raise ExtractorError(
                    'Unable to log in: bad username or password',
                    expected=True)
            raise ExtractorError('Unable to log in')

    def _get_video_password(self):
        """Return the value of the 'videopassword' param.

        Raises an expected ExtractorError when the param is None.
        """
        video_password = self.get_param('videopassword')
        if video_password is not None:
            return video_password
        raise ExtractorError(
            'This video is protected by a password, use the --video-password option',
            expected=True)

    def _verify_video_password(self, url, video_id, password, token, vuid):
        """Post `password` to the video's '/password' endpoint.

        The 'vuid' cookie is set to `vuid` first, and `token` is sent along
        with the password in the form data. Returns the webpage downloaded
        from `url + '/password'`; a failed request is reported with the
        'Wrong password' error note.
        """
        if url.startswith('http://'):
            # vimeo only supports https now, but the user can give an http url.
            # Only the leading scheme is rewritten (count=1) so that any later
            # 'http://' inside the URL is left untouched.
            url = url.replace('http://', 'https://', 1)
        self._set_vimeo_cookie('vuid', vuid)
        return self._download_webpage(
            url + '/password', video_id, 'Verifying the password',
            'Wrong password', data=urlencode_postdata({
                'password': password,
                'token': token,
            }), headers={
                'Content-Type': 'application/x-www-form-urlencoded',
                'Referer': url,
            })

    def _extract_xsrft_and_vuid(self, webpage):
        """Search `webpage` for the xsrft token and the vuid.

        Returns a `(xsrft, vuid)` tuple.
        """
        xsrft_re = r'(?:(?P<q1>["\'])xsrft(?P=q1)\s*:|xsrft\s*[=:])\s*(?P<q>["\'])(?P<xsrft>.+?)(?P=q)'
        vuid_re = r'["\']vuid["\']\s*:\s*(["\'])(?P<vuid>.+?)\1'
        login_token = self._search_regex(xsrft_re, webpage, 'login token', group='xsrft')
        viewer_uid = self._search_regex(vuid_re, webpage, 'vuid', group='vuid')
        return login_token, viewer_uid

    def _extract_vimeo_config(self, webpage, video_id, *args, **kwargs):
        """Find the `vimeo.config = ...` assignment in `webpage` and parse it as JSON.

        Extra positional and keyword arguments are forwarded to
        `_search_regex`. Returns the parsed config, or None when the search
        produced a falsy result.
        """
        config_json = self._search_regex(
            r'vimeo\.config\s*=\s*(?:({.+?})|_extend\([^,]+,\s+({.+?})\));',
            webpage, 'vimeo config', *args, **compat_kwargs(kwargs))
        if not config_json:
            return None
        return self._parse_json(config_json, video_id)

    def _set_vimeo_cookie(self, name, value):
        """Set the cookie `name` to `value` for the vimeo.com domain."""
        cookie_domain = 'vimeo.com'
        self._set_cookie(cookie_domain, name, value)

    def _vimeo_sort_formats(self, formats):
        """Sort `formats` with a Vimeo-specific field order that leaves out bitrate."""
        # Note: Bitrates are completely broken. Single m3u8 may contain entries in kbps and bps
        # at the same time without actual units specified.
        field_order = ('quality', 'res', 'fps', 'hdr:12', 'source')
        self._sort_formats(formats, field_order)

    def _parse_config(self, config, video_id):
        """Build an info dict from a Vimeo player config.

        `config['video']` and its 'title' are required (a KeyError is raised
        otherwise). Entries of `request.text_tracks` are likewise indexed
        directly for 'lang' and 'url'.

        Formats are collected, in this order, from the progressive files, the
        HLS and DASH manifests of every listed CDN, and the source URL of a
        finished live archive. Subtitles come from the manifests and from the
        config's text tracks. Thumbnails are skipped when the live event's
        status is 'started'.

        Returns a dict with the keys id, title, uploader, uploader_id,
        uploader_url, thumbnails, duration, chapters, formats, subtitles and
        is_live. The formats are not sorted here.
        """
        video_data = config['video']
        video_title = video_data['title']
        live_event = video_data.get('live_event') or {}
        is_live = live_event.get('status') == 'started'
        request = config.get('request') or {}

        formats = []
        subtitles = {}

        # The files mapping may live under either 'video' or 'request'
        config_files = video_data.get('files') or request.get('files') or {}
        for f in (config_files.get('progressive') or []):
            video_url = f.get('url')
            if not video_url:
                continue
            formats.append({
                'url': video_url,
                'format_id': 'http-%s' % f.get('quality'),
                'source_preference': 10,
                'width': int_or_none(f.get('width')),
                'height': int_or_none(f.get('height')),
                'fps': int_or_none(f.get('fps')),
                'tbr': int_or_none(f.get('bitrate')),
            })

        # TODO: fix handling of 308 status code returned for live archive manifest requests
        sep_pattern = r'/sep/video/'
        for files_type in ('hls', 'dash'):
            for cdn_name, cdn_data in (try_get(config_files, lambda x: x[files_type]['cdns']) or {}).items():
                manifest_url = cdn_data.get('url')
                if not manifest_url:
                    continue
                format_id = '%s-%s' % (files_type, cdn_name)
                sep_manifest_urls = []
                if re.search(sep_pattern, manifest_url):
                    # A '/sep/video/' manifest is requested twice: once with the
                    # path rewritten to '/video/' (plain format id) and once as
                    # '/sep/video/' (format id suffixed with '_sep')
                    for suffix, repl in (('', 'video'), ('_sep', 'sep/video')):
                        sep_manifest_urls.append((format_id + suffix, re.sub(
                            sep_pattern, '/%s/' % repl, manifest_url)))
                else:
                    sep_manifest_urls = [(format_id, manifest_url)]
                for f_id, m_url in sep_manifest_urls:
                    if files_type == 'hls':
                        fmts, subs = self._extract_m3u8_formats_and_subtitles(
                            m_url, video_id, 'mp4', live=is_live, m3u8_id=f_id,
                            note='Downloading %s m3u8 information' % cdn_name,
                            fatal=False)
                        formats.extend(fmts)
                        self._merge_subtitles(subs, target=subtitles)
                    elif files_type == 'dash':
                        if 'json=1' in m_url:
                            # With json=1 the URL is fetched as JSON first; if the
                            # response has a 'url', that one is used as the manifest URL
                            real_m_url = (self._download_json(m_url, video_id, fatal=False) or {}).get('url')
                            if real_m_url:
                                m_url = real_m_url
                        fmts, subs = self._extract_mpd_formats_and_subtitles(
                            m_url.replace('/master.json', '/master.mpd'), video_id, f_id,
                            'Downloading %s MPD information' % cdn_name,
                            fatal=False)
                        formats.extend(fmts)
                        self._merge_subtitles(subs, target=subtitles)

        # The live archive source is only offered once the archive status is 'done'
        live_archive = live_event.get('archive') or {}
        live_archive_source_url = live_archive.get('source_url')
        if live_archive_source_url and live_archive.get('status') == 'done':
            formats.append({
                'format_id': 'live-archive-source',
                'url': live_archive_source_url,
                'quality': 10,
            })

        # Text track URLs are resolved against https://vimeo.com
        for tt in (request.get('text_tracks') or []):
            subtitles.setdefault(tt['lang'], []).append({
                'ext': 'vtt',
                'url': urljoin('https://vimeo.com', tt['url']),
            })

        thumbnails = []
        if not is_live:
            # The keys of 'thumbs' double as thumbnail id and (when numeric) width
            for key, thumb in (video_data.get('thumbs') or {}).items():
                thumbnails.append({
                    'id': key,
                    'width': int_or_none(key),
                    'url': thumb,
                })
            thumbnail = video_data.get('thumbnail')
            if thumbnail:
                thumbnails.append({
                    'url': thumbnail,
                })

        owner = video_data.get('owner') or {}
        video_uploader_url = owner.get('url')

        duration = int_or_none(video_data.get('duration'))
        chapter_data = try_get(config, lambda x: x['embed']['chapters']) or []
        # Each chapter ends where the next one starts; the last one ends at `duration`
        chapters = [{
            'title': current_chapter.get('title'),
            'start_time': current_chapter.get('timecode'),
            'end_time': next_chapter.get('timecode'),
        } for current_chapter, next_chapter in zip(chapter_data, chapter_data[1:] + [{'timecode': duration}])]
        if chapters and chapters[0]['start_time']:  # Chapters may not start from 0
            chapters[:0] = [{'title': '<Untitled>', 'start_time': 0, 'end_time': chapters[0]['start_time']}]

        return {
            'id': str_or_none(video_data.get('id')) or video_id,
            'title': video_title,
            'uploader': owner.get('name'),
            # The uploader id is the last path segment of the owner's URL
            'uploader_id': video_uploader_url.split('/')[-1] if video_uploader_url else None,
            'uploader_url': video_uploader_url,
            'thumbnails': thumbnails,
            'duration': duration,
            'chapters': chapters or None,
            'formats': formats,
            'subtitles': subtitles,
            'is_live': is_live,
        }

    def _extract_original_format(self, url, video_id, unlisted_hash=None):
        """Try to locate the original (source) file of a video.

        Two lookups are attempted in order:

        1. `url` is requested with `action=load_download_config` (plus
           `unlisted_hash` when given). Its 'source_file' is used when it has
           a download URL, is neither cold nor defrosting, and the URL passes
           `_is_valid_url`.
        2. Otherwise a JWT is fetched from `/_rv/viewer` and the video is
           looked up through api.vimeo.com; the first 'download' entry whose
           quality is 'source' is used.

        Returns a format dict, or None when no source file could be found.
        """
        query = {'action': 'load_download_config'}
        if unlisted_hash:
            query['unlisted_hash'] = unlisted_hash
        download_data = self._download_json(
            url, video_id, fatal=False, query=query,
            headers={'X-Requested-With': 'XMLHttpRequest'},
            expected_status=(403, 404)) or {}
        source_file = download_data.get('source_file')
        download_url = try_get(source_file, lambda x: x['download_url'])
        if download_url and not source_file.get('is_cold') and not source_file.get('is_defrosting'):
            source_name = source_file.get('public_name', 'Original')
            if self._is_valid_url(download_url, video_id, '%s video' % source_name):
                # Prefer the declared extension, then the one in the URL, then mp4
                ext = (try_get(
                    source_file, lambda x: x['extension'],
                    compat_str) or determine_ext(
                    download_url, None) or 'mp4').lower()
                return {
                    'url': download_url,
                    'ext': ext,
                    'width': int_or_none(source_file.get('width')),
                    'height': int_or_none(source_file.get('height')),
                    'filesize': parse_filesize(source_file.get('size')),
                    'format_id': source_name,
                    'quality': 1,
                }

        jwt_response = self._download_json(
            'https://vimeo.com/_rv/viewer', video_id, note='Downloading jwt token', fatal=False) or {}
        if not jwt_response.get('jwt'):
            return
        headers = {'Authorization': 'jwt %s' % jwt_response['jwt']}
        # Address unlisted videos as '<id>:<hash>', the same way
        # _extract_from_api builds its API URL
        api_url = f'https://api.vimeo.com/videos/{video_id}'
        if unlisted_hash:
            api_url += f':{unlisted_hash}'
        original_response = self._download_json(
            api_url, video_id,
            headers=headers, fatal=False, expected_status=(403, 404)) or {}
        for download_data in original_response.get('download') or []:
            download_url = download_data.get('link')
            if not download_url or download_data.get('quality') != 'source':
                continue
            # Take the extension from the 'filename' query parameter when there is one
            ext = determine_ext(parse_qs(download_url).get('filename', [''])[0].lower(), default_ext=None)
            if not ext:
                # Otherwise ask the server with a HEAD request
                urlh = self._request_webpage(
                    HEADRequest(download_url), video_id, fatal=False, note='Determining source extension')
                ext = urlh and urlhandle_detect_ext(urlh)
            return {
                'url': download_url,
                'ext': ext or 'unknown_video',
                'format_id': download_data.get('public_name', 'Original'),
                'width': int_or_none(download_data.get('width')),
                'height': int_or_none(download_data.get('height')),
                'fps': int_or_none(download_data.get('fps')),
                'filesize': int_or_none(download_data.get('size')),
                'quality': 1,
            }


class VimeoIE(VimeoBaseInfoExtractor):
    """Information extractor for vimeo.com."""

    # _VALID_URL matches Vimeo URLs
    _VALID_URL = r'''(?x)
                    https?://
                        (?:
                            (?:
                                www|
                                player
                            )
                            \.
                        )?
                        vimeo(?:pro)?\.com/
                        (?!(?:channels|album|showcase)/[^/?#]+/?(?:$|[?#])|[^/]+/review/|ondemand/)
                        (?:[^/]+/)*?
                        (?:
                            (?:
                                play_redirect_hls|
                                moogaloop\.swf)\?clip_id=
                            )?
                        (?:videos?/)?
                        (?P<id>[0-9]+)
                        (?:/(?P<unlisted_hash>[\da-f]{10}))?
                        /?(?:[?&].*)?(?:[#].*)?$
                    '''
    IE_NAME = 'vimeo'
    _TESTS = [
        {
            'url': 'http://vimeo.com/56015672#at=0',
            'md5': '8879b6cc097e987f02484baf890129e5',
            'info_dict': {
                'id': '56015672',
                'ext': 'mp4',
                'title': "youtube-dl test video - \u2605 \" ' \u5e78 / \\ \u00e4 \u21ad \U0001d550",
                'description': 'md5:2d3305bad981a06ff79f027f19865021',
                'timestamp': 1355990239,
                'upload_date': '20121220',
                'uploader_url': r're:https?://(?:www\.)?vimeo\.com/user7108434',
                'uploader_id': 'user7108434',
                'uploader': 'Filippo Valsorda',
                'duration': 10,
                'license': 'by-sa',
            },
            'params': {
                'format': 'best[protocol=https]',
            },
        },
        {
            'url': 'http://vimeopro.com/openstreetmapus/state-of-the-map-us-2013/video/68093876',
            'md5': '3b5ca6aa22b60dfeeadf50b72e44ed82',
            'note': 'Vimeo Pro video (#1197)',
            'info_dict': {
                'id': '68093876',
                'ext': 'mp4',
                'uploader_url': r're:https?://(?:www\.)?vimeo\.com/openstreetmapus',
                'uploader_id': 'openstreetmapus',
                'uploader': 'OpenStreetMap US',
                'title': 'Andy Allan - Putting the Carto into OpenStreetMap Cartography',
                'description': 'md5:2c362968038d4499f4d79f88458590c1',
                'duration': 1595,
                'upload_date': '20130610',
                'timestamp': 1370893156,
                'license': 'by',
            },
            'params': {
                'format': 'best[protocol=https]',
            },
        },
        {
            'url': 'http://player.vimeo.com/video/54469442',
            'md5': '619b811a4417aa4abe78dc653becf511',
            'note': 'Videos that embed the url in the player page',
            'info_dict': {
                'id': '54469442',
                'ext': 'mp4',
                'title': 'Kathy Sierra: Building the minimum Badass User, Business of Software 2012',
                'uploader': 'Business of Software',
                'uploader_url': r're:https?://(?:www\.)?vimeo\.com/businessofsoftware',
                'uploader_id': 'businessofsoftware',
                'duration': 3610,
                'description': None,
            },
            'params': {
                'format': 'best[protocol=https]',
            },
        },
        {
            'url': 'http://vimeo.com/68375962',
            'md5': 'aaf896bdb7ddd6476df50007a0ac0ae7',
            'note': 'Video protected with password',
            'info_dict': {
                'id': '68375962',
                'ext': 'mp4',
                'title': 'youtube-dl password protected test video',
                'timestamp': 1371200155,
                'upload_date': '20130614',
                'uploader_url': r're:https?://(?:www\.)?vimeo\.com/user18948128',
                'uploader_id': 'user18948128',
                'uploader': 'Jaime Marquínez Ferrándiz',
                'duration': 10,
                'description': 'md5:dca3ea23adb29ee387127bc4ddfce63f',
            },
            'params': {
                'format': 'best[protocol=https]',
                'videopassword': 'youtube-dl',
            },
        },
        {
            'url': 'http://vimeo.com/channels/keypeele/75629013',
            'md5': '2f86a05afe9d7abc0b9126d229bbe15d',
            'info_dict': {
                'id': '75629013',
                'ext': 'mp4',
                'title': 'Key & Peele: Terrorist Interrogation',
                'description': 'md5:8678b246399b070816b12313e8b4eb5c',
                'uploader_url': r're:https?://(?:www\.)?vimeo\.com/atencio',
                'uploader_id': 'atencio',
                'uploader': 'Peter Atencio',
                'channel_id': 'keypeele',
                'channel_url': r're:https?://(?:www\.)?vimeo\.com/channels/keypeele',
                'timestamp': 1380339469,
                'upload_date': '20130928',
                'duration': 187,
            },
            'params': {'format': 'http-1080p'},
        },
        {
            'url': 'http://vimeo.com/76979871',
            'note': 'Video with subtitles',
            'info_dict': {
                'id': '76979871',
                'ext': 'mp4',
                'title': 'The New Vimeo Player (You Know, For Videos)',
                'description': 'md5:2ec900bf97c3f389378a96aee11260ea',
                'timestamp': 1381846109,
                'upload_date': '20131015',
                'uploader_url': r're:https?://(?:www\.)?vimeo\.com/staff',
                'uploader_id': 'staff',
                'uploader': 'Vimeo Staff',
                'duration': 62,
                'subtitles': {
                    'de': [{'ext': 'vtt'}],
                    'en': [{'ext': 'vtt'}],
                    'es': [{'ext': 'vtt'}],
                    'fr': [{'ext': 'vtt'}],
                },
            },
            'expected_warnings': ['Ignoring subtitle tracks found in the HLS manifest'],
        },
        {
            # from https://www.ouya.tv/game/Pier-Solar-and-the-Great-Architects/
            'url': 'https://player.vimeo.com/video/98044508',
            'note': 'The js code contains assignments to the same variable as the config',
            'info_dict': {
                'id': '98044508',
                'ext': 'mp4',
                'title': 'Pier Solar OUYA Official Trailer',
                'uploader': 'Tulio Gonçalves',
                'uploader_url': r're:https?://(?:www\.)?vimeo\.com/user28849593',
                'uploader_id': 'user28849593',
            },
        },
        {
            # contains original format
            'url': 'https://vimeo.com/33951933',
            'md5': '53c688fa95a55bf4b7293d37a89c5c53',
            'info_dict': {
                'id': '33951933',
                'ext': 'mp4',
                'title': 'FOX CLASSICS - Forever Classic ID - A Full Minute',
                'uploader': 'The DMCI',
                'uploader_url': r're:https?://(?:www\.)?vimeo\.com/dmci',
                'uploader_id': 'dmci',
                'timestamp': 1324343742,
                'upload_date': '20111220',
                'description': 'md5:ae23671e82d05415868f7ad1aec21147',
            },
        },
        {
            'note': 'Contains original format not accessible in webpage',
            'url': 'https://vimeo.com/393756517',
            'md5': 'c464af248b592190a5ffbb5d33f382b0',
            'info_dict': {
                'id': '393756517',
                'ext': 'mov',
                'timestamp': 1582642091,
                'uploader_id': 'frameworkla',
                'title': 'Straight To Hell - Sabrina: Netflix',
                'uploader': 'Framework Studio',
                'description': 'md5:f2edc61af3ea7a5592681ddbb683db73',
                'upload_date': '20200225',
            },
        },
        {
            # only available via https://vimeo.com/channels/tributes/6213729 and
            # not via https://vimeo.com/6213729
            'url': 'https://vimeo.com/channels/tributes/6213729',
            'info_dict': {
                'id': '6213729',
                'ext': 'mp4',
                'title': 'Vimeo Tribute: The Shining',
                'uploader': 'Casey Donahue',
                'uploader_url': r're:https?://(?:www\.)?vimeo\.com/caseydonahue',
                'uploader_id': 'caseydonahue',
                'channel_url': r're:https?://(?:www\.)?vimeo\.com/channels/tributes',
                'channel_id': 'tributes',
                'timestamp': 1250886430,
                'upload_date': '20090821',
                'description': 'md5:bdbf314014e58713e6e5b66eb252f4a6',
            },
            'params': {
                'skip_download': True,
            },
        },
        {
            # redirects to ondemand extractor and should be passed through it
            # for successful extraction
            'url': 'https://vimeo.com/73445910',
            'info_dict': {
                'id': '73445910',
                'ext': 'mp4',
                'title': 'The Reluctant Revolutionary',
                'uploader': '10Ft Films',
                'uploader_url': r're:https?://(?:www\.)?vimeo\.com/tenfootfilms',
                'uploader_id': 'tenfootfilms',
                'description': 'md5:0fa704e05b04f91f40b7f3ca2e801384',
                'upload_date': '20130830',
                'timestamp': 1377853339,
            },
            'params': {
                'skip_download': True,
            },
            'skip': 'this page is no longer available.',
        },
        {
            'url': 'http://player.vimeo.com/video/68375962',
            'md5': 'aaf896bdb7ddd6476df50007a0ac0ae7',
            'info_dict': {
                'id': '68375962',
                'ext': 'mp4',
                'title': 'youtube-dl password protected test video',
                'uploader_url': r're:https?://(?:www\.)?vimeo\.com/user18948128',
                'uploader_id': 'user18948128',
                'uploader': 'Jaime Marquínez Ferrándiz',
                'duration': 10,
            },
            'params': {
                'format': 'best[protocol=https]',
                'videopassword': 'youtube-dl',
            },
        },
        {
            'url': 'http://vimeo.com/moogaloop.swf?clip_id=2539741',
            'only_matching': True,
        },
        {
            'url': 'https://vimeo.com/109815029',
            'note': 'Video not completely processed, "failed" seed status',
            'only_matching': True,
        },
        {
            'url': 'https://vimeo.com/groups/travelhd/videos/22439234',
            'only_matching': True,
        },
        {
            'url': 'https://vimeo.com/album/2632481/video/79010983',
            'only_matching': True,
        },
        {
            'url': 'https://vimeo.com/showcase/3253534/video/119195465',
            'note': 'A video in a password protected album (showcase)',
            'info_dict': {
                'id': '119195465',
                'ext': 'mp4',
                'title': 'youtube-dl test video \'ä"BaW_jenozKc',
                'uploader': 'Philipp Hagemeister',
                'uploader_id': 'user20132939',
                'description': 'md5:fa7b6c6d8db0bdc353893df2f111855b',
                'upload_date': '20150209',
                'timestamp': 1423518307,
            },
            'params': {
                'format': 'best[protocol=https]',
                'videopassword': 'youtube-dl',
            },
        },
        {
            # source file returns 403: Forbidden
            'url': 'https://vimeo.com/7809605',
            'only_matching': True,
        },
        {
            'note': 'Direct URL with hash',
            'url': 'https://vimeo.com/160743502/abd0e13fb4',
            'info_dict': {
                'id': '160743502',
                'ext': 'mp4',
                'uploader': 'Julian Tryba',
                'uploader_id': 'aliniamedia',
                'title': 'Harrisville New Hampshire',
                'timestamp': 1459259666,
                'upload_date': '20160329',
            },
            'params': {'skip_download': True},
        },
        {
            'url': 'https://vimeo.com/138909882',
            'info_dict': {
                'id': '138909882',
                'ext': 'mp4',
                'title': 'Eastnor Castle 2015 Firework Champions - The Promo!',
                'description': 'md5:5967e090768a831488f6e74b7821b3c1',
                'uploader_id': 'fireworkchampions',
                'uploader': 'Firework Champions',
                'upload_date': '20150910',
                'timestamp': 1441901895,
            },
            'params': {
                'skip_download': True,
                'format': 'Original',
            },
        },
        {
            'url': 'https://vimeo.com/channels/staffpicks/143603739',
            'info_dict': {
                'id': '143603739',
                'ext': 'mp4',
                'uploader': 'Karim Huu Do',
                'timestamp': 1445846953,
                'upload_date': '20151026',
                'title': 'The Shoes - Submarine Feat. Blaine Harrison',
                'uploader_id': 'karimhd',
                'description': 'md5:8e2eea76de4504c2e8020a9bcfa1e843',
            },
            'params': {'skip_download': 'm3u8'},
        },
        {
            # requires passing unlisted_hash(a52724358e) to load_download_config request
            'url': 'https://vimeo.com/392479337/a52724358e',
            'only_matching': True,
        },
        {
            # similar, but all numeric: ID must be 581039021, not 9603038895
            # issue #29690
            'url': 'https://vimeo.com/581039021/9603038895',
            'info_dict': {
                'id': '581039021',
                # these have to be provided but we don't care
                'ext': 'mp4',
                'timestamp': 1627621014,
                'title': 're:.+',
                'uploader_id': 're:.+',
                'uploader': 're:.+',
                'upload_date': r're:\d+',
            },
            'params': {
                'skip_download': True,
            },
        }
        # https://gettingthingsdone.com/workflowmap/
        # vimeo embed with check-password page protected by Referer header
    ]

    @staticmethod
    def _smuggle_referrer(url, referrer_url):
        """Return `url` with a 'Referer' header of `referrer_url` smuggled into it."""
        extra_headers = {'Referer': referrer_url}
        return smuggle_url(url, {'http_headers': extra_headers})

    @staticmethod
    def _extract_urls(url, webpage):
        """Collect the Vimeo embed URLs found in `webpage`.

        Player iframe URLs come first; they are HTML-unescaped and carry `url`
        as a smuggled Referer. URLs from swf `<embed>` and `<video>` tags
        follow unchanged.
        """
        # Look for embedded (iframe) Vimeo player
        iframe_re = r'<iframe[^>]+?src=(["\'])(?P<url>(?:https?:)?//player\.vimeo\.com/video/\d+.*?)\1'
        found = [
            VimeoIE._smuggle_referrer(unescapeHTML(match.group('url')), url)
            for match in re.finditer(iframe_re, webpage)]
        plain_embed_patterns = (
            # Look for embedded (swf embed) Vimeo player
            r'<embed[^>]+?src=(["\'])(?P<url>(?:https?:)?//(?:www\.)?vimeo\.com/moogaloop\.swf.+?)\1',
            # Look more for non-standard embedded Vimeo player
            r'<video[^>]+src=(["\'])(?P<url>(?:https?:)?//(?:www\.)?vimeo\.com/[0-9]+)\1',
        )
        for pattern in plain_embed_patterns:
            found.extend(match.group('url') for match in re.finditer(pattern, webpage))
        return found

    @staticmethod
    def _extract_url(url, webpage):
        """Return the first URL found by `_extract_urls`, or None when there is none."""
        candidates = VimeoIE._extract_urls(url, webpage)
        if not candidates:
            return None
        return candidates[0]

    def _verify_player_video_password(self, url, video_id, headers):
        """Send the base64-encoded video password to `url + '/check-password'`.

        `headers` is merged with a form 'Content-Type' header for the request.
        Returns the decoded JSON response; raises an expected ExtractorError
        when that response is exactly False.
        """
        video_password = self._get_video_password()
        encoded_password = base64.b64encode(video_password.encode())
        form_data = urlencode_postdata({'password': encoded_password})
        request_headers = merge_dicts(
            headers, {'Content-Type': 'application/x-www-form-urlencoded'})
        result = self._download_json(
            url + '/check-password', video_id,
            'Verifying the password', data=form_data, headers=request_headers)
        if result is False:
            raise ExtractorError('Wrong video password', expected=True)
        return result

    def _real_initialize(self):
        """Run the login step by calling `_login`."""
        self._login()

    def _extract_from_api(self, video_id, unlisted_hash=None):
        """Extract a video through api.vimeo.com.

        A JWT is fetched from `/_rv/jwt` and used to request the video's
        metadata; when `unlisted_hash` is given the video is addressed as
        '<video_id>:<unlisted_hash>'. The player config behind the returned
        'config_url' is parsed with `_parse_config`, its formats are sorted,
        and the API metadata is merged into the result.

        Returns the info dict.
        """
        jwt_token = self._download_json(
            'https://vimeo.com/_rv/jwt', video_id, headers={
                'X-Requested-With': 'XMLHttpRequest'
            })['token']
        video_ref = video_id + ':' + unlisted_hash if unlisted_hash else video_id
        video = self._download_json(
            'https://api.vimeo.com/videos/' + video_ref, video_id,
            headers={'Authorization': 'jwt ' + jwt_token},
            query={
                'fields': 'config_url,created_time,description,license,metadata.connections.comments.total,metadata.connections.likes.total,release_time,stats.plays',
            })
        player_config = self._download_json(video['config_url'], video_id)
        info = self._parse_config(player_config, video_id)
        self._vimeo_sort_formats(info['formats'])

        def api_timestamp(prefix):
            # Parse the '<prefix>_time' field of the API response
            return parse_iso8601(video.get(prefix + '_time'))

        play_count = try_get(video, lambda x: x['stats']['plays'])
        info.update({
            'description': video.get('description'),
            'license': video.get('license'),
            'release_timestamp': api_timestamp('release'),
            'timestamp': api_timestamp('created'),
            'view_count': int_or_none(play_count),
        })
        connections = try_get(
            video, lambda x: x['metadata']['connections'], dict) or {}
        for kind in ('comment', 'like'):
            total = try_get(connections, lambda x: x[kind + 's']['total'])
            info[kind + '_count'] = int_or_none(total)
        return info

    def _try_album_password(self, url):
        """Authenticate against a password-protected album/showcase, if `url` is in one.

        Returns without doing anything when `url` has no album or showcase id,
        or when the album's view privacy is not 'password'. Otherwise the
        'videopassword' param is posted to the showcase auth endpoint.

        Raises an expected ExtractorError when no password was supplied or
        when the auth request fails with HTTP 401.
        """
        album_id = self._search_regex(
            r'vimeo\.com/(?:album|showcase)/([^/]+)', url, 'album id', default=None)
        if not album_id:
            return

        viewer = self._download_json(
            'https://vimeo.com/_rv/viewer', album_id, fatal=False)
        if not viewer:
            # Fall back to the viewer data embedded in the album page
            webpage = self._download_webpage(url, album_id)
            bootstrap_json = self._search_regex(
                r'bootstrap_data\s*=\s*({.+?})</script>',
                webpage, 'bootstrap data')
            viewer = self._parse_json(bootstrap_json, album_id)['viewer']

        auth_headers = {'Authorization': 'jwt ' + viewer['jwt']}
        album = self._download_json(
            'https://api.vimeo.com/albums/' + album_id,
            album_id, headers=auth_headers,
            query={'fields': 'description,name,privacy'})
        if try_get(album, lambda x: x['privacy']['view']) != 'password':
            return

        album_password = self.get_param('videopassword')
        if not album_password:
            raise ExtractorError(
                'This album is protected by a password, use the --video-password option',
                expected=True)
        self._set_vimeo_cookie('vuid', viewer['vuid'])
        try:
            self._download_json(
                'https://vimeo.com/showcase/%s/auth' % album_id,
                album_id, 'Verifying the password', data=urlencode_postdata({
                    'password': album_password,
                    'token': viewer['xsrft'],
                }), headers={
                    'X-Requested-With': 'XMLHttpRequest',
                })
        except ExtractorError as e:
            rejected = isinstance(e.cause, compat_HTTPError) and e.cause.code == 401
            if rejected:
                raise ExtractorError('Wrong password', expected=True)
            raise

    def _real_extract(self, url):
        """Build the info dict for a single Vimeo video URL.

        Three paths are possible:
          * delegation to self._extract_from_api() when the URL carries an
            unlisted hash or when no page config can be found in the webpage;
          * direct parsing of the config embedded in the page for
            player.vimeo.com URLs;
          * otherwise a merge of data scraped from the webpage, the
            downloaded player config and the page's JSON-LD.

        Raises ExtractorError for embed-only videos (HTTP 403 carrying
        Vimeo's privacy message) and when the page reports a 'failed' seed
        status; other download errors propagate unchanged.
        """
        # Headers smuggled into the URL override the globally configured
        # ones; the Referer defaults to the video URL itself.
        url, data = unsmuggle_url(url, {})
        headers = self.get_param('http_headers').copy()
        if 'http_headers' in data:
            headers.update(data['http_headers'])
        if 'Referer' not in headers:
            headers['Referer'] = url

        # Extract ID from URL
        mobj = self._match_valid_url(url).groupdict()
        video_id, unlisted_hash = mobj['id'], mobj.get('unlisted_hash')
        # URLs carrying an unlisted hash are handled entirely by the API path
        if unlisted_hash:
            return self._extract_from_api(video_id, unlisted_hash)

        # Remember the URL as given: it is fetched again further down as a
        # last resort for the description of vimeopro videos.
        orig_url = url
        is_pro = 'vimeopro.com/' in url
        if is_pro:
            # some videos require portfolio_id to be present in player url
            # https://github.com/ytdl-org/youtube-dl/issues/20070
            url = self._extract_url(url, self._download_webpage(url, video_id))
            if not url:
                url = 'https://vimeo.com/' + video_id
        elif any(p in url for p in ('play_redirect_hls', 'moogaloop.swf')):
            # These URL forms are rewritten to the plain video page URL
            url = 'https://vimeo.com/' + video_id

        # No-op unless the URL points into an album/showcase that is
        # password protected.
        self._try_album_password(url)
        try:
            # Retrieve video webpage to extract further information
            webpage, urlh = self._download_webpage_handle(
                url, video_id, headers=headers)
            # Final URL after redirects; used for the password requests below
            redirect_url = urlh.geturl()
        except ExtractorError as ee:
            # Turn the 403 sent for embed-only videos into an actionable
            # message; every other failure is re-raised untouched.
            if isinstance(ee.cause, compat_HTTPError) and ee.cause.code == 403:
                errmsg = ee.cause.read()
                if b'Because of its privacy settings, this video cannot be played here' in errmsg:
                    raise ExtractorError(
                        'Cannot download embed-only video without embedding '
                        'URL. Please call yt-dlp with the URL of the page '
                        'that embeds this video.',
                        expected=True)
            raise

        # Player URLs embed the whole config in the page, so no further
        # page scraping is needed for them.
        if '://player.vimeo.com/video/' in url:
            config = self._parse_json(self._search_regex(
                r'\bconfig\s*=\s*({.+?})\s*;', webpage, 'info section'), video_id)
            # view == 4: the config is replaced by the one returned from the
            # player password verification
            # NOTE(review): presumably marks a password-protected embed - confirm
            if config.get('view') == 4:
                config = self._verify_player_video_password(
                    redirect_url, video_id, headers)
            info = self._parse_config(config, video_id)
            self._vimeo_sort_formats(info['formats'])
            return info

        # The page shows a password form: submit the password and continue
        # with the page returned by the verification request.
        if re.search(r'<form[^>]+?id="pw_form"', webpage):
            video_password = self._get_video_password()
            token, vuid = self._extract_xsrft_and_vuid(webpage)
            webpage = self._verify_video_password(
                redirect_url, video_id, video_password, token, vuid)

        # Surface the site's own error title when the seed status is 'failed'
        vimeo_config = self._extract_vimeo_config(webpage, video_id, default=None)
        if vimeo_config:
            seed_status = vimeo_config.get('seed_status') or {}
            if seed_status.get('state') == 'failed':
                raise ExtractorError(
                    '%s said: %s' % (self.IE_NAME, seed_status['title']),
                    expected=True)

        cc_license = None
        timestamp = None
        video_description = None
        info_dict = {}
        config_url = None

        # Channel pages: the config URL is read from a data-config-url
        # attribute and the description from the 'description' element.
        channel_id = self._search_regex(
            r'vimeo\.com/channels/([^/]+)', url, 'channel id', default=None)
        if channel_id:
            config_url = self._html_search_regex(
                r'\bdata-config-url="([^"]+)"', webpage, 'config URL', default=None)
            video_description = clean_html(get_element_by_class('description', webpage))
            info_dict.update({
                'channel_id': channel_id,
                'channel_url': 'https://vimeo.com/channels/' + channel_id,
            })
        if not config_url:
            # Otherwise use the clip/vod page config; the '{}' default makes
            # a missing config parse to an empty dict, which hands the whole
            # extraction over to the API path.
            page_config = self._parse_json(self._search_regex(
                r'vimeo\.(?:clip|vod_title)_page_config\s*=\s*({.+?});',
                webpage, 'page config', default='{}'), video_id, fatal=False)
            if not page_config:
                return self._extract_from_api(video_id)
            config_url = page_config['player']['config_url']
            cc_license = page_config.get('cc_license')
            clip = page_config.get('clip') or {}
            timestamp = clip.get('uploaded_on')
            video_description = clean_html(
                clip.get('description') or page_config.get('description_html_escaped'))
        config = self._download_json(config_url, video_id)
        video = config.get('video') or {}
        vod = video.get('vod') or {}

        # True when the webpage, the config's user entry or any of the VOD
        # purchase options indicates that the title was rented/purchased.
        def is_rented():
            if '>You rented this title.<' in webpage:
                return True
            if try_get(config, lambda x: x['user']['purchased']):
                return True
            for purchase_option in (vod.get('purchase_options') or []):
                if purchase_option.get('purchased'):
                    return True
                label = purchase_option.get('label_string')
                if label and (label.startswith('You rented this') or label.endswith(' remaining')):
                    return True
            return False

        # A rented title whose config describes the trailer: hand over to the
        # feature's player URL. The smuggled 'force_feature_id' flag keeps
        # this redirect from being taken a second time.
        if is_rented() and vod.get('is_trailer'):
            feature_id = vod.get('feature_id')
            if feature_id and not data.get('force_feature_id', False):
                return self.url_result(smuggle_url(
                    'https://player.vimeo.com/player/%s' % feature_id,
                    {'force_feature_id': True}), 'Vimeo')

        # Description fallbacks, tried in order until one succeeds: a
        # description <div>, the page's meta tags, and (vimeopro only) the
        # meta description of the originally requested page.
        if not video_description:
            video_description = self._html_search_regex(
                r'(?s)<div\s+class="[^"]*description[^"]*"[^>]*>(.*?)</div>',
                webpage, 'description', default=None)
        if not video_description:
            video_description = self._html_search_meta(
                ['description', 'og:description', 'twitter:description'],
                webpage, default=None)
        if not video_description and is_pro:
            orig_webpage = self._download_webpage(
                orig_url, video_id,
                note='Downloading webpage for description',
                fatal=False)
            if orig_webpage:
                video_description = self._html_search_meta(
                    'description', orig_webpage, default=None)
        if not video_description:
            self.report_warning('Cannot find video description')

        # Fall back to the first <time datetime="..."> element of the page
        if not timestamp:
            timestamp = self._search_regex(
                r'<time[^>]+datetime="([^"]+)"', webpage,
                'timestamp', default=None)

        # Counters are optional: each one is None when its marker is absent
        view_count = int_or_none(self._search_regex(r'UserPlays:(\d+)', webpage, 'view count', default=None))
        like_count = int_or_none(self._search_regex(r'UserLikes:(\d+)', webpage, 'like count', default=None))
        comment_count = int_or_none(self._search_regex(r'UserComments:(\d+)', webpage, 'comment count', default=None))

        formats = []

        # The original/source file, when one is found, is listed ahead of the
        # formats coming from the player config (before sorting).
        source_format = self._extract_original_format(
            'https://vimeo.com/' + video_id, video_id, video.get('unlisted_hash'))
        if source_format:
            formats.append(source_format)

        info_dict_config = self._parse_config(config, video_id)
        formats.extend(info_dict_config['formats'])
        self._vimeo_sort_formats(formats)

        json_ld = self._search_json_ld(webpage, video_id, default={})

        # Only scrape the <link rel="license"> tag when the page config did
        # not already provide a license.
        if not cc_license:
            cc_license = self._search_regex(
                r'<link[^>]+rel=["\']license["\'][^>]+href=(["\'])(?P<license>(?:(?!\1).)+)\1',
                webpage, 'license', default=None, group='license')

        info_dict.update({
            'formats': formats,
            'timestamp': unified_timestamp(timestamp),
            'description': video_description,
            'webpage_url': url,
            'view_count': view_count,
            'like_count': like_count,
            'comment_count': comment_count,
            'license': cc_license,
        })

        # NOTE(review): presumably values from earlier dicts win over later
        # ones here - confirm against merge_dicts
        return merge_dicts(info_dict, info_dict_config, json_ld)


class VimeoOndemandIE(VimeoIE):
    # Variant of VimeoIE for vimeo.com/ondemand/ URLs: this class only
    # supplies its own name, URL pattern and tests, everything else is
    # inherited.
    IE_NAME = 'vimeo:ondemand'
    # One optional path segment may precede the captured id, so both
    # /ondemand/<id> and /ondemand/<segment>/<id> match.
    _VALID_URL = r'https?://(?:www\.)?vimeo\.com/ondemand/(?:[^/]+/)?(?P<id>[^/?#&]+)'
    _TESTS = [{
        # ondemand video not available via https://vimeo.com/id
        'url': 'https://vimeo.com/ondemand/20704',
        'md5': 'c424deda8c7f73c1dfb3edd7630e2f35',
        'info_dict': {
            'id': '105442900',
            'ext': 'mp4',
            'title': 'המעבדה - במאי יותם פלדמן',
            'uploader': 'גם סרטים',
            'uploader_url': r're:https?://(?:www\.)?vimeo\.com/gumfilms',
            'uploader_id': 'gumfilms',
            'description': 'md5:4c027c965e439de4baab621e48b60791',
            'upload_date': '20140906',
            'timestamp': 1410032453,
        },
        'params': {
            'format': 'best[protocol=https]',
        },
        'expected_warnings': ['Unable to download JSON metadata'],
    }, {
        # requires Referer to be passed along with og:video:url
        'url': 'https://vimeo.com/ondemand/36938/126682985',
        'info_dict': {
            'id': '126584684',
            'ext': 'mp4',
            'title': 'Rävlock, rätt läte på rätt plats',
            'uploader': 'Lindroth & Norin',
            'uploader_url': r're:https?://(?:www\.)?vimeo\.com/lindrothnorin',
            'uploader_id': 'lindrothnorin',
            'description': 'md5:c3c46a90529612c8279fb6af803fc0df',
            'upload_date': '20150502',
            'timestamp': 1430586422,
        },
        'params': {
            'skip_download': True,
        },
        'expected_warnings': ['Unable to download JSON metadata'],
    }, {
        # The remaining entries only check that the URL pattern matches
        'url': 'https://vimeo.com/ondemand/nazmaalik',
        'only_matching': True,
    }, {
        'url': 'https://vimeo.com/ondemand/141692381',
        'only_matching': True,
    }, {
        'url': 'https://vimeo.com/ondemand/thelastcolony/150274832',
        'only_matching': True,
    }]


class VimeoChannelIE(VimeoBaseInfoExtractor):
    # Playlist extractor for vimeo.com/channels/<id>. It walks the paginated
    # HTML listing and emits one VimeoIE url_result per clip. The class
    # attributes and _page_url() are the customisation points used by the
    # listing extractors that derive from this class.
    IE_NAME = 'vimeo:channel'
    _VALID_URL = r'https://vimeo\.com/channels/(?P<id>[^/?#]+)/?(?:$|[?#])'
    # A listing page that matches this regex is followed by another page
    _MORE_PAGES_INDICATOR = r'<a.+?rel="next"'
    # Fixed list title; when falsy the title is scraped with _TITLE_RE
    _TITLE = None
    _TITLE_RE = r'<link rel="alternate"[^>]+?title="(.*?)"'
    _TESTS = [{
        'url': 'https://vimeo.com/channels/tributes',
        'info_dict': {
            'id': 'tributes',
            'title': 'Vimeo Tributes',
        },
        'playlist_mincount': 25,
    }]
    _BASE_URL_TEMPL = 'https://vimeo.com/channels/%s'

    def _page_url(self, base_url, pagenum):
        """Return the address of listing page number *pagenum*."""
        return '%s/videos/page:%d/' % (base_url, pagenum)

    def _extract_list_title(self, webpage):
        """Return the fixed _TITLE if set, else the title scraped from *webpage*."""
        if self._TITLE:
            return self._TITLE
        return self._html_search_regex(
            self._TITLE_RE, webpage, 'list title', fatal=False)

    def _title_and_entries(self, list_id, base_url):
        """Yield the list title first, then one url_result per clip.

        Pages are downloaded lazily, one per loop iteration, until a page no
        longer matches _MORE_PAGES_INDICATOR.
        """
        for pagenum in itertools.count(1):
            webpage = self._download_webpage(
                self._page_url(base_url, pagenum), list_id,
                'Downloading page %s' % pagenum)

            # The title is taken from the first page only
            if pagenum == 1:
                yield self._extract_list_title(webpage)

            # Prefer the href found next to each clip since not all videos
            # are available via the short https://vimeo.com/id URL
            # (e.g. https://vimeo.com/channels/tributes/6213729)
            clips = re.findall(
                r'id="clip_(\d+)"[^>]*>\s*<a[^>]+href="(/(?:[^/]+/)*\1)(?:[^>]+\btitle="([^"]+)")?', webpage)
            if not clips:
                # More relaxed fallback: bare clip ids, short URLs
                for video_id in re.findall(r'id=["\']clip_(\d+)', webpage):
                    yield self.url_result(
                        'https://vimeo.com/%s' % video_id,
                        VimeoIE.ie_key(), video_id=video_id)
            for video_id, video_path, video_title in clips:
                yield self.url_result(
                    compat_urlparse.urljoin(base_url, video_path),
                    VimeoIE.ie_key(), video_id=video_id, video_title=video_title)

            has_next_page = re.search(
                self._MORE_PAGES_INDICATOR, webpage, re.DOTALL) is not None
            if not has_next_page:
                return

    def _extract_videos(self, list_id, base_url):
        """Return a playlist result for the listing rooted at *base_url*."""
        stream = self._title_and_entries(list_id, base_url)
        # The generator's first item is the title; the rest are the entries
        playlist_title = next(stream)
        return self.playlist_result(stream, list_id, playlist_title)

    def _real_extract(self, url):
        channel_id = self._match_id(url)
        listing_url = self._BASE_URL_TEMPL % channel_id
        return self._extract_videos(channel_id, listing_url)


class VimeoUserIE(VimeoChannelIE):
    # Listing extractor for a user's videos. Only the name, URL pattern,
    # title regex, tests and base URL template are overridden; the rest is
    # inherited from VimeoChannelIE.
    IE_NAME = 'vimeo:user'
    # The negative lookahead keeps purely numeric paths and 'watchlater'
    # from being matched as user names.
    _VALID_URL = r'https://vimeo\.com/(?!(?:[0-9]+|watchlater)(?:$|[?#/]))(?P<id>[^/]+)(?:/videos|[#?]|$)'
    _TITLE_RE = r'<a[^>]+?class="user">([^<>]+?)</a>'
    _TESTS = [{
        'url': 'https://vimeo.com/nkistudio/videos',
        'info_dict': {
            'title': 'Nki',
            'id': 'nkistudio',
        },
        'playlist_mincount': 66,
    }]
    _BASE_URL_TEMPL = 'https://vimeo.com/%s'


class VimeoAlbumIE(VimeoBaseInfoExtractor):
    # Playlist extractor for vimeo.com/album/<id> and vimeo.com/showcase/<id>.
    # The video list is read page by page from the api.vimeo.com albums
    # endpoint, authorised with the viewer's JWT.
    IE_NAME = 'vimeo:album'
    _VALID_URL = r'https://vimeo\.com/(?:album|showcase)/(?P<id>\d+)(?:$|[?#]|/(?!video))'
    _TITLE_RE = r'<header id="page_header">\n\s*<h1>(.*?)</h1>'
    _TESTS = [{
        'url': 'https://vimeo.com/album/2632481',
        'info_dict': {
            'id': '2632481',
            'title': 'Staff Favorites: November 2013',
        },
        'playlist_mincount': 13,
    }, {
        'note': 'Password-protected album',
        'url': 'https://vimeo.com/album/3253534',
        'info_dict': {
            'title': 'test',
            'id': '3253534',
        },
        'playlist_count': 1,
        'params': {
            'videopassword': 'youtube-dl',
        }
    }]
    # Number of videos requested per API page ('per_page')
    _PAGE_SIZE = 100

    def _fetch_page(self, album_id, authorization, hashed_pass, page):
        """Yield a url_result for every linked video on one API page.

        *page* is zero-based; the API is queried with page + 1.
        *authorization* is the JWT sent in the Authorization header and
        *hashed_pass*, when truthy, is forwarded as '_hashed_pass'.

        An HTTP 400 answer ends the page without yielding anything; any
        other download error is raised to the caller.
        """
        api_page = page + 1
        query = {
            'fields': 'link,uri',
            'page': api_page,
            'per_page': self._PAGE_SIZE,
        }
        if hashed_pass:
            query['_hashed_pass'] = hashed_pass
        try:
            videos = self._download_json(
                'https://api.vimeo.com/albums/%s/videos' % album_id,
                album_id, 'Downloading page %d' % api_page, query=query, headers={
                    'Authorization': 'jwt ' + authorization,
                })['data']
        except ExtractorError as e:
            # NOTE(review): 400 is presumably what the API answers for a page
            # past the end of the album - confirm
            if isinstance(e.cause, compat_HTTPError) and e.cause.code == 400:
                return
            # Anything else is a real failure. Without this re-raise the
            # error was swallowed and the loop below crashed with an
            # UnboundLocalError because 'videos' was never assigned.
            raise
        for video in videos:
            link = video.get('link')
            if not link:
                continue
            uri = video.get('uri')
            video_id = self._search_regex(r'/videos/(\d+)', uri, 'video_id', default=None) if uri else None
            yield self.url_result(link, VimeoIE.ie_key(), video_id)

    def _real_extract(self, url):
        """Return a lazily paged playlist result for the album at *url*.

        Raises ExtractorError when the album is password protected and no
        password was supplied, or when the password is rejected (HTTP 401).
        """
        album_id = self._match_id(url)
        viewer = self._download_json(
            'https://vimeo.com/_rv/viewer', album_id, fatal=False)
        if not viewer:
            # Fall back to the bootstrap JSON embedded in the album page
            webpage = self._download_webpage(url, album_id)
            viewer = self._parse_json(self._search_regex(
                r'bootstrap_data\s*=\s*({.+?})</script>',
                webpage, 'bootstrap data'), album_id)['viewer']
        jwt = viewer['jwt']
        album = self._download_json(
            'https://api.vimeo.com/albums/' + album_id,
            album_id, headers={'Authorization': 'jwt ' + jwt},
            query={'fields': 'description,name,privacy'})
        hashed_pass = None
        if try_get(album, lambda x: x['privacy']['view']) == 'password':
            password = self.get_param('videopassword')
            if not password:
                raise ExtractorError(
                    'This album is protected by a password, use the --video-password option',
                    expected=True)
            self._set_vimeo_cookie('vuid', viewer['vuid'])
            try:
                # The auth response carries the hashed password that every
                # page request has to send along
                hashed_pass = self._download_json(
                    'https://vimeo.com/showcase/%s/auth' % album_id,
                    album_id, 'Verifying the password', data=urlencode_postdata({
                        'password': password,
                        'token': viewer['xsrft'],
                    }), headers={
                        'X-Requested-With': 'XMLHttpRequest',
                    })['hashed_pass']
            except ExtractorError as e:
                if isinstance(e.cause, compat_HTTPError) and e.cause.code == 401:
                    raise ExtractorError('Wrong password', expected=True)
                raise
        # Pages are only requested when the playlist is actually consumed
        entries = OnDemandPagedList(functools.partial(
            self._fetch_page, album_id, jwt, hashed_pass), self._PAGE_SIZE)
        return self.playlist_result(
            entries, album_id, album.get('name'), album.get('description'))


class VimeoGroupsIE(VimeoChannelIE):
    # Listing extractor for vimeo.com/groups/<id>. Only the name, URL
    # pattern, tests and base URL template are overridden; the rest is
    # inherited from VimeoChannelIE.
    IE_NAME = 'vimeo:group'
    # The negative lookahead rejects group URLs that continue with
    # video/<digits> or videos/<digits>.
    _VALID_URL = r'https://vimeo\.com/groups/(?P<id>[^/]+)(?:/(?!videos?/\d+)|$)'
    _TESTS = [{
        'url': 'https://vimeo.com/groups/meetup',
        'info_dict': {
            'id': 'meetup',
            'title': 'Vimeo Meetup!',
        },
        'playlist_mincount': 27,
    }]
    _BASE_URL_TEMPL = 'https://vimeo.com/groups/%s'


class VimeoReviewIE(VimeoBaseInfoExtractor):
    # Extractor for review pages (vimeo.com/<user>/review/<id>/<hash>).
    # Metadata comes from the page's '/review/data/' JSON, or from the clip
    # page config when the review is locked behind a password.
    IE_NAME = 'vimeo:review'
    IE_DESC = 'Review pages on vimeo'
    _VALID_URL = r'(?P<url>https://vimeo\.com/[^/]+/review/(?P<id>[^/]+)/[0-9a-f]{10})'
    _TESTS = [{
        'url': 'https://vimeo.com/user21297594/review/75524534/3c257a1b5d',
        'md5': 'c507a72f780cacc12b2248bb4006d253',
        'info_dict': {
            'id': '75524534',
            'ext': 'mp4',
            'title': "DICK HARDWICK 'Comedian'",
            'uploader': 'Richard Hardwick',
            'uploader_id': 'user21297594',
            'description': "Comedian Dick Hardwick's five minute demo filmed in front of a live theater audience.\nEdit by Doug Mattocks",
        },
    }, {
        'note': 'video player needs Referer',
        'url': 'https://vimeo.com/user22258446/review/91613211/13f927e053',
        'md5': '6295fdab8f4bf6a002d058b2c6dce276',
        'info_dict': {
            'id': '91613211',
            'ext': 'mp4',
            'title': 're:(?i)^Death by dogma versus assembling agile . Sander Hoogendoorn',
            'uploader': 'DevWeek Events',
            'duration': 2773,
            'thumbnail': r're:^https?://.*\.jpg$',
            'uploader_id': 'user22258446',
        },
        'skip': 'video gone',
    }, {
        'note': 'Password protected',
        'url': 'https://vimeo.com/user37284429/review/138823582/c4d865efde',
        'info_dict': {
            'id': '138823582',
            'ext': 'mp4',
            'title': 'EFFICIENT PICKUP MASTERCLASS MODULE 1',
            'uploader': 'TMB',
            'uploader_id': 'user37284429',
        },
        'params': {
            'videopassword': 'holygrail',
        },
        'skip': 'video gone',
    }]

    def _real_initialize(self):
        self._login()

    def _real_extract(self, url):
        """Build the info dict for a review page, unlocking it if required."""
        # Both capture groups of _VALID_URL: the matched URL and the video id
        page_url, video_id = self._match_valid_url(url).groups()
        review_data = self._download_json(
            page_url.replace('/review/', '/review/data/'), video_id)

        if review_data.get('isLocked') is not True:
            # Unlocked review: the data JSON already names the config URL
            clip_data = review_data['clipData']
            config_url = clip_data['configUrl']
        else:
            # Locked review: verify the password against the plain video
            # page and read the config URL from the page that comes back
            video_password = self._get_video_password()
            viewer = self._download_json(
                'https://vimeo.com/_rv/viewer', video_id)
            unlocked_page = self._verify_video_password(
                'https://vimeo.com/' + video_id, video_id,
                video_password, viewer['xsrft'], viewer['vuid'])
            page_config_json = self._search_regex(
                r'window\.vimeo\.clip_page_config\s*=\s*({.+?});',
                unlocked_page, 'clip page config')
            clip_page_config = self._parse_json(page_config_json, video_id)
            config_url = clip_page_config['player']['config_url']
            clip_data = clip_page_config.get('clip') or {}

        player_config = self._download_json(config_url, video_id)
        info_dict = self._parse_config(player_config, video_id)

        # Add the original/source file, when available, to the formats
        source_format = self._extract_original_format(
            page_url + '/action', video_id)
        if source_format:
            info_dict['formats'].append(source_format)
        self._vimeo_sort_formats(info_dict['formats'])

        info_dict['description'] = clean_html(clip_data.get('description'))
        return info_dict


class VimeoWatchLaterIE(VimeoChannelIE):
    # Listing extractor for the logged-in user's watch later list; login is
    # mandatory (_LOGIN_REQUIRED) and the list title is fixed.
    IE_NAME = 'vimeo:watchlater'
    IE_DESC = 'Vimeo watch later list, "vimeowatchlater" keyword (requires authentication)'
    _VALID_URL = r'https://vimeo\.com/(?:home/)?watchlater|:vimeowatchlater'
    _TITLE = 'Watch Later'
    _LOGIN_REQUIRED = True
    _TESTS = [{
        'url': 'https://vimeo.com/watchlater',
        'only_matching': True,
    }]

    def _real_initialize(self):
        self._login()

    def _page_url(self, base_url, pagenum):
        """Return a request object (not a plain URL) for listing page *pagenum*."""
        page_request = sanitized_Request('%s/page:%d/' % (base_url, pagenum))
        # Set the header to get a partial html page with the ids,
        # the normal page doesn't contain them.
        page_request.add_header('X-Requested-With', 'XMLHttpRequest')
        return page_request

    def _real_extract(self, url):
        # The list id and address are fixed, whatever form of URL matched
        list_id = 'watchlater'
        listing_url = 'https://vimeo.com/watchlater'
        return self._extract_videos(list_id, listing_url)


class VimeoLikesIE(VimeoChannelIE):
    # Listing extractor for the videos a user has liked
    # (vimeo.com/<user>/likes).
    _VALID_URL = r'https://(?:www\.)?vimeo\.com/(?P<id>[^/]+)/likes/?(?:$|[?#]|sort:)'
    IE_NAME = 'vimeo:likes'
    IE_DESC = 'Vimeo user likes'
    _TESTS = [{
        'url': 'https://vimeo.com/user755559/likes/',
        'playlist_mincount': 293,
        'info_dict': {
            'id': 'user755559',
            'title': 'urza’s Likes',
        },
    }, {
        'url': 'https://vimeo.com/stormlapse/likes',
        'only_matching': True,
    }]

    def _page_url(self, base_url, pagenum):
        """Return the address of likes page *pagenum* (no '/videos' segment)."""
        page_suffix = 'page:%d/' % pagenum
        return '%s/%s' % (base_url, page_suffix)

    def _real_extract(self, url):
        user_id = self._match_id(url)
        likes_url = 'https://vimeo.com/%s/likes' % user_id
        return self._extract_videos(user_id, likes_url)


class VHXEmbedIE(VimeoBaseInfoExtractor):
    # Extractor for embed.vhx.tv/videos/<id> embeds; the player config URL is
    # read from the window.OTTData object of the embed page.
    IE_NAME = 'vhx:embed'
    _VALID_URL = r'https?://embed\.vhx\.tv/videos/(?P<id>\d+)'

    @staticmethod
    def _extract_url(webpage):
        """Return the first VHX embed iframe URL in *webpage*, or None."""
        iframe = re.search(
            r'<iframe[^>]+src="(https?://embed\.vhx\.tv/videos/\d+[^"]*)"', webpage)
        if not iframe:
            return None
        return unescapeHTML(iframe.group(1))

    def _real_extract(self, url):
        """Build the info dict from the player config named in window.OTTData."""
        video_id = self._match_id(url)
        webpage = self._download_webpage(url, video_id)
        ott_data_js = self._search_regex(
            r'window\.OTTData\s*=\s*({.+})', webpage,
            'ott data')
        # OTTData is a JavaScript object literal, hence the js_to_json step
        ott_data = self._parse_json(ott_data_js, video_id, js_to_json)
        config = self._download_json(ott_data['config_url'], video_id)
        info = self._parse_config(config, video_id)
        # Report the id taken from the URL
        info['id'] = video_id
        self._vimeo_sort_formats(info['formats'])
        return info
-												Unify coding cookie

											
										
										
											2016-10-02 11:39:18 +00:00
+								# coding: utf-8
-												[vimeo] Use unicode_literals

											
										
										
											2014-01-06 22:38:16 +00:00
+								from __future__ import unicode_literals
-												[vimeo] fix extraction for password protected player URLs(closes #18889)

											
										
										
											2019-01-17 08:44:08 +00:00
+								import base64
-												[vimeo] fix album extraction

closes #1933
closes #15704
closes #15855
closes #18967
closes #21986

											
										
										
											2019-08-03 09:29:20 +00:00
+								import functools
-												Move Vimeo into its own file

											
										
										
											2013-06-23 18:18:21 +00:00
+								import re
-												[vimeo] add an extractor for channels

											
										
										
											2013-07-29 11:12:09 +00:00
+								import itertools
-												Move Vimeo into its own file

											
										
										
											2013-06-23 18:18:21 +00:00
 								from .common import InfoExtractor
-												[util] Move compatibility functions out of util

utils is large enough without these compatibility functions.

Everything that is present in newer versions of Python (i.e. with dev Python it's just an import) goes into compat.py .
Everything else (i.e. youtube-dl-specific helpers) goes into utils.py .

											
										
										
											2014-11-02 10:23:40 +00:00
+								from ..compat import (
-												[vimeo] fix album extraction

closes #1933
closes #15704
closes #15855
closes #18967
closes #21986

											
										
										
											2019-08-03 09:29:20 +00:00
+								    compat_kwargs,
-												[vimeo] Add a better error message for embed-only videos (#2527)

											
										
										
											2014-03-08 11:24:43 +00:00
+								    compat_HTTPError,
-												[vimeo] Fix rented videos (Closes #9830)

											
										
										
											2016-06-18 20:56:01 +00:00
+								    compat_str,
-												[vimeo:likes] Support large like lists (Fixes #3847)

											
										
										
											2014-09-28 22:36:06 +00:00
+								    compat_urlparse,
-												[util] Move compatibility functions out of util

utils is large enough without these compatibility functions.

Everything that is present in newer versions of Python (i.e. with dev Python it's just an import) goes into compat.py .
Everything else (i.e. youtube-dl-specific helpers) goes into utils.py .

											
										
										
											2014-11-02 10:23:40 +00:00
+								)
 								from ..utils import (
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								    clean_html,
-												[vimeo] Check source file URL (Closes #8187)

											
										
										
											2016-01-08 21:06:09 +00:00
+								    determine_ext,
-												Move Vimeo into its own file

											
										
										
											2013-06-23 18:18:21 +00:00
+								    ExtractorError,
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								    get_element_by_class,
-												[vimeo] Detect source extension
and misc cleanup

Cherry-picked from #1477
Closes #1402

Authored by: flashdagger

											
										
										
											2021-11-05 20:45:08 +00:00
+								    HEADRequest,
-												[vimeo] Add support for VHX(Vimeo OTT)(#14835)

											
										
										
											2018-11-28 18:53:22 +00:00
+								    js_to_json,
-												[vimeo:likes] Support large like lists (Fixes #3847)

											
										
										
											2014-09-28 22:36:06 +00:00
+								    int_or_none,
-												[vimeo] Extract JSON LD (closes #16295)

											
										
										
											2018-04-27 19:48:20 +00:00
+								    merge_dicts,
-												[vimeo] fix album extraction

closes #1933
closes #15704
closes #15855
closes #18967
closes #21986

											
										
										
											2019-08-03 09:29:20 +00:00
+								    OnDemandPagedList,
-												[vimeo] Add support for VHX(Vimeo OTT)(#14835)

											
										
										
											2018-11-28 18:53:22 +00:00
+								    parse_filesize,
-												Update to ytdl v2021-04-01
https://github.com/ytdl-org/youtube-dl/commit/14f29f087e6097feb46bdb84878924bc410a57eb

Closes #205

											
										
										
											2021-04-01 08:28:33 +00:00
+								    parse_iso8601,
-												[utils] Add `parse_qs`

											
										
										
											2021-08-22 19:02:00 +00:00
+								    parse_qs,
-												Rename compat_urllib_request_Request to sanitized_Request and move to utils

											
										
										
											2015-11-20 14:33:49 +00:00
+								    sanitized_Request,
-												[vimeo] Prevent infinite loops if video password verification fails

We're seeing this in the tests¹ right now, which do not terminate.

¹  https://travis-ci.org/jaimeMF/youtube-dl/jobs/51135858

											
										
										
											2015-02-17 23:27:57 +00:00
+								    smuggle_url,
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								    str_or_none,
-												[vimeo] Extract upload timestamp

											
										
										
											2017-01-31 17:58:02 +00:00
+								    try_get,
 								    unified_timestamp,
-												[generic] Support embedded vimeo videos (#1602)

											
										
										
											2013-10-15 10:05:13 +00:00
+								    unsmuggle_url,
-												[vimeo] Fix logging in python 3.x

The POST data must be a bytes object.

											
										
										
											2014-04-24 12:44:27 +00:00
+								    urlencode_postdata,
-												[vimeo] Fix subtitles URLs (#24209)


											
										
										
											2020-03-02 18:27:40 +00:00
+								    urljoin,
-												[vimeo/generic] Move detection logic from GenericIE to VimeoIE

											
										
										
											2015-06-21 10:23:58 +00:00
+								    unescapeHTML,
-												[vimeo] Detect source extension
and misc cleanup

Cherry-picked from #1477
Closes #1402

Authored by: flashdagger

											
										
										
											2021-11-05 20:45:08 +00:00
+								    urlhandle_detect_ext,
-												Move Vimeo into its own file

											
										
										
											2013-06-23 18:18:21 +00:00
+								)
-												[vimeo] Better formatting for regexp

											
										
										
											2013-12-22 02:17:56 +00:00
-												[vimeo] Add an extractor for the watch later list (closes #2787)

											
										
										
											2014-04-24 19:51:20 +00:00
+								class VimeoBaseInfoExtractor(InfoExtractor):
 								    _NETRC_MACHINE = 'vimeo'
 								    _LOGIN_REQUIRED = False
-												[vimeo] Fix login (Closes #6488)

											
										
										
											2015-08-10 17:35:08 +00:00
+								    _LOGIN_URL = 'https://vimeo.com/log_in'
-												[vimeo] Add an extractor for the watch later list (closes #2787)

											
										
										
											2014-04-24 19:51:20 +00:00
 								    def _login(self):
-												remove unnecessary assignment parenthesis

											
										
										
											2018-05-26 15:12:44 +00:00
+								        username, password = self._get_login_info()
-												[vimeo] Add an extractor for the watch later list (closes #2787)

											
										
										
											2014-04-24 19:51:20 +00:00
+								        if username is None:
 								            if self._LOGIN_REQUIRED:
-												[vimeo] Some modernization and style fixes

											
										
										
											2014-05-04 20:27:56 +00:00
+								                raise ExtractorError('No login info available, needed for using %s.' % self.IE_NAME, expected=True)
-												[vimeo] Add an extractor for the watch later list (closes #2787)

											
										
										
											2014-04-24 19:51:20 +00:00
+								            return
-												[vimeo] Modernize login code and improve error messaging

											
										
										
											2018-03-05 15:45:47 +00:00
+								        webpage = self._download_webpage(
 								            self._LOGIN_URL, None, 'Downloading login page')
-												[vimeo] Fix password protected videos

											
										
										
											2015-10-10 20:31:37 +00:00
+								        token, vuid = self._extract_xsrft_and_vuid(webpage)
-												[vimeo] Modernize login code and improve error messaging

											
										
										
											2018-03-05 15:45:47 +00:00
+								        data = {
-												[vimeo] Fix login (Closes #6488)

											
										
										
											2015-08-10 17:35:08 +00:00
+								            'action': 'login',
-												[vimeo] Add an extractor for the watch later list (closes #2787)

											
										
										
											2014-04-24 19:51:20 +00:00
+								            'email': username,
 								            'password': password,
 								            'service': 'vimeo',
 								            'token': token,
-												[vimeo] Modernize login code and improve error messaging

											
										
										
											2018-03-05 15:45:47 +00:00
+								        }
-												[vimeo] Simplify set cookie

											
										
										
											2015-11-11 16:32:13 +00:00
+								        self._set_vimeo_cookie('vuid', vuid)
-												[vimeo] Modernize login code and improve error messaging

											
										
										
											2018-03-05 15:45:47 +00:00
+								        try:
 								            self._download_webpage(
 								                self._LOGIN_URL, None, 'Logging in',
 								                data=urlencode_postdata(data), headers={
 								                    'Content-Type': 'application/x-www-form-urlencoded',
 								                    'Referer': self._LOGIN_URL,
 								                })
 								        except ExtractorError as e:
 								            if isinstance(e.cause, compat_HTTPError) and e.cause.code == 418:
 								                raise ExtractorError(
 								                    'Unable to log in: bad username or password',
 								                    expected=True)
 								            raise ExtractorError('Unable to log in')
-												[vimeo] Add an extractor for the watch later list (closes #2787)

											
										
										
											2014-04-24 19:51:20 +00:00
-												Update to ytdl v2021-04-01
https://github.com/ytdl-org/youtube-dl/commit/14f29f087e6097feb46bdb84878924bc410a57eb

Closes #205

											
										
										
											2021-04-01 08:28:33 +00:00
+								    def _get_video_password(self):
-												[extractor] Add `write_debug` and `get_param`

											
										
										
											2021-05-17 12:23:08 +00:00
+								        password = self.get_param('videopassword')
-												[vimeo:review] Fix extraction for password-protected videos

Closes #9853

											
										
										
											2016-06-24 08:48:37 +00:00
+								        if password is None:
-												Update to ytdl v2021-04-01
https://github.com/ytdl-org/youtube-dl/commit/14f29f087e6097feb46bdb84878924bc410a57eb

Closes #205

											
										
										
											2021-04-01 08:28:33 +00:00
+								            raise ExtractorError(
 								                'This video is protected by a password, use the --video-password option',
 								                expected=True)
 								        return password
 								    def _verify_video_password(self, url, video_id, password, token, vuid):
-												[vimeo:review] Fix extraction for password-protected videos

Closes #9853

											
										
										
											2016-06-24 08:48:37 +00:00
+								        if url.startswith('http://'):
 								            # vimeo only supports https now, but the user can give an http url
 								            url = url.replace('http://', 'https://')
 								        self._set_vimeo_cookie('vuid', vuid)
 								        return self._download_webpage(
-												Update to ytdl v2021-04-01
https://github.com/ytdl-org/youtube-dl/commit/14f29f087e6097feb46bdb84878924bc410a57eb

Closes #205

											
										
										
											2021-04-01 08:28:33 +00:00
+								            url + '/password', video_id, 'Verifying the password',
 								            'Wrong password', data=urlencode_postdata({
 								                'password': password,
 								                'token': token,
 								            }), headers={
 								                'Content-Type': 'application/x-www-form-urlencoded',
 								                'Referer': url,
 								            })
-												[vimeo:review] Fix extraction for password-protected videos

Closes #9853

											
										
										
											2016-06-24 08:48:37 +00:00
-												[vimeo] Fix password protected videos

											
										
										
											2015-10-10 20:31:37 +00:00
+								    def _extract_xsrft_and_vuid(self, webpage):
 								        xsrft = self._search_regex(
-												[vimeo] Fix authentication (Closes #8520)

											
										
										
											2016-02-11 21:16:26 +00:00
+								            r'(?:(?P<q1>["\'])xsrft(?P=q1)\s*:|xsrft\s*[=:])\s*(?P<q>["\'])(?P<xsrft>.+?)(?P=q)',
-												[vimeo] Fix login (Closes #6488)

											
										
										
											2015-08-10 17:35:08 +00:00
+								            webpage, 'login token', group='xsrft')
-												[vimeo] Fix password protected videos

											
										
										
											2015-10-10 20:31:37 +00:00
+								        vuid = self._search_regex(
 								            r'["\']vuid["\']\s*:\s*(["\'])(?P<vuid>.+?)\1',
 								            webpage, 'vuid', group='vuid')
 								        return xsrft, vuid
-												[vimeo] Fix login (Closes #6488)

											
										
										
											2015-08-10 17:35:08 +00:00
-												[vimeo] fix album extraction

closes #1933
closes #15704
closes #15855
closes #18967
closes #21986

											
										
										
											2019-08-03 09:29:20 +00:00
+								    def _extract_vimeo_config(self, webpage, video_id, *args, **kwargs):
 								        vimeo_config = self._search_regex(
 								            r'vimeo\.config\s*=\s*(?:({.+?})|_extend\([^,]+,\s+({.+?})\));',
 								            webpage, 'vimeo config', *args, **compat_kwargs(kwargs))
 								        if vimeo_config:
 								            return self._parse_json(vimeo_config, video_id)
-												[vimeo] Simplify set cookie

											
										
										
											2015-11-11 16:32:13 +00:00
+								    def _set_vimeo_cookie(self, name, value):
 								        self._set_cookie('vimeo.com', name, value)
-												[vimeo] Fix extraction for VimeoReview videos

											
										
										
											2016-06-11 13:35:08 +00:00
+								    def _vimeo_sort_formats(self, formats):
-												[vimeo] Sort http formats higher
Closes #1821

											
										
										
											2021-11-28 10:54:02 +00:00
+								        # Note: Bitrates are completely broken. Single m3u8 may contain entries in kbps and bps
 								        # at the same time without actual units specified.
 								        self._sort_formats(formats, ('quality', 'res', 'fps', 'hdr:12', 'source'))
-												[vimeo] Fix extraction for VimeoReview videos

											
										
										
											2016-06-11 13:35:08 +00:00
 								    def _parse_config(self, config, video_id):
-												[vimeo] fix extraction for hls formats and add support for dash formats(closes #11490)

											
										
										
											2016-12-20 11:25:05 +00:00
+								        video_data = config['video']
 								        video_title = video_data['title']
-												[vimeo] extract live archive source format(#19144)

											
										
										
											2019-04-21 20:05:58 +00:00
+								        live_event = video_data.get('live_event') or {}
 								        is_live = live_event.get('status') == 'started'
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								        request = config.get('request') or {}
-												[vimeo] Fix extraction for VimeoReview videos

											
										
										
											2016-06-11 13:35:08 +00:00
 								        formats = []
-												[extractor] Extract subtitles from manifests for more sites (#2686)

vimeo, globo, kaltura, svt

Authored by: fstirlitz 
											
										
										
											2022-02-11 19:03:33 +00:00
+								        subtitles = {}
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								        config_files = video_data.get('files') or request.get('files') or {}
 								        for f in (config_files.get('progressive') or []):
-												[vimeo] Fix extraction for VimeoReview videos

											
										
										
											2016-06-11 13:35:08 +00:00
+								            video_url = f.get('url')
 								            if not video_url:
 								                continue
 								            formats.append({
 								                'url': video_url,
 								                'format_id': 'http-%s' % f.get('quality'),
-												[vimeo] Sort http formats higher
Closes #1821

											
										
										
											2021-11-28 10:54:02 +00:00
+								                'source_preference': 10,
-												[vimeo] Fix extraction for VimeoReview videos

											
										
										
											2016-06-11 13:35:08 +00:00
+								                'width': int_or_none(f.get('width')),
 								                'height': int_or_none(f.get('height')),
 								                'fps': int_or_none(f.get('fps')),
 								                'tbr': int_or_none(f.get('bitrate')),
 								            })
-												[vimeo] fix extraction for hls formats and add support for dash formats(closes #11490)

											
										
										
											2016-12-20 11:25:05 +00:00
-												[vimeo] extract live archive source format(#19144)

											
										
										
											2019-04-21 20:05:58 +00:00
+								        # TODO: fix handling of 308 status code returned for live archive manifest requests
-												[vimeo] improve format extraction and sorting(closes #25285)

											
										
										
											2020-05-15 14:57:06 +00:00
+								        sep_pattern = r'/sep/video/'
-												[vimeo] fix extraction for hls formats and add support for dash formats(closes #11490)

											
										
										
											2016-12-20 11:25:05 +00:00
+								        for files_type in ('hls', 'dash'):
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								            for cdn_name, cdn_data in (try_get(config_files, lambda x: x[files_type]['cdns']) or {}).items():
-												[vimeo] fix extraction for hls formats and add support for dash formats(closes #11490)

											
										
										
											2016-12-20 11:25:05 +00:00
+								                manifest_url = cdn_data.get('url')
 								                if not manifest_url:
 								                    continue
 								                format_id = '%s-%s' % (files_type, cdn_name)
-												[vimeo] improve format extraction and sorting(closes #25285)

											
										
										
											2020-05-15 14:57:06 +00:00
+								                sep_manifest_urls = []
 								                if re.search(sep_pattern, manifest_url):
 								                    for suffix, repl in (('', 'video'), ('_sep', 'sep/video')):
 								                        sep_manifest_urls.append((format_id + suffix, re.sub(
 								                            sep_pattern, '/%s/' % repl, manifest_url)))
 								                else:
 								                    sep_manifest_urls = [(format_id, manifest_url)]
 								                for f_id, m_url in sep_manifest_urls:
 								                    if files_type == 'hls':
-												[extractor] Extract subtitles from manifests for more sites (#2686)

vimeo, globo, kaltura, svt

Authored by: fstirlitz 
											
										
										
											2022-02-11 19:03:33 +00:00
+								                        fmts, subs = self._extract_m3u8_formats_and_subtitles(
-												[cleanup] Don't pass protocol to `_extract_m3u8_formats` for live videos

`live` parameter already handles changing the protocol

											
										
										
											2022-03-02 17:29:01 +00:00
+								                            m_url, video_id, 'mp4', live=is_live, m3u8_id=f_id,
-												[vimeo] improve format extraction and sorting(closes #25285)

											
										
										
											2020-05-15 14:57:06 +00:00
+								                            note='Downloading %s m3u8 information' % cdn_name,
-												[extractor] Extract subtitles from manifests for more sites (#2686)

vimeo, globo, kaltura, svt

Authored by: fstirlitz 
											
										
										
											2022-02-11 19:03:33 +00:00
+								                            fatal=False)
 								                        formats.extend(fmts)
 								                        self._merge_subtitles(subs, target=subtitles)
-												[vimeo] improve format extraction and sorting(closes #25285)

											
										
										
											2020-05-15 14:57:06 +00:00
+								                    elif files_type == 'dash':
-												[vimeo] add support live streams and improve info extraction(closes #19144)

											
										
										
											2019-04-21 16:20:28 +00:00
+								                        if 'json=1' in m_url:
 								                            real_m_url = (self._download_json(m_url, video_id, fatal=False) or {}).get('url')
 								                            if real_m_url:
 								                                m_url = real_m_url
-												[extractor] Extract subtitles from manifests for more sites (#2686)

vimeo, globo, kaltura, svt

Authored by: fstirlitz 
											
										
										
											2022-02-11 19:03:33 +00:00
+								                        fmts, subs = self._extract_mpd_formats_and_subtitles(
-												[vimeo] extract both mixed and separated dash formats

											
										
										
											2017-01-31 13:47:56 +00:00
+								                            m_url.replace('/master.json', '/master.mpd'), video_id, f_id,
 								                            'Downloading %s MPD information' % cdn_name,
-												[vimeo] Fix formats' sorting (closes #13189)

											
										
										
											2017-05-24 15:58:16 +00:00
+								                            fatal=False)
-												[extractor] Extract subtitles from manifests for more sites (#2686)

vimeo, globo, kaltura, svt

Authored by: fstirlitz 
											
										
										
											2022-02-11 19:03:33 +00:00
+								                        formats.extend(fmts)
 								                        self._merge_subtitles(subs, target=subtitles)
-												[vimeo] Fix extraction for VimeoReview videos

											
										
										
											2016-06-11 13:35:08 +00:00
-												[vimeo] extract live archive source format(#19144)

											
										
										
											2019-04-21 20:05:58 +00:00
+								        live_archive = live_event.get('archive') or {}
 								        live_archive_source_url = live_archive.get('source_url')
 								        if live_archive_source_url and live_archive.get('status') == 'done':
 								            formats.append({
 								                'format_id': 'live-archive-source',
 								                'url': live_archive_source_url,
-												[formatsort] Remove misuse of 'preference'

'preference' is to be used only when the format is better that ALL qualities of a lower preference irrespective of ANY sorting order the user requests. See deezer.py for correct use of this

In the older sorting method, `preference`, `quality` and `language_preference` were functionally almost equivalent. So these disparities doesn't really matter there

Also, despite what the documentation says, the default for `preference` was actually 0 and not -1. I have tried to correct this and also account for it when converting `preference` to `quality`

											
										
										
											2021-02-18 22:03:16 +00:00
+								                'quality': 10,
-												[vimeo] extract live archive source format(#19144)

											
										
										
											2019-04-21 20:05:58 +00:00
+								            })
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								        for tt in (request.get('text_tracks') or []):
-												[extractor] Extract subtitles from manifests for more sites (#2686)

vimeo, globo, kaltura, svt

Authored by: fstirlitz 
											
										
										
											2022-02-11 19:03:33 +00:00
+								            subtitles.setdefault(tt['lang'], []).append({
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								                'ext': 'vtt',
 								                'url': urljoin('https://vimeo.com', tt['url']),
-												[extractor] Extract subtitles from manifests for more sites (#2686)

vimeo, globo, kaltura, svt

Authored by: fstirlitz 
											
										
										
											2022-02-11 19:03:33 +00:00
+								            })
-												[vimeo] Fix extraction for VimeoReview videos

											
										
										
											2016-06-11 13:35:08 +00:00
-												[vimeo] add support live streams and improve info extraction(closes #19144)

											
										
										
											2019-04-21 16:20:28 +00:00
+								        thumbnails = []
 								        if not is_live:
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								            for key, thumb in (video_data.get('thumbs') or {}).items():
-												[vimeo] add support live streams and improve info extraction(closes #19144)

											
										
										
											2019-04-21 16:20:28 +00:00
+								                thumbnails.append({
 								                    'id': key,
 								                    'width': int_or_none(key),
 								                    'url': thumb,
 								                })
 								            thumbnail = video_data.get('thumbnail')
 								            if thumbnail:
 								                thumbnails.append({
 								                    'url': thumbnail,
 								                })
 								        owner = video_data.get('owner') or {}
 								        video_uploader_url = owner.get('url')
-												[vimeo] Extract chapters
Closes #1892

											
										
										
											2021-12-05 14:22:34 +00:00
+								        duration = int_or_none(video_data.get('duration'))
 								        chapter_data = try_get(config, lambda x: x['embed']['chapters']) or []
 								        chapters = [{
 								            'title': current_chapter.get('title'),
 								            'start_time': current_chapter.get('timecode'),
 								            'end_time': next_chapter.get('timecode'),
 								        } for current_chapter, next_chapter in zip(chapter_data, chapter_data[1:] + [{'timecode': duration}])]
 								        if chapters and chapters[0]['start_time']:  # Chapters may not start from 0
 								            chapters[:0] = [{'title': '<Untitled>', 'start_time': 0, 'end_time': chapters[0]['start_time']}]
-												[vimeo] Fix extraction for VimeoReview videos

											
										
										
											2016-06-11 13:35:08 +00:00
+								        return {
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								            'id': str_or_none(video_data.get('id')) or video_id,
-												[extractor] Standardize `_live_title`

											
										
										
											2021-12-15 16:00:46 +00:00
+								            'title': video_title,
-												[vimeo] add support live streams and improve info extraction(closes #19144)

											
										
										
											2019-04-21 16:20:28 +00:00
+								            'uploader': owner.get('name'),
 								            'uploader_id': video_uploader_url.split('/')[-1] if video_uploader_url else None,
-												[vimeo] Fix extraction for VimeoReview videos

											
										
										
											2016-06-11 13:35:08 +00:00
+								            'uploader_url': video_uploader_url,
-												[vimeo] add support live streams and improve info extraction(closes #19144)

											
										
										
											2019-04-21 16:20:28 +00:00
+								            'thumbnails': thumbnails,
-												[vimeo] Extract chapters
Closes #1892

											
										
										
											2021-12-05 14:22:34 +00:00
+								            'duration': duration,
 								            'chapters': chapters or None,
-												[vimeo] Fix extraction for VimeoReview videos

											
										
										
											2016-06-11 13:35:08 +00:00
+								            'formats': formats,
 								            'subtitles': subtitles,
-												[vimeo] add support live streams and improve info extraction(closes #19144)

											
										
										
											2019-04-21 16:20:28 +00:00
+								            'is_live': is_live,
-												[vimeo] Fix extraction for VimeoReview videos

											
										
										
											2016-06-11 13:35:08 +00:00
+								        }
-												Update to ytdl-commit-cf2dbec
https://github.com/ytdl-org/youtube-dl/commit/cf2dbec6301177a1fddf72862de05fa912d9869d

Except: [kakao] improve info extraction and detect geo restriction
https://github.com/ytdl-org/youtube-dl/commit/d8085580f63ad3b146a31712ff76cf41d5a4558a

											
										
										
											2021-02-19 20:44:36 +00:00
+								    def _extract_original_format(self, url, video_id, unlisted_hash=None):
 								        query = {'action': 'load_download_config'}
 								        if unlisted_hash:
 								            query['unlisted_hash'] = unlisted_hash
-												[vimeo:review] improve config url extraction and extract original format(closes #20305)

											
										
										
											2019-03-10 14:03:32 +00:00
+								        download_data = self._download_json(
-												Update to ytdl-commit-cf2dbec
https://github.com/ytdl-org/youtube-dl/commit/cf2dbec6301177a1fddf72862de05fa912d9869d

Except: [kakao] improve info extraction and detect geo restriction
https://github.com/ytdl-org/youtube-dl/commit/d8085580f63ad3b146a31712ff76cf41d5a4558a

											
										
										
											2021-02-19 20:44:36 +00:00
+								            url, video_id, fatal=False, query=query,
-												[vimeo] Detect source extension
and misc cleanup

Cherry-picked from #1477
Closes #1402

Authored by: flashdagger

											
										
										
											2021-11-05 20:45:08 +00:00
+								            headers={'X-Requested-With': 'XMLHttpRequest'},
 								            expected_status=(403, 404)) or {}
 								        source_file = download_data.get('source_file')
 								        download_url = try_get(source_file, lambda x: x['download_url'])
 								        if download_url and not source_file.get('is_cold') and not source_file.get('is_defrosting'):
 								            source_name = source_file.get('public_name', 'Original')
 								            if self._is_valid_url(download_url, video_id, '%s video' % source_name):
 								                ext = (try_get(
 								                    source_file, lambda x: x['extension'],
 								                    compat_str) or determine_ext(
 								                    download_url, None) or 'mp4').lower()
 								                return {
 								                    'url': download_url,
 								                    'ext': ext,
 								                    'width': int_or_none(source_file.get('width')),
 								                    'height': int_or_none(source_file.get('height')),
 								                    'filesize': parse_filesize(source_file.get('size')),
 								                    'format_id': source_name,
 								                    'quality': 1,
 								                }
-												[vimeo:review] improve config url extraction and extract original format(closes #20305)

											
										
										
											2019-03-10 14:03:32 +00:00
-												[Vimeo] Better extraction of original file (#599)

Authored by: Ashish0804
											
										
										
											2021-08-02 01:53:12 +00:00
+								        jwt_response = self._download_json(
 								            'https://vimeo.com/_rv/viewer', video_id, note='Downloading jwt token', fatal=False) or {}
 								        if not jwt_response.get('jwt'):
 								            return
 								        headers = {'Authorization': 'jwt %s' % jwt_response['jwt']}
 								        original_response = self._download_json(
 								            f'https://api.vimeo.com/videos/{video_id}', video_id,
-												[vimeo] Detect source extension
and misc cleanup

Cherry-picked from #1477
Closes #1402

Authored by: flashdagger

											
										
										
											2021-11-05 20:45:08 +00:00
+								            headers=headers, fatal=False, expected_status=(403, 404)) or {}
 								        for download_data in original_response.get('download') or []:
-												[Vimeo] Better extraction of original file (#599)

Authored by: Ashish0804
											
										
										
											2021-08-02 01:53:12 +00:00
+								            download_url = download_data.get('link')
 								            if not download_url or download_data.get('quality') != 'source':
 								                continue
-												[vimeo] Detect source extension
and misc cleanup

Cherry-picked from #1477
Closes #1402

Authored by: flashdagger

											
										
										
											2021-11-05 20:45:08 +00:00
+								            ext = determine_ext(parse_qs(download_url).get('filename', [''])[0].lower(), default_ext=None)
 								            if not ext:
 								                urlh = self._request_webpage(
 								                    HEADRequest(download_url), video_id, fatal=False, note='Determining source extension')
 								                ext = urlh and urlhandle_detect_ext(urlh)
-												[Vimeo] Better extraction of original file (#599)

Authored by: Ashish0804
											
										
										
											2021-08-02 01:53:12 +00:00
+								            return {
 								                'url': download_url,
-												[vimeo] Detect source extension
and misc cleanup

Cherry-picked from #1477
Closes #1402

Authored by: flashdagger

											
										
										
											2021-11-05 20:45:08 +00:00
+								                'ext': ext or 'unknown_video',
-												[Vimeo] Better extraction of original file (#599)

Authored by: Ashish0804
											
										
										
											2021-08-02 01:53:12 +00:00
+								                'format_id': download_data.get('public_name', 'Original'),
 								                'width': int_or_none(download_data.get('width')),
 								                'height': int_or_none(download_data.get('height')),
 								                'fps': int_or_none(download_data.get('fps')),
 								                'filesize': int_or_none(download_data.get('size')),
 								                'quality': 1,
 								            }
-												[vimeo] Add an extractor for the watch later list (closes #2787)

											
										
										
											2014-04-24 19:51:20 +00:00
-												[vimeo] Convert to new subtitles system

Removed some tests, the behaviour should be checked in a test for the YoutubeDL class

											
										
										
											2015-02-15 17:52:07 +00:00
+								class VimeoIE(VimeoBaseInfoExtractor):
-												Move Vimeo into its own file

											
										
										
											2013-06-23 18:18:21 +00:00
+								    """Information extractor for vimeo.com."""
 								    # _VALID_URL matches Vimeo URLs
-												[vimeo] Better formatting for regexp

											
										
										
											2013-12-22 02:17:56 +00:00
+								    _VALID_URL = r'''(?x)
-												[vimeo:ondemand] Separate ondemand extractor (Closes #8330, closes #8801)

											
										
										
											2016-03-09 18:51:07 +00:00
+								                    https?://
 								                        (?:
 								                            (?:
 								                                www|
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								                                player
-												[vimeo:ondemand] Separate ondemand extractor (Closes #8330, closes #8801)

											
										
										
											2016-03-09 18:51:07 +00:00
+								                            )
 								                            \.
 								                        )?
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								                        vimeo(?:pro)?\.com/
-												[vimeo] fix album extraction

closes #1933
closes #15704
closes #15855
closes #18967
closes #21986

											
										
										
											2019-08-03 09:29:20 +00:00
+								                        (?!(?:channels|album|showcase)/[^/?#]+/?(?:$|[?#])|[^/]+/review/|ondemand/)
-												[vimeo] Fix ondemand videos and direct URLs with hash
Closes #1353, #1471

											
										
										
											2021-11-05 20:24:05 +00:00
+								                        (?:[^/]+/)*?
-												[vimeo:ondemand] Separate ondemand extractor (Closes #8330, closes #8801)

											
										
										
											2016-03-09 18:51:07 +00:00
+								                        (?:
 								                            (?:
 								                                play_redirect_hls|
 								                                moogaloop\.swf)\?clip_id=
 								                            )?
 								                        (?:videos?/)?
 								                        (?P<id>[0-9]+)
-												Update to ytdl v2021-04-01
https://github.com/ytdl-org/youtube-dl/commit/14f29f087e6097feb46bdb84878924bc410a57eb

Closes #205

											
										
										
											2021-04-01 08:28:33 +00:00
+								                        (?:/(?P<unlisted_hash>[\da-f]{10}))?
-												[vimeo:ondemand] Separate ondemand extractor (Closes #8330, closes #8801)

											
										
										
											2016-03-09 18:51:07 +00:00
+								                        /?(?:[?&].*)?(?:[#].*)?$
 								                    '''
-												[vimeo] Use unicode_literals

											
										
										
											2014-01-06 22:38:16 +00:00
+								    IE_NAME = 'vimeo'
-												[vimeo] extract information for Vimeo Pro videos from http://player.vimeo.com/video/{video_id} (fixes #1197)

For some videos https://vimeo.com/{video_id} doesn't work

											
										
										
											2013-08-21 11:48:19 +00:00
+								    _TESTS = [
 								        {
-												[vimeo] Use unicode_literals

											
										
										
											2014-01-06 22:38:16 +00:00
+								            'url': 'http://vimeo.com/56015672#at=0',
 								            'md5': '8879b6cc097e987f02484baf890129e5',
 								            'info_dict': {
-												[vimeo] Modernize test definition

											
										
										
											2014-02-17 10:44:24 +00:00
+								                'id': '56015672',
 								                'ext': 'mp4',
-												renaming issues resolved


											
										
										
											2020-09-02 20:37:35 +00:00
+								                'title': "youtube-dl test video - \u2605 \" ' \u5e78 / \\ \u00e4 \u21ad \U0001d550",
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								                'description': 'md5:2d3305bad981a06ff79f027f19865021',
-												[vimeo] Extract upload timestamp

											
										
										
											2017-01-31 17:58:02 +00:00
+								                'timestamp': 1355990239,
-												[vimeo] Update tests

											
										
										
											2015-10-10 20:22:42 +00:00
+								                'upload_date': '20121220',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											2017-01-02 12:08:07 +00:00
+								                'uploader_url': r're:https?://(?:www\.)?vimeo\.com/user7108434',
-												[vimeo] Update tests

											
										
										
											2015-10-10 20:22:42 +00:00
+								                'uploader_id': 'user7108434',
 								                'uploader': 'Filippo Valsorda',
 								                'duration': 10,
-												[vimeo] Extract license (closes #11880)

											
										
										
											2017-01-31 17:49:28 +00:00
+								                'license': 'by-sa',
-												[vimeo] extract information for Vimeo Pro videos from http://player.vimeo.com/video/{video_id} (fixes #1197)

For some videos https://vimeo.com/{video_id} doesn't work

											
										
										
											2013-08-21 11:48:19 +00:00
+								            },
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								            'params': {
 								                'format': 'best[protocol=https]',
 								            },
-												[vimeo] extract information for Vimeo Pro videos from http://player.vimeo.com/video/{video_id} (fixes #1197)

For some videos https://vimeo.com/{video_id} doesn't work

											
										
										
											2013-08-21 11:48:19 +00:00
+								        },
 								        {
-												[vimeo] Use unicode_literals

											
										
										
											2014-01-06 22:38:16 +00:00
+								            'url': 'http://vimeopro.com/openstreetmapus/state-of-the-map-us-2013/video/68093876',
 								            'md5': '3b5ca6aa22b60dfeeadf50b72e44ed82',
 								            'note': 'Vimeo Pro video (#1197)',
 								            'info_dict': {
-												[vimeo] Some modernization and style fixes

											
										
										
											2014-05-04 20:27:56 +00:00
+								                'id': '68093876',
 								                'ext': 'mp4',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											2017-01-02 12:08:07 +00:00
+								                'uploader_url': r're:https?://(?:www\.)?vimeo\.com/openstreetmapus',
-												[vimeo] Use unicode_literals

											
										
										
											2014-01-06 22:38:16 +00:00
+								                'uploader_id': 'openstreetmapus',
 								                'uploader': 'OpenStreetMap US',
 								                'title': 'Andy Allan - Putting the Carto into OpenStreetMap Cartography',
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								                'description': 'md5:2c362968038d4499f4d79f88458590c1',
-												[vimeo] Add video duration extraction(Closes #2876)

											
										
										
											2014-05-09 18:46:40 +00:00
+								                'duration': 1595,
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								                'upload_date': '20130610',
 								                'timestamp': 1370893156,
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								                'license': 'by',
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								            },
 								            'params': {
 								                'format': 'best[protocol=https]',
-												[vimeo] extract information for Vimeo Pro videos from http://player.vimeo.com/video/{video_id} (fixes #1197)

For some videos https://vimeo.com/{video_id} doesn't work

											
										
										
											2013-08-21 11:48:19 +00:00
+								            },
 								        },
-												[vimeo] add support for videos that embed the download url in the player page (fixes #1364)

											
										
										
											2013-09-03 08:48:56 +00:00
+								        {
-												[vimeo] Use unicode_literals

											
										
										
											2014-01-06 22:38:16 +00:00
+								            'url': 'http://player.vimeo.com/video/54469442',
 								            'md5': '619b811a4417aa4abe78dc653becf511',
 								            'note': 'Videos that embed the url in the player page',
 								            'info_dict': {
-												[vimeo] Some modernization and style fixes

											
										
										
											2014-05-04 20:27:56 +00:00
+								                'id': '54469442',
 								                'ext': 'mp4',
-												[vimeo] Update test description

											
										
										
											2014-07-21 11:11:24 +00:00
+								                'title': 'Kathy Sierra: Building the minimum Badass User, Business of Software 2012',
-												Update to ytdl v2021-04-01
https://github.com/ytdl-org/youtube-dl/commit/14f29f087e6097feb46bdb84878924bc410a57eb

Closes #205

											
										
										
											2021-04-01 08:28:33 +00:00
+								                'uploader': 'Business of Software',
 								                'uploader_url': r're:https?://(?:www\.)?vimeo\.com/businessofsoftware',
 								                'uploader_id': 'businessofsoftware',
-												[vimeo] Add video duration extraction(Closes #2876)

											
										
										
											2014-05-09 18:46:40 +00:00
+								                'duration': 3610,
-												[vimeo] Fix description extraction

											
										
										
											2014-09-29 20:23:21 +00:00
+								                'description': None,
-												[vimeo] add support for videos that embed the download url in the player page (fixes #1364)

											
										
										
											2013-09-03 08:48:56 +00:00
+								            },
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								            'params': {
 								                'format': 'best[protocol=https]',
 								            },
-												[vimeo] fix the extraction for videos protected with password

Added a test video.

											
										
										
											2013-10-23 14:31:53 +00:00
+								        },
 								        {
-												[vimeo] Use unicode_literals

											
										
										
											2014-01-06 22:38:16 +00:00
+								            'url': 'http://vimeo.com/68375962',
 								            'md5': 'aaf896bdb7ddd6476df50007a0ac0ae7',
 								            'note': 'Video protected with password',
 								            'info_dict': {
-												[vimeo] Some modernization and style fixes

											
										
										
											2014-05-04 20:27:56 +00:00
+								                'id': '68375962',
 								                'ext': 'mp4',
-												renaming issues resolved


											
										
										
											2020-09-02 20:37:35 +00:00
+								                'title': 'youtube-dl password protected test video',
-												[vimeo] Extract upload timestamp

											
										
										
											2017-01-31 17:58:02 +00:00
+								                'timestamp': 1371200155,
-												[vimeo] Use unicode_literals

											
										
										
											2014-01-06 22:38:16 +00:00
+								                'upload_date': '20130614',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											2017-01-02 12:08:07 +00:00
+								                'uploader_url': r're:https?://(?:www\.)?vimeo\.com/user18948128',
-												[vimeo] Use unicode_literals

											
										
										
											2014-01-06 22:38:16 +00:00
+								                'uploader_id': 'user18948128',
 								                'uploader': 'Jaime Marquínez Ferrándiz',
-												[vimeo] Add video duration extraction(Closes #2876)

											
										
										
											2014-05-09 18:46:40 +00:00
+								                'duration': 10,
-												[vimeo] Fix tests

											
										
										
											2017-01-11 15:57:08 +00:00
+								                'description': 'md5:dca3ea23adb29ee387127bc4ddfce63f',
-												[vimeo] fix the extraction for videos protected with password

Added a test video.

											
										
										
											2013-10-23 14:31:53 +00:00
+								            },
-												[vimeo] Use unicode_literals

											
										
										
											2014-01-06 22:38:16 +00:00
+								            'params': {
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								                'format': 'best[protocol=https]',
-												renaming issues resolved


											
										
										
											2020-09-02 20:37:35 +00:00
+								                'videopassword': 'youtube-dl',
-												[vimeo] fix the extraction for videos protected with password

Added a test video.

											
										
										
											2013-10-23 14:31:53 +00:00
+								            },
 								        },
-												[vimeo] Use original URL when for standard vimeo.com links (Closes #3428)

Some videos that are freely accessible without password via the original URL (e.g. http://vimeo.com/channels/keypeele/75629013)
ask for password when accessed via http://vimeo.com/<video_id>.

											
										
										
											2014-08-03 17:04:47 +00:00
+								        {
 								            'url': 'http://vimeo.com/channels/keypeele/75629013',
 								            'md5': '2f86a05afe9d7abc0b9126d229bbe15d',
 								            'info_dict': {
 								                'id': '75629013',
 								                'ext': 'mp4',
 								                'title': 'Key & Peele: Terrorist Interrogation',
 								                'description': 'md5:8678b246399b070816b12313e8b4eb5c',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											2017-01-02 12:08:07 +00:00
+								                'uploader_url': r're:https?://(?:www\.)?vimeo\.com/atencio',
-												[vimeo] Use original URL when for standard vimeo.com links (Closes #3428)

Some videos that are freely accessible without password via the original URL (e.g. http://vimeo.com/channels/keypeele/75629013)
ask for password when accessed via http://vimeo.com/<video_id>.

											
										
										
											2014-08-03 17:04:47 +00:00
+								                'uploader_id': 'atencio',
 								                'uploader': 'Peter Atencio',
-												[vimeo] Extract channel meta fields

											
										
										
											2018-09-14 18:24:48 +00:00
+								                'channel_id': 'keypeele',
 								                'channel_url': r're:https?://(?:www\.)?vimeo\.com/channels/keypeele',
-												[vimeo] Extract upload timestamp

											
										
										
											2017-01-31 17:58:02 +00:00
+								                'timestamp': 1380339469,
 								                'upload_date': '20130928',
-												[vimeo] Use original URL when for standard vimeo.com links (Closes #3428)

Some videos that are freely accessible without password via the original URL (e.g. http://vimeo.com/channels/keypeele/75629013)
ask for password when accessed via http://vimeo.com/<video_id>.

											
										
										
											2014-08-03 17:04:47 +00:00
+								                'duration': 187,
 								            },
-												[vimeo] Detect source extension
and misc cleanup

Cherry-picked from #1477
Closes #1402

Authored by: flashdagger

											
										
										
											2021-11-05 20:45:08 +00:00
+								            'params': {'format': 'http-1080p'},
-												[vimeo] Use original URL when for standard vimeo.com links (Closes #3428)

Some videos that are freely accessible without password via the original URL (e.g. http://vimeo.com/channels/keypeele/75629013)
ask for password when accessed via http://vimeo.com/<video_id>.

											
										
										
											2014-08-03 17:04:47 +00:00
+								        },
-												[vimeo] Add support for subtitles (Closes #2239)
											
										
										
											2014-02-03 13:02:58 +00:00
+								        {
 								            'url': 'http://vimeo.com/76979871',
 								            'note': 'Video with subtitles',
 								            'info_dict': {
 								                'id': '76979871',
 								                'ext': 'mp4',
 								                'title': 'The New Vimeo Player (You Know, For Videos)',
 								                'description': 'md5:2ec900bf97c3f389378a96aee11260ea',
-												[vimeo] Extract upload timestamp

											
										
										
											2017-01-31 17:58:02 +00:00
+								                'timestamp': 1381846109,
-												[vimeo] Add support for subtitles (Closes #2239)
											
										
										
											2014-02-03 13:02:58 +00:00
+								                'upload_date': '20131015',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											2017-01-02 12:08:07 +00:00
+								                'uploader_url': r're:https?://(?:www\.)?vimeo\.com/staff',
-												[vimeo] Add support for subtitles (Closes #2239)
											
										
										
											2014-02-03 13:02:58 +00:00
+								                'uploader_id': 'staff',
 								                'uploader': 'Vimeo Staff',
-												[vimeo] Add video duration extraction(Closes #2876)

											
										
										
											2014-05-09 18:46:40 +00:00
+								                'duration': 62,
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								                'subtitles': {
 								                    'de': [{'ext': 'vtt'}],
 								                    'en': [{'ext': 'vtt'}],
 								                    'es': [{'ext': 'vtt'}],
 								                    'fr': [{'ext': 'vtt'}],
 								                },
-												[vimeo] Detect source extension
and misc cleanup

Cherry-picked from #1477
Closes #1402

Authored by: flashdagger

											
										
										
											2021-11-05 20:45:08 +00:00
+								            },
 								            'expected_warnings': ['Ignoring subtitle tracks found in the HLS manifest'],
-												[vimeo] Add support for subtitles (Closes #2239)
											
										
										
											2014-02-03 13:02:58 +00:00
+								        },
-												[vimeo] Improve regex for the config js dict (fixes #3955, fixes #3974)

The javascript code contains assignments of empty dicts with the same variable name

											
										
										
											2014-10-17 13:49:16 +00:00
+								        {
 								            # from https://www.ouya.tv/game/Pier-Solar-and-the-Great-Architects/
 								            'url': 'https://player.vimeo.com/video/98044508',
 								            'note': 'The js code contains assignments to the same variable as the config',
 								            'info_dict': {
 								                'id': '98044508',
 								                'ext': 'mp4',
 								                'title': 'Pier Solar OUYA Official Trailer',
 								                'uploader': 'Tulio Gonçalves',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											2017-01-02 12:08:07 +00:00
+								                'uploader_url': r're:https?://(?:www\.)?vimeo\.com/user28849593',
-												[vimeo] Improve regex for the config js dict (fixes #3955, fixes #3974)

The javascript code contains assignments of empty dicts with the same variable name

											
										
										
											2014-10-17 13:49:16 +00:00
+								                'uploader_id': 'user28849593',
 								            },
 								        },
-												[vimeo] add test for original format

											
										
										
											2015-12-16 16:00:17 +00:00
+								        {
 								            # contains original format
 								            'url': 'https://vimeo.com/33951933',
-												[vimeo] Fix tests

											
										
										
											2017-01-11 15:57:08 +00:00
+								            'md5': '53c688fa95a55bf4b7293d37a89c5c53',
-												[vimeo] add test for original format

											
										
										
											2015-12-16 16:00:17 +00:00
+								            'info_dict': {
 								                'id': '33951933',
 								                'ext': 'mp4',
 								                'title': 'FOX CLASSICS - Forever Classic ID - A Full Minute',
 								                'uploader': 'The DMCI',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											2017-01-02 12:08:07 +00:00
+								                'uploader_url': r're:https?://(?:www\.)?vimeo\.com/dmci',
-												[vimeo] add test for original format

											
										
										
											2015-12-16 16:00:17 +00:00
+								                'uploader_id': 'dmci',
-												[vimeo] Extract upload timestamp

											
										
										
											2017-01-31 17:58:02 +00:00
+								                'timestamp': 1324343742,
-												[vimeo] add test for original format

											
										
										
											2015-12-16 16:00:17 +00:00
+								                'upload_date': '20111220',
 								                'description': 'md5:ae23671e82d05415868f7ad1aec21147',
 								            },
 								        },
-												[Vimeo] Better extraction of original file (#599)

Authored by: Ashish0804
											
										
										
											2021-08-02 01:53:12 +00:00
+								        {
 								            'note': 'Contains original format not accessible in webpage',
 								            'url': 'https://vimeo.com/393756517',
 								            'md5': 'c464af248b592190a5ffbb5d33f382b0',
 								            'info_dict': {
 								                'id': '393756517',
 								                'ext': 'mov',
 								                'timestamp': 1582642091,
 								                'uploader_id': 'frameworkla',
 								                'title': 'Straight To Hell - Sabrina: Netflix',
 								                'uploader': 'Framework Studio',
 								                'description': 'md5:f2edc61af3ea7a5592681ddbb683db73',
 								                'upload_date': '20200225',
 								            },
 								        },
-												[vimeo] Override original URL only when necessary

											
										
										
											2016-06-22 17:51:36 +00:00
+								        {
 								            # only available via https://vimeo.com/channels/tributes/6213729 and
 								            # not via https://vimeo.com/6213729
 								            'url': 'https://vimeo.com/channels/tributes/6213729',
 								            'info_dict': {
 								                'id': '6213729',
-												[vimeo] Extract channel meta fields

											
										
										
											2018-09-14 18:24:48 +00:00
+								                'ext': 'mp4',
-												[vimeo] Override original URL only when necessary

											
										
										
											2016-06-22 17:51:36 +00:00
+								                'title': 'Vimeo Tribute: The Shining',
 								                'uploader': 'Casey Donahue',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											2017-01-02 12:08:07 +00:00
+								                'uploader_url': r're:https?://(?:www\.)?vimeo\.com/caseydonahue',
-												[vimeo] Override original URL only when necessary

											
										
										
											2016-06-22 17:51:36 +00:00
+								                'uploader_id': 'caseydonahue',
-												[vimeo] Extract channel meta fields

											
										
										
											2018-09-14 18:24:48 +00:00
+								                'channel_url': r're:https?://(?:www\.)?vimeo\.com/channels/tributes',
 								                'channel_id': 'tributes',
-												[vimeo] Extract upload timestamp

											
										
										
											2017-01-31 17:58:02 +00:00
+								                'timestamp': 1250886430,
-												[vimeo] Override original URL only when necessary

											
										
										
											2016-06-22 17:51:36 +00:00
+								                'upload_date': '20090821',
 								                'description': 'md5:bdbf314014e58713e6e5b66eb252f4a6',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[vimeo] Delegate ondemand redirects to ondemand extractor (closes #10994)

											
										
										
											2016-10-23 11:48:50 +00:00
+								        {
-												untie

											
										
										
											2017-01-19 09:18:13 +00:00
+								            # redirects to ondemand extractor and should be passed through it
-												[vimeo] Delegate ondemand redirects to ondemand extractor (closes #10994)

											
										
										
											2016-10-23 11:48:50 +00:00
+								            # for successful extraction
 								            'url': 'https://vimeo.com/73445910',
 								            'info_dict': {
 								                'id': '73445910',
 								                'ext': 'mp4',
 								                'title': 'The Reluctant Revolutionary',
 								                'uploader': '10Ft Films',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											2017-01-02 12:08:07 +00:00
+								                'uploader_url': r're:https?://(?:www\.)?vimeo\.com/tenfootfilms',
-												[vimeo] Delegate ondemand redirects to ondemand extractor (closes #10994)

											
										
										
											2016-10-23 11:48:50 +00:00
+								                'uploader_id': 'tenfootfilms',
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								                'description': 'md5:0fa704e05b04f91f40b7f3ca2e801384',
 								                'upload_date': '20130830',
 								                'timestamp': 1377853339,
-												[vimeo] Delegate ondemand redirects to ondemand extractor (closes #10994)

											
										
										
											2016-10-23 11:48:50 +00:00
+								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												Update to ytdl v2021-04-01
https://github.com/ytdl-org/youtube-dl/commit/14f29f087e6097feb46bdb84878924bc410a57eb

Closes #205

											
										
										
											2021-04-01 08:28:33 +00:00
+								            'skip': 'this page is no longer available.',
-												[vimeo] Delegate ondemand redirects to ondemand extractor (closes #10994)

											
										
										
											2016-10-23 11:48:50 +00:00
+								        },
-												[vimeo] fix extraction for password protected player URLs(closes #18889)

											
										
										
											2019-01-17 08:44:08 +00:00
+								        {
 								            'url': 'http://player.vimeo.com/video/68375962',
 								            'md5': 'aaf896bdb7ddd6476df50007a0ac0ae7',
 								            'info_dict': {
 								                'id': '68375962',
 								                'ext': 'mp4',
-												renaming issues resolved


											
										
										
											2020-09-02 20:37:35 +00:00
+								                'title': 'youtube-dl password protected test video',
-												[vimeo] fix extraction for password protected player URLs(closes #18889)

											
										
										
											2019-01-17 08:44:08 +00:00
+								                'uploader_url': r're:https?://(?:www\.)?vimeo\.com/user18948128',
 								                'uploader_id': 'user18948128',
 								                'uploader': 'Jaime Marquínez Ferrándiz',
 								                'duration': 10,
 								            },
 								            'params': {
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								                'format': 'best[protocol=https]',
-												renaming issues resolved


											
										
										
											2020-09-02 20:37:35 +00:00
+								                'videopassword': 'youtube-dl',
-												[vimeo] fix extraction for password protected player URLs(closes #18889)

											
										
										
											2019-01-17 08:44:08 +00:00
+								            },
 								        },
-												[vimeo] Override original URL only when necessary

											
										
										
											2016-06-22 17:51:36 +00:00
+								        {
 								            'url': 'http://vimeo.com/moogaloop.swf?clip_id=2539741',
 								            'only_matching': True,
 								        },
-												[vimeo] New test, fixed one older test

											
										
										
											2015-10-20 14:38:44 +00:00
+								        {
 								            'url': 'https://vimeo.com/109815029',
 								            'note': 'Video not completely processed, "failed" seed status',
 								            'only_matching': True,
 								        },
-												[vimeo] Add test for #7552

											
										
										
											2015-11-19 16:31:16 +00:00
+								        {
 								            'url': 'https://vimeo.com/groups/travelhd/videos/22439234',
 								            'only_matching': True,
 								        },
-												[vimeo:channel] Improve playlist extraction

											
										
										
											2016-06-22 18:28:36 +00:00
+								        {
 								            'url': 'https://vimeo.com/album/2632481/video/79010983',
 								            'only_matching': True,
 								        },
-												[vimeo] Fix videos with password
https://github.com/ytdl-org/youtube-dl/pull/27992

Fixes: https://github.com/ytdl-org/youtube-dl/issues/28354

Authored by teesid

											
										
										
											2021-01-28 12:33:48 +00:00
+								        {
 								            'url': 'https://vimeo.com/showcase/3253534/video/119195465',
 								            'note': 'A video in a password protected album (showcase)',
 								            'info_dict': {
 								                'id': '119195465',
 								                'ext': 'mp4',
 								                'title': 'youtube-dl test video \'ä"BaW_jenozKc',
 								                'uploader': 'Philipp Hagemeister',
 								                'uploader_id': 'user20132939',
 								                'description': 'md5:fa7b6c6d8db0bdc353893df2f111855b',
 								                'upload_date': '20150209',
 								                'timestamp': 1423518307,
 								            },
 								            'params': {
 								                'format': 'best[protocol=https]',
 								                'videopassword': 'youtube-dl',
 								            },
 								        },
-												[vimeo] Add test for #8187

											
										
										
											2016-01-08 21:07:29 +00:00
+								        {
 								            # source file returns 403: Forbidden
 								            'url': 'https://vimeo.com/7809605',
 								            'only_matching': True,
 								        },
-												[vimeo] Improve _VALID_URL (Closes #9229)

											
										
										
											2016-04-18 15:40:28 +00:00
+								        {
-												[vimeo] Fix ondemand videos and direct URLs with hash
Closes #1353, #1471

											
										
										
											2021-11-05 20:24:05 +00:00
+								            'note': 'Direct URL with hash',
-												[vimeo] Improve _VALID_URL (Closes #9229)

											
										
										
											2016-04-18 15:40:28 +00:00
+								            'url': 'https://vimeo.com/160743502/abd0e13fb4',
-												[vimeo] Fix ondemand videos and direct URLs with hash
Closes #1353, #1471

											
										
										
											2021-11-05 20:24:05 +00:00
+								            'info_dict': {
 								                'id': '160743502',
 								                'ext': 'mp4',
 								                'uploader': 'Julian Tryba',
 								                'uploader_id': 'aliniamedia',
 								                'title': 'Harrisville New Hampshire',
 								                'timestamp': 1459259666,
 								                'upload_date': '20160329',
 								            },
-												[vimeo] Detect source extension
and misc cleanup

Cherry-picked from #1477
Closes #1402

Authored by: flashdagger

											
										
										
											2021-11-05 20:45:08 +00:00
+								            'params': {'skip_download': True},
 								        },
 								        {
 								            'url': 'https://vimeo.com/138909882',
 								            'info_dict': {
 								                'id': '138909882',
 								                'ext': 'mp4',
 								                'title': 'Eastnor Castle 2015 Firework Champions - The Promo!',
 								                'description': 'md5:5967e090768a831488f6e74b7821b3c1',
 								                'uploader_id': 'fireworkchampions',
 								                'uploader': 'Firework Champions',
 								                'upload_date': '20150910',
 								                'timestamp': 1441901895,
 								            },
 								            'params': {
 								                'skip_download': True,
 								                'format': 'Original',
 								            },
-												Update to ytdl-commit-cf2dbec
https://github.com/ytdl-org/youtube-dl/commit/cf2dbec6301177a1fddf72862de05fa912d9869d

Except: [kakao] improve info extraction and detect geo restriction
https://github.com/ytdl-org/youtube-dl/commit/d8085580f63ad3b146a31712ff76cf41d5a4558a

											
										
										
											2021-02-19 20:44:36 +00:00
+								        },
-												[vimeo] Add fallback for config URL
Closes #1662

											
										
										
											2021-11-22 19:39:17 +00:00
+								        {
 								            'url': 'https://vimeo.com/channels/staffpicks/143603739',
 								            'info_dict': {
 								                'id': '143603739',
 								                'ext': 'mp4',
 								                'uploader': 'Karim Huu Do',
 								                'timestamp': 1445846953,
 								                'upload_date': '20151026',
 								                'title': 'The Shoes - Submarine Feat. Blaine Harrison',
 								                'uploader_id': 'karimhd',
 								                'description': 'md5:8e2eea76de4504c2e8020a9bcfa1e843',
 								            },
 								            'params': {'skip_download': 'm3u8'},
 								        },
-												Update to ytdl-commit-cf2dbec
https://github.com/ytdl-org/youtube-dl/commit/cf2dbec6301177a1fddf72862de05fa912d9869d

Except: [kakao] improve info extraction and detect geo restriction
https://github.com/ytdl-org/youtube-dl/commit/d8085580f63ad3b146a31712ff76cf41d5a4558a

											
										
										
											2021-02-19 20:44:36 +00:00
+								        {
 								            # requires passing unlisted_hash(a52724358e) to load_download_config request
 								            'url': 'https://vimeo.com/392479337/a52724358e',
 								            'only_matching': True,
-												[vimeo] Detect source extension
and misc cleanup

Cherry-picked from #1477
Closes #1402

Authored by: flashdagger

											
										
										
											2021-11-05 20:45:08 +00:00
+								        },
-												Update to ytdl-commit-6508688

Make default upload_/release_date a compat_str
https://github.com/ytdl-org/youtube-dl/commit/6508688e88c83bb811653083db9351702cd39a6a

Except:
* "[NDR] Overhaul NDR and NJoy extractors" https://github.com/ytdl-org/youtube-dl/pull/30531
    - https://github.com/ytdl-org/youtube-dl/commit/01824d275bfa7efbaca274b38c1ddc2b03f12f5d
    - https://github.com/ytdl-org/youtube-dl/commit/39a98b09a2acf50dc64bc41185be723b98e740b9
    - https://github.com/ytdl-org/youtube-dl/commit/f0a05a55c2ee512880546c056cfbec5ad3399798
    - https://github.com/ytdl-org/youtube-dl/commit/4186e817772d49d6f66b07c5ac8c248f026a6446

											
										
										
											2022-03-04 17:01:04 +00:00
+								        {
 								            # similar, but all numeric: ID must be 581039021, not 9603038895
 								            # issue #29690
 								            'url': 'https://vimeo.com/581039021/9603038895',
 								            'info_dict': {
 								                'id': '581039021',
 								                # these have to be provided but we don't care
 								                'ext': 'mp4',
 								                'timestamp': 1627621014,
 								                'title': 're:.+',
 								                'uploader_id': 're:.+',
 								                'uploader': 're:.+',
 								                'upload_date': r're:\d+',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        }
-												[vimeo] Fix video password verification for videos protected by Referer HTTP header

											
										
										
											2019-01-20 11:21:31 +00:00
+								        # https://gettingthingsdone.com/workflowmap/
 								        # vimeo embed with check-password page protected by Referer header
-												[vimeo] extract information for Vimeo Pro videos from http://player.vimeo.com/video/{video_id} (fixes #1197)

For some videos https://vimeo.com/{video_id} doesn't work

											
										
										
											2013-08-21 11:48:19 +00:00
+								    ]
-												Move Vimeo into its own file

											
										
										
											2013-06-23 18:18:21 +00:00
-												[vimeo:ondemand] Pass Referer along with embed URL (#10624)

											
										
										
											2016-09-12 14:48:45 +00:00
+								    @staticmethod
 								    def _smuggle_referrer(url, referrer_url):
 								        """Return url with referrer_url smuggled in as its Referer HTTP header."""
 								        referer_headers = {'Referer': referrer_url}
 								        return smuggle_url(url, {'http_headers': referer_headers})
-												[vimeo/generic] Move detection logic from GenericIE to VimeoIE

											
										
										
											2015-06-21 10:23:58 +00:00
+								    @staticmethod
-												[generic] Add support for multiple vimeo embeds (Closes #10862)

											
										
										
											2016-10-06 16:22:52 +00:00
+								    def _extract_urls(url, webpage):
 								        """Return a list of URLs of Vimeo players embedded in webpage.
 								        iframe embeds of player.vimeo.com are HTML-unescaped and get `url`
 								        smuggled in as their Referer header; <embed> (moogaloop.swf) and
 								        <video> sources are returned exactly as matched. The list is empty
 								        when nothing matches.
 								        """
 								        urls = []
-												[vimeo/generic] Move detection logic from GenericIE to VimeoIE

											
										
										
											2015-06-21 10:23:58 +00:00
+								        # Look for embedded (iframe) Vimeo player
-												[generic] Add support for multiple vimeo embeds (Closes #10862)

											
										
										
											2016-10-06 16:22:52 +00:00
+								        for mobj in re.finditer(
-												[vimeo] Restrict iframe embed regex (closes #14600)

											
										
										
											2017-10-27 15:21:47 +00:00
+								                r'<iframe[^>]+?src=(["\'])(?P<url>(?:https?:)?//player\.vimeo\.com/video/\d+.*?)\1',
-												[vimeo] PEP 8
[ci skip]

											
										
										
											2016-10-07 15:15:26 +00:00
+								                webpage):
-												[generic] Add support for multiple vimeo embeds (Closes #10862)

											
										
										
											2016-10-06 16:22:52 +00:00
+								            urls.append(VimeoIE._smuggle_referrer(unescapeHTML(mobj.group('url')), url))
 								        # Unlike the iframe matches above, these URLs are appended as matched (no Referer smuggling)
 								        PLAIN_EMBED_RE = (
 								            # Look for embedded (swf embed) Vimeo player
 								            r'<embed[^>]+?src=(["\'])(?P<url>(?:https?:)?//(?:www\.)?vimeo\.com/moogaloop\.swf.+?)\1',
 								            # Look more for non-standard embedded Vimeo player
 								            r'<video[^>]+src=(["\'])(?P<url>(?:https?:)?//(?:www\.)?vimeo\.com/[0-9]+)\1',
 								        )
 								        for embed_re in PLAIN_EMBED_RE:
 								            for mobj in re.finditer(embed_re, webpage):
 								                urls.append(mobj.group('url'))
 								        return urls
 								    @staticmethod
 								    def _extract_url(url, webpage):
 								        """Return the first embed URL found by _extract_urls, or None if there is none."""
 								        for embed_url in VimeoIE._extract_urls(url, webpage):
 								            return embed_url
 								        return None
-												[vimeo/generic] Move detection logic from GenericIE to VimeoIE

											
										
										
											2015-06-21 10:23:58 +00:00
-												[vimeo] Fix video password verification for videos protected by Referer HTTP header

											
										
										
											2019-01-20 11:21:31 +00:00
+								    def _verify_player_video_password(self, url, video_id, headers):
 								        """Submit the video password to the player's check-password endpoint.
 								        The password from self._get_video_password() is base64-encoded and
 								        POSTed form-encoded to ``url + '/check-password'`` using ``headers``
 								        merged with a form Content-Type. Returns the decoded JSON response;
 								        raises an expected ExtractorError when that response is ``False``.
 								        """
-												Update to ytdl v2021-04-01
https://github.com/ytdl-org/youtube-dl/commit/14f29f087e6097feb46bdb84878924bc410a57eb

Closes #205

											
										
										
											2021-04-01 08:28:33 +00:00
+								        password = self._get_video_password()
-												[vimeo] fix extraction for password protected player URLs(closes #18889)

											
										
										
											2019-01-17 08:44:08 +00:00
+								        data = urlencode_postdata({
 								            'password': base64.b64encode(password.encode()),
 								        })
-												[vimeo] Fix video password verification for videos protected by Referer HTTP header

											
										
										
											2019-01-20 11:21:31 +00:00
+								        headers = merge_dicts(headers, {
 								            'Content-Type': 'application/x-www-form-urlencoded',
 								        })
 								        checked = self._download_json(
 								            url + '/check-password', video_id,
 								            'Verifying the password', data=data, headers=headers)
 								        # NOTE(review): only a literal False counts as a rejected password;
 								        # any other response (including other falsy values) is returned as-is
 								        if checked is False:
 								            raise ExtractorError('Wrong video password', expected=True)
 								        return checked
-												[vimeo] Add support for passwords for player. URLs

Fixes #2053

											
										
										
											2014-01-07 08:51:57 +00:00
-												VimeoIE: authentication support (closes #885) and add a method in the base InfoExtractor to get the login info

											
										
										
											2013-07-07 21:24:34 +00:00
+								    def _real_initialize(self):
 								        """Perform the login step by delegating to self._login()."""
 								        self._login()
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								    def _extract_from_api(self, video_id, unlisted_hash=None):
 								        token = self._download_json(
 								            'https://vimeo.com/_rv/jwt', video_id, headers={
 								                'X-Requested-With': 'XMLHttpRequest'
 								            })['token']
 								        api_url = 'https://api.vimeo.com/videos/' + video_id
 								        if unlisted_hash:
 								            api_url += ':' + unlisted_hash
 								        video = self._download_json(
 								            api_url, video_id, headers={
 								                'Authorization': 'jwt ' + token,
 								            }, query={
 								                'fields': 'config_url,created_time,description,license,metadata.connections.comments.total,metadata.connections.likes.total,release_time,stats.plays',
 								            })
 								        info = self._parse_config(self._download_json(
 								            video['config_url'], video_id), video_id)
 								        self._vimeo_sort_formats(info['formats'])
 								        get_timestamp = lambda x: parse_iso8601(video.get(x + '_time'))
 								        info.update({
 								            'description': video.get('description'),
 								            'license': video.get('license'),
 								            'release_timestamp': get_timestamp('release'),
 								            'timestamp': get_timestamp('created'),
 								            'view_count': int_or_none(try_get(video, lambda x: x['stats']['plays'])),
 								        })
 								        connections = try_get(
 								            video, lambda x: x['metadata']['connections'], dict) or {}
 								        for k in ('comment', 'like'):
 								            info[k + '_count'] = int_or_none(try_get(connections, lambda x: x[k + 's']['total']))
 								        return info
-												[vimeo] Fix videos with password
https://github.com/ytdl-org/youtube-dl/pull/27992

Fixes: https://github.com/ytdl-org/youtube-dl/issues/28354

Authored by teesid

											
										
										
											2021-01-28 12:33:48 +00:00
+								    def _try_album_password(self, url):
 								        """Authenticate against a password-protected album/showcase, if url is one.
 								        Does nothing when url has no album/showcase id or when the album's
 								        ``privacy.view`` is not 'password'. Otherwise the 'videopassword'
 								        param is POSTed to the showcase auth endpoint. Raises an expected
 								        ExtractorError when no password is configured or the endpoint answers
 								        HTTP 401; other errors are re-raised unchanged. Returns None.
 								        """
 								        album_id = self._search_regex(
 								            r'vimeo\.com/(?:album|showcase)/([^/]+)', url, 'album id', default=None)
 								        if not album_id:
 								            return
 								        # The viewer data supplies the jwt, vuid and xsrft values used below
 								        viewer = self._download_json(
 								            'https://vimeo.com/_rv/viewer', album_id, fatal=False)
 								        if not viewer:
 								            # Fall back to the viewer object inside the page's bootstrap data
 								            webpage = self._download_webpage(url, album_id)
 								            viewer = self._parse_json(self._search_regex(
 								                r'bootstrap_data\s*=\s*({.+?})</script>',
 								                webpage, 'bootstrap data'), album_id)['viewer']
 								        jwt = viewer['jwt']
 								        album = self._download_json(
 								            'https://api.vimeo.com/albums/' + album_id,
 								            album_id, headers={'Authorization': 'jwt ' + jwt},
 								            query={'fields': 'description,name,privacy'})
 								        if try_get(album, lambda x: x['privacy']['view']) == 'password':
-												[extractor] Add `write_debug` and `get_param`

											
										
										
											2021-05-17 12:23:08 +00:00
+								            password = self.get_param('videopassword')
-												[vimeo] Fix videos with password
https://github.com/ytdl-org/youtube-dl/pull/27992

Fixes: https://github.com/ytdl-org/youtube-dl/issues/28354

Authored by teesid

											
										
										
											2021-01-28 12:33:48 +00:00
+								            if not password:
 								                raise ExtractorError(
 								                    'This album is protected by a password, use the --video-password option',
 								                    expected=True)
 								            self._set_vimeo_cookie('vuid', viewer['vuid'])
 								            try:
 								                self._download_json(
 								                    'https://vimeo.com/showcase/%s/auth' % album_id,
 								                    album_id, 'Verifying the password', data=urlencode_postdata({
 								                        'password': password,
 								                        'token': viewer['xsrft'],
 								                    }), headers={
 								                        'X-Requested-With': 'XMLHttpRequest',
 								                    })
 								            except ExtractorError as e:
 								                # HTTP 401 from the auth endpoint is reported as a wrong password
 								                if isinstance(e.cause, compat_HTTPError) and e.cause.code == 401:
 								                    raise ExtractorError('Wrong password', expected=True)
 								                raise
-												[vimeo] Fix unused argument of the `_real_extract` method

											
										
										
											2013-12-10 19:43:16 +00:00
+								    def _real_extract(self, url):
-												[vimeo] Automatically pickup full movie when rented (Closes #8171)

											
										
										
											2016-01-08 04:41:24 +00:00
+								        url, data = unsmuggle_url(url, {})
-												Implement `--add-header` without modifying `std_headers`

Closes #2526, #1614

											
										
										
											2022-01-28 21:55:35 +00:00
+								        headers = self.get_param('http_headers').copy()
-												[vimeo] Automatically pickup full movie when rented (Closes #8171)

											
										
										
											2016-01-08 04:41:24 +00:00
+								        if 'http_headers' in data:
 								            headers.update(data['http_headers'])
-												[vimeo] Always pass in referer (Fixes #3582)

											
										
										
											2014-08-25 07:35:37 +00:00
+								        if 'Referer' not in headers:
 								            headers['Referer'] = url
-												[generic] Support embedded vimeo videos (#1602)

											
										
										
											2013-10-15 10:05:13 +00:00
-												Move Vimeo into its own file

											
										
										
											2013-06-23 18:18:21 +00:00
+								        # Extract ID from URL
-												[vimeo] Fix ondemand videos and direct URLs with hash
Closes #1353, #1471

											
										
										
											2021-11-05 20:24:05 +00:00
+								        mobj = self._match_valid_url(url).groupdict()
 								        video_id, unlisted_hash = mobj['id'], mobj.get('unlisted_hash')
-												Update to ytdl v2021-04-01
https://github.com/ytdl-org/youtube-dl/commit/14f29f087e6097feb46bdb84878924bc410a57eb

Closes #205

											
										
										
											2021-04-01 08:28:33 +00:00
+								        if unlisted_hash:
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								            return self._extract_from_api(video_id, unlisted_hash)
-												Update to ytdl v2021-04-01
https://github.com/ytdl-org/youtube-dl/commit/14f29f087e6097feb46bdb84878924bc410a57eb

Closes #205

											
										
										
											2021-04-01 08:28:33 +00:00
-												[vimeo] Fix description extraction

											
										
										
											2014-09-29 20:23:21 +00:00
+								        orig_url = url
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								        is_pro = 'vimeopro.com/' in url
 								        if is_pro:
-												[vimeo] add support for Vimeo Pro portfolio protected videos(closes #20070)

											
										
										
											2019-03-01 07:14:34 +00:00
+								            # some videos require portfolio_id to be present in player url
-												Start moving to ytdl-org

											
										
										
											2019-03-09 12:14:41 +00:00
+								            # https://github.com/ytdl-org/youtube-dl/issues/20070
-												[vimeo] add support for Vimeo Pro portfolio protected videos(closes #20070)

											
										
										
											2019-03-01 07:14:34 +00:00
+								            url = self._extract_url(url, self._download_webpage(url, video_id))
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								            if not url:
 								                url = 'https://vimeo.com/' + video_id
-												Revert "[vimeo] fix showcase password protected video extraction(closes #24224)"

This reverts commit 12ee431676bb655f04c7dd416a73c1f142ed368d.

											
										
										
											2020-03-13 07:59:10 +00:00
+								        elif any(p in url for p in ('play_redirect_hls', 'moogaloop.swf')):
-												[vimeo] Fix redirection

											
										
										
											2015-04-28 12:56:48 +00:00
+								            url = 'https://vimeo.com/' + video_id
-												Move Vimeo into its own file

											
										
										
											2013-06-23 18:18:21 +00:00
-												[vimeo] Fix videos with password
https://github.com/ytdl-org/youtube-dl/pull/27992

Fixes: https://github.com/ytdl-org/youtube-dl/issues/28354

Authored by teesid

											
										
										
											2021-01-28 12:33:48 +00:00
+								        self._try_album_password(url)
-												[vimeo] Add a better error message for embed-only videos (#2527)

											
										
										
											2014-03-08 11:24:43 +00:00
+								        try:
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								            # Retrieve video webpage to extract further information
 								            webpage, urlh = self._download_webpage_handle(
 								                url, video_id, headers=headers)
-												Remove no longer needed compat_str around geturl

											
										
										
											2020-02-29 12:17:27 +00:00
+								            redirect_url = urlh.geturl()
-												[vimeo] Add a better error message for embed-only videos (#2527)

											
										
										
											2014-03-08 11:24:43 +00:00
+								        except ExtractorError as ee:
 								            if isinstance(ee.cause, compat_HTTPError) and ee.cause.code == 403:
 								                errmsg = ee.cause.read()
 								                if b'Because of its privacy settings, this video cannot be played here' in errmsg:
 								                    raise ExtractorError(
 								                        'Cannot download embed-only video without embedding '
-												Completely change project name to yt-dlp (#85)

* All modules and binary names are changed
* All documentation references changed
* yt-dlp no longer loads youtube-dlc config files
* All URLs changed to point to organization account

Co-authored-by: Pccode66
Co-authored-by: pukkandan
											
										
										
											2021-02-24 18:45:56 +00:00
+								                        'URL. Please call yt-dlp with the URL of the page '
-												[vimeo] Add a better error message for embed-only videos (#2527)

											
										
										
											2014-03-08 11:24:43 +00:00
+								                        'that embeds this video.',
 								                        expected=True)
 								            raise
-												Move Vimeo into its own file

											
										
										
											2013-06-23 18:18:21 +00:00
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								        if '://player.vimeo.com/video/' in url:
 								            config = self._parse_json(self._search_regex(
 								                r'\bconfig\s*=\s*({.+?})\s*;', webpage, 'info section'), video_id)
 								            if config.get('view') == 4:
 								                config = self._verify_player_video_password(
 								                    redirect_url, video_id, headers)
 								            info = self._parse_config(config, video_id)
 								            self._vimeo_sort_formats(info['formats'])
 								            return info
 								        if re.search(r'<form[^>]+?id="pw_form"', webpage):
 								            video_password = self._get_video_password()
 								            token, vuid = self._extract_xsrft_and_vuid(webpage)
 								            webpage = self._verify_video_password(
 								                redirect_url, video_id, video_password, token, vuid)
-												Move Vimeo into its own file

											
										
										
											2013-06-23 18:18:21 +00:00
-												[vimeo] fix album extraction

closes #1933
closes #15704
closes #15855
closes #18967
closes #21986

											
										
										
											2019-08-03 09:29:20 +00:00
+								        vimeo_config = self._extract_vimeo_config(webpage, video_id, default=None)
-												[vimeo] Capture and output error message (#5294)

											
										
										
											2015-03-26 21:05:08 +00:00
+								        if vimeo_config:
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								            seed_status = vimeo_config.get('seed_status') or {}
-												[vimeo] Capture and output error message (#5294)

											
										
										
											2015-03-26 21:05:08 +00:00
+								            if seed_status.get('state') == 'failed':
 								                raise ExtractorError(
-												[vimeo] Fix error parsing

											
										
										
											2015-10-20 08:30:31 +00:00
+								                    '%s said: %s' % (self.IE_NAME, seed_status['title']),
-												[vimeo] Capture and output error message (#5294)

											
										
										
											2015-03-26 21:05:08 +00:00
+								                    expected=True)
-												[vimeo] Extract license (closes #11880)

											
										
										
											2017-01-31 17:49:28 +00:00
+								        cc_license = None
-												[vimeo] Extract upload timestamp

											
										
										
											2017-01-31 17:58:02 +00:00
+								        timestamp = None
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								        video_description = None
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								        info_dict = {}
-												[vimeo] Add fallback for config URL
Closes #1662

											
										
										
											2021-11-22 19:39:17 +00:00
+								        config_url = None
-												[vimeo] Extract license (closes #11880)

											
										
										
											2017-01-31 17:49:28 +00:00
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								        channel_id = self._search_regex(
 								            r'vimeo\.com/channels/([^/]+)', url, 'channel id', default=None)
 								        if channel_id:
 								            config_url = self._html_search_regex(
-												[vimeo] Add fallback for config URL
Closes #1662

											
										
										
											2021-11-22 19:39:17 +00:00
+								                r'\bdata-config-url="([^"]+)"', webpage, 'config URL', default=None)
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								            video_description = clean_html(get_element_by_class('description', webpage))
 								            info_dict.update({
 								                'channel_id': channel_id,
 								                'channel_url': 'https://vimeo.com/channels/' + channel_id,
 								            })
-												[vimeo] Add fallback for config URL
Closes #1662

											
										
										
											2021-11-22 19:39:17 +00:00
+								        if not config_url:
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								            page_config = self._parse_json(self._search_regex(
 								                r'vimeo\.(?:clip|vod_title)_page_config\s*=\s*({.+?});',
 								                webpage, 'page config', default='{}'), video_id, fatal=False)
 								            if not page_config:
 								                return self._extract_from_api(video_id)
 								            config_url = page_config['player']['config_url']
 								            cc_license = page_config.get('cc_license')
 								            clip = page_config.get('clip') or {}
 								            timestamp = clip.get('uploaded_on')
 								            video_description = clean_html(
 								                clip.get('description') or page_config.get('description_html_escaped'))
 								        config = self._download_json(config_url, video_id)
-												Update to ytdl-commit-cf2dbec
https://github.com/ytdl-org/youtube-dl/commit/cf2dbec6301177a1fddf72862de05fa912d9869d

Except: [kakao] improve info extraction and detect geo restriction
https://github.com/ytdl-org/youtube-dl/commit/d8085580f63ad3b146a31712ff76cf41d5a4558a

											
										
										
											2021-02-19 20:44:36 +00:00
+								        video = config.get('video') or {}
 								        vod = video.get('vod') or {}
-												[vimeo] redirect to feature url only in the case of a trailer(closes #14591)

											
										
										
											2018-09-15 05:30:57 +00:00
-												[vimeo] Fix rented videos (Closes #9830)

											
										
										
											2016-06-18 20:56:01 +00:00
+								        def is_rented():
 								            if '>You rented this title.<' in webpage:
 								                return True
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								            if try_get(config, lambda x: x['user']['purchased']):
-												[vimeo] Fix rented videos (Closes #9830)

											
										
										
											2016-06-18 20:56:01 +00:00
+								                return True
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								            for purchase_option in (vod.get('purchase_options') or []):
-												[vimeo] redirect to feature url only in the case of a trailer(closes #14591)

											
										
										
											2018-09-15 05:30:57 +00:00
+								                if purchase_option.get('purchased'):
 								                    return True
 								                label = purchase_option.get('label_string')
 								                if label and (label.startswith('You rented this') or label.endswith(' remaining')):
 								                    return True
-												[vimeo] Fix rented videos (Closes #9830)

											
										
										
											2016-06-18 20:56:01 +00:00
+								            return False
-												[vimeo] redirect to feature url only in the case of a trailer(closes #14591)

											
										
										
											2018-09-15 05:30:57 +00:00
+								        if is_rented() and vod.get('is_trailer'):
 								            feature_id = vod.get('feature_id')
-												[vimeo] Automatically pickup full movie when rented (Closes #8171)

											
										
										
											2016-01-08 04:41:24 +00:00
+								            if feature_id and not data.get('force_feature_id', False):
 								                return self.url_result(smuggle_url(
 								                    'https://player.vimeo.com/player/%s' % feature_id,
 								                    {'force_feature_id': True}), 'Vimeo')
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								        if not video_description:
 								            video_description = self._html_search_regex(
 								                r'(?s)<div\s+class="[^"]*description[^"]*"[^>]*>(.*?)</div>',
 								                webpage, 'description', default=None)
-												[vimeo] Fix description extraction

											
										
										
											2014-09-29 20:23:21 +00:00
+								        if not video_description:
 								            video_description = self._html_search_meta(
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								                ['description', 'og:description', 'twitter:description'],
 								                webpage, default=None)
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								        if not video_description and is_pro:
-												[vimeo] Fix description extraction

											
										
										
											2014-09-29 20:23:21 +00:00
+								            orig_webpage = self._download_webpage(
 								                orig_url, video_id,
 								                note='Downloading webpage for description',
 								                fatal=False)
 								            if orig_webpage:
 								                video_description = self._html_search_meta(
 								                    'description', orig_webpage, default=None)
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								        if not video_description:
-												Fix inconsistent use of `report_warning`

											
										
										
											2021-04-16 10:01:10 +00:00
+								            self.report_warning('Cannot find video description')
-												Move Vimeo into its own file

											
										
										
											2013-06-23 18:18:21 +00:00
-												[vimeo] Extract upload timestamp

											
										
										
											2017-01-31 17:58:02 +00:00
+								        if not timestamp:
 								            timestamp = self._search_regex(
 								                r'<time[^>]+datetime="([^"]+)"', webpage,
 								                'timestamp', default=None)
-												Move Vimeo into its own file

											
										
										
											2013-06-23 18:18:21 +00:00
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								        view_count = int_or_none(self._search_regex(r'UserPlays:(\d+)', webpage, 'view count', default=None))
 								        like_count = int_or_none(self._search_regex(r'UserLikes:(\d+)', webpage, 'like count', default=None))
 								        comment_count = int_or_none(self._search_regex(r'UserComments:(\d+)', webpage, 'comment count', default=None))
-												[vimeo] Extract views count, likes count and comments count (#1895)

											
										
										
											2013-12-06 12:03:08 +00:00
-												[vimeo] Implement the new format selection system (closes PR #996)

Rebased and deleted some parts to use the new system instead of copying the one from YoutubeIE

											
										
										
											2013-07-05 16:10:57 +00:00
+								        formats = []
-												[vimeo:review] improve config url extraction and extract original format(closes #20305)

											
										
										
											2019-03-10 14:03:32 +00:00
 								        source_format = self._extract_original_format(
-												Update to ytdl-commit-cf2dbec
https://github.com/ytdl-org/youtube-dl/commit/cf2dbec6301177a1fddf72862de05fa912d9869d

Except: [kakao] improve info extraction and detect geo restriction
https://github.com/ytdl-org/youtube-dl/commit/d8085580f63ad3b146a31712ff76cf41d5a4558a

											
										
										
											2021-02-19 20:44:36 +00:00
+								            'https://vimeo.com/' + video_id, video_id, video.get('unlisted_hash'))
-												[vimeo:review] improve config url extraction and extract original format(closes #20305)

											
										
										
											2019-03-10 14:03:32 +00:00
+								        if source_format:
 								            formats.append(source_format)
-												[vimeo] Add support for subtitles (Closes #2239)
											
										
										
											2014-02-03 13:02:58 +00:00
-												[vimeo] Extract JSON LD (closes #16295)

											
										
										
											2018-04-27 19:48:20 +00:00
+								        info_dict_config = self._parse_config(config, video_id)
 								        formats.extend(info_dict_config['formats'])
-												[vimeo] Fix extraction for VimeoReview videos

											
										
										
											2016-06-11 13:35:08 +00:00
+								        self._vimeo_sort_formats(formats)
-												[vimeo] Extract license (closes #11880)

											
										
										
											2017-01-31 17:49:28 +00:00
-												[vimeo] Extract JSON LD (closes #16295)

											
										
										
											2018-04-27 19:48:20 +00:00
+								        json_ld = self._search_json_ld(webpage, video_id, default={})
-												[vimeo] Extract license (closes #11880)

											
										
										
											2017-01-31 17:49:28 +00:00
+								        if not cc_license:
 								            cc_license = self._search_regex(
 								                r'<link[^>]+rel=["\']license["\'][^>]+href=(["\'])(?P<license>(?:(?!\1).)+)\1',
 								                webpage, 'license', default=None, group='license')
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								        info_dict.update({
-												[vimeo] Fix extraction for VimeoReview videos

											
										
										
											2016-06-11 13:35:08 +00:00
+								            'formats': formats,
-												[vimeo] Extract upload timestamp

											
										
										
											2017-01-31 17:58:02 +00:00
+								            'timestamp': unified_timestamp(timestamp),
-												[vimeo] Remove superfluous whitespace
											
										
										
											2014-02-03 13:24:11 +00:00
+								            'description': video_description,
-												Add the 'webpage_url' field to info_dict

The url for the video page, it must allow to reproduce the result.
It's automatically set by YoutubeDL if it's missing.

											
										
										
											2013-11-03 11:11:13 +00:00
+								            'webpage_url': url,
-												[vimeo] Extract views count, likes count and comments count (#1895)

											
										
										
											2013-12-06 12:03:08 +00:00
+								            'view_count': view_count,
 								            'like_count': like_count,
 								            'comment_count': comment_count,
-												[vimeo] Extract license (closes #11880)

											
										
										
											2017-01-31 17:49:28 +00:00
+								            'license': cc_license,
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								        })
-												[vimeo] Fix extraction for VimeoReview videos

											
										
										
											2016-06-11 13:35:08 +00:00
-												[vimeo] Fix embedded `player.vimeo` URL
Closes #1138, partially fixes #1323
Cherry-picked from upstream commit 3ae9c0f410b1d4f63e8bada67dd62a8d2852be32

											
										
										
											2021-10-22 00:27:15 +00:00
+								        return merge_dicts(info_dict, info_dict_config, json_ld)
-												[vimeo] add an extractor for channels

											
										
										
											2013-07-29 11:12:09 +00:00
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
class VimeoOndemandIE(VimeoIE):
    # Variant of VimeoIE for vimeo.com/ondemand/... URLs. Only the extractor
    # name, the URL pattern and the test cases are declared here; no method
    # is overridden in this class.
    IE_NAME = 'vimeo:ondemand'
    # The optional "<segment>/" lets the id be either the first or the second
    # path component after /ondemand/.
    _VALID_URL = r'https?://(?:www\.)?vimeo\.com/ondemand/(?:[^/]+/)?(?P<id>[^/?#&]+)'
    _TESTS = [{
        # ondemand video not available via https://vimeo.com/id
        'url': 'https://vimeo.com/ondemand/20704',
        'md5': 'c424deda8c7f73c1dfb3edd7630e2f35',
        'info_dict': {
            'id': '105442900',
            'ext': 'mp4',
            'title': 'המעבדה - במאי יותם פלדמן',
            'uploader': 'גם סרטים',
            'uploader_url': r're:https?://(?:www\.)?vimeo\.com/gumfilms',
            'uploader_id': 'gumfilms',
            'description': 'md5:4c027c965e439de4baab621e48b60791',
            'upload_date': '20140906',
            'timestamp': 1410032453,
        },
        'params': {'format': 'best[protocol=https]'},
        'expected_warnings': ['Unable to download JSON metadata'],
    }, {
        # requires Referer to be passed along with og:video:url
        'url': 'https://vimeo.com/ondemand/36938/126682985',
        'info_dict': {
            'id': '126584684',
            'ext': 'mp4',
            'title': 'Rävlock, rätt läte på rätt plats',
            'uploader': 'Lindroth & Norin',
            'uploader_url': r're:https?://(?:www\.)?vimeo\.com/lindrothnorin',
            'uploader_id': 'lindrothnorin',
            'description': 'md5:c3c46a90529612c8279fb6af803fc0df',
            'upload_date': '20150502',
            'timestamp': 1430586422,
        },
        'params': {'skip_download': True},
        'expected_warnings': ['Unable to download JSON metadata'],
    }, {
        # URL-matching checks only (no extraction is performed for these)
        'url': 'https://vimeo.com/ondemand/nazmaalik',
        'only_matching': True,
    }, {
        'url': 'https://vimeo.com/ondemand/141692381',
        'only_matching': True,
    }, {
        'url': 'https://vimeo.com/ondemand/thelastcolony/150274832',
        'only_matching': True,
    }]
-												[vimeo] Fix login (Closes #6488)

											
										
										
											2015-08-10 17:35:08 +00:00
class VimeoChannelIE(VimeoBaseInfoExtractor):
    # Playlist extractor for https://vimeo.com/channels/<id>. The class
    # attributes below parameterise the paging helpers so that subclasses
    # (e.g. VimeoUserIE) can reuse them by overriding a few values.
    IE_NAME = 'vimeo:channel'
    _VALID_URL = r'https://vimeo\.com/channels/(?P<id>[^/?#]+)/?(?:$|[?#])'
    # A listing page that matches this pattern is followed by another page.
    _MORE_PAGES_INDICATOR = r'<a.+?rel="next"'
    # Fixed playlist title; when falsy the title is scraped with _TITLE_RE.
    _TITLE = None
    _TITLE_RE = r'<link rel="alternate"[^>]+?title="(.*?)"'
    _TESTS = [{
        'url': 'https://vimeo.com/channels/tributes',
        'info_dict': {'id': 'tributes', 'title': 'Vimeo Tributes'},
        'playlist_mincount': 25,
    }]
    _BASE_URL_TEMPL = 'https://vimeo.com/channels/%s'

    def _page_url(self, base_url, pagenum):
        """Return the URL of listing page number ``pagenum`` below ``base_url``."""
        return '%s/videos/page:%d/' % (base_url, pagenum)

    def _extract_list_title(self, webpage):
        """Return ``_TITLE`` when it is set, otherwise the title found in ``webpage``.

        The scrape is non-fatal (``fatal=False``).
        """
        if self._TITLE:
            return self._TITLE
        return self._html_search_regex(
            self._TITLE_RE, webpage, 'list title', fatal=False)

    def _title_and_entries(self, list_id, base_url):
        """Generate the list title followed by one ``url_result`` per clip.

        The very first item yielded is the playlist title (taken from page 1);
        every later item is a playlist entry. Pages are fetched one after
        another until a page no longer matches ``_MORE_PAGES_INDICATOR``.
        """
        # Try extracting href first since not all videos are available via
        # short https://vimeo.com/id URL (e.g. https://vimeo.com/channels/tributes/6213729)
        clip_link_re = r'id="clip_(\d+)"[^>]*>\s*<a[^>]+href="(/(?:[^/]+/)*\1)(?:[^>]+\btitle="([^"]+)")?'

        pagenum = 1
        while True:
            webpage = self._download_webpage(
                self._page_url(base_url, pagenum), list_id,
                'Downloading page %s' % pagenum)

            if pagenum == 1:
                yield self._extract_list_title(webpage)

            clips = re.findall(clip_link_re, webpage)
            if not clips:
                # More relaxed fallback
                for clip_id in re.findall(r'id=["\']clip_(\d+)', webpage):
                    yield self.url_result(
                        'https://vimeo.com/%s' % clip_id,
                        VimeoIE.ie_key(), video_id=clip_id)
            else:
                for clip_id, clip_path, clip_title in clips:
                    yield self.url_result(
                        compat_urlparse.urljoin(base_url, clip_path),
                        VimeoIE.ie_key(), video_id=clip_id, video_title=clip_title)

            if re.search(self._MORE_PAGES_INDICATOR, webpage, re.DOTALL) is None:
                break
            pagenum += 1

    def _extract_videos(self, list_id, base_url):
        """Build the playlist result for ``list_id`` from the pages under ``base_url``."""
        items = self._title_and_entries(list_id, base_url)
        # The generator hands out the title first; what remains are the entries.
        playlist_title = next(items)
        return self.playlist_result(items, list_id, playlist_title)

    def _real_extract(self, url):
        channel_id = self._match_id(url)
        base_url = self._BASE_URL_TEMPL % channel_id
        return self._extract_videos(channel_id, base_url)
-												[vimeo] Add an extractor for users (closes #1871)

											
										
										
											2013-12-01 21:36:18 +00:00
 								class VimeoUserIE(VimeoChannelIE):
-												[vimeo] Use unicode_literals

											
										
										
											2014-01-06 22:38:16 +00:00
+								    IE_NAME = 'vimeo:user'
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								    _VALID_URL = r'https://vimeo\.com/(?!(?:[0-9]+|watchlater)(?:$|[?#/]))(?P<id>[^/]+)(?:/videos|[#?]|$)'
-												[vimeo] Add an extractor for users (closes #1871)

											
										
										
											2013-12-01 21:36:18 +00:00
+								    _TITLE_RE = r'<a[^>]+?class="user">([^<>]+?)</a>'
-												[vimeo] Move all testcases to extractors and clean up

Previously, these extractors all defined their own suitable methods.
No test_all_urls tests that everything is in order, automatically :)

											
										
										
											2014-08-27 09:36:01 +00:00
+								    _TESTS = [{
-												[vimeo] Use https for all vimeo.com urls

Unfortunately vimeopro.com doesn't support it yet.

											
										
										
											2015-03-12 18:08:16 +00:00
+								        'url': 'https://vimeo.com/nkistudio/videos',
-												[vimeo] Move all testcases to extractors and clean up

Previously, these extractors all defined their own suitable methods.
No test_all_urls tests that everything is in order, automatically :)

											
										
										
											2014-08-27 09:36:01 +00:00
+								        'info_dict': {
 								            'title': 'Nki',
-												[vimeo] Amend playlist tests

											
										
										
											2015-02-17 23:33:31 +00:00
+								            'id': 'nkistudio',
-												[vimeo] Move all testcases to extractors and clean up

Previously, these extractors all defined their own suitable methods.
No test_all_urls tests that everything is in order, automatically :)

											
										
										
											2014-08-27 09:36:01 +00:00
+								        },
 								        'playlist_mincount': 66,
 								    }]
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								    _BASE_URL_TEMPL = 'https://vimeo.com/%s'
-												[vimeo] Add an extractor for albums (closes #1911)

											
										
										
											2013-12-06 20:47:32 +00:00
-												[vimeo] fix album extraction(closes #23864)

											
										
										
											2020-01-27 22:37:29 +00:00
+								class VimeoAlbumIE(VimeoBaseInfoExtractor):
-												[vimeo] Use unicode_literals

											
										
										
											2014-01-06 22:38:16 +00:00
+								    IE_NAME = 'vimeo:album'
-												[vimeo] fix album extraction

closes #1933
closes #15704
closes #15855
closes #18967
closes #21986

											
										
										
											2019-08-03 09:29:20 +00:00
+								    _VALID_URL = r'https://vimeo\.com/(?:album|showcase)/(?P<id>\d+)(?:$|[?#]|/(?!video))'
-												[vimeo] Add an extractor for albums (closes #1911)

											
										
										
											2013-12-06 20:47:32 +00:00
+								    _TITLE_RE = r'<header id="page_header">\n\s*<h1>(.*?)</h1>'
-												[vimeo] Move all testcases to extractors and clean up

Previously, these extractors all defined their own suitable methods.
No test_all_urls tests that everything is in order, automatically :)

											
										
										
											2014-08-27 09:36:01 +00:00
+								    _TESTS = [{
-												[vimeo:album] Fix password protected videos

Since it only uses https now, don't recognize http urls.

											
										
										
											2015-03-06 21:16:26 +00:00
+								        'url': 'https://vimeo.com/album/2632481',
-												[vimeo] Move all testcases to extractors and clean up

Previously, these extractors all defined their own suitable methods.
No test_all_urls tests that everything is in order, automatically :)

											
										
										
											2014-08-27 09:36:01 +00:00
+								        'info_dict': {
-												[vimeo] Amend playlist tests

											
										
										
											2015-02-17 23:33:31 +00:00
+								            'id': '2632481',
-												[vimeo] Move all testcases to extractors and clean up

Previously, these extractors all defined their own suitable methods.
No test_all_urls tests that everything is in order, automatically :)

											
										
										
											2014-08-27 09:36:01 +00:00
+								            'title': 'Staff Favorites: November 2013',
 								        },
 								        'playlist_mincount': 13,
-												[vimeo:album] Add support for album passwords (Fixes #4917)

											
										
										
											2015-02-10 03:53:21 +00:00
+								    }, {
 								        'note': 'Password-protected album',
 								        'url': 'https://vimeo.com/album/3253534',
 								        'info_dict': {
 								            'title': 'test',
 								            'id': '3253534',
 								        },
 								        'playlist_count': 1,
 								        'params': {
-												renaming issues resolved


											
										
										
											2020-09-02 20:37:35 +00:00
+								            'videopassword': 'youtube-dl',
-												[vimeo:album] Add support for album passwords (Fixes #4917)

											
										
										
											2015-02-10 03:53:21 +00:00
+								        }
-												[vimeo] Move all testcases to extractors and clean up

Previously, these extractors all defined their own suitable methods.
No test_all_urls tests that everything is in order, automatically :)

											
										
										
											2014-08-27 09:36:01 +00:00
+								    }]
-												[vimeo] fix album extraction

closes #1933
closes #15704
closes #15855
closes #18967
closes #21986

											
										
										
											2019-08-03 09:29:20 +00:00
+								    _PAGE_SIZE = 100
-												Updated to release 2020.11.21.1

											
										
										
											2020-11-21 14:50:42 +00:00
+								    def _fetch_page(self, album_id, authorization, hashed_pass, page):
-												[vimeo] fix album extraction

closes #1933
closes #15704
closes #15855
closes #18967
closes #21986

											
										
										
											2019-08-03 09:29:20 +00:00
+								        api_page = page + 1
 								        query = {
-												[vimeo] improve album videos id extraction(closes #22599)

											
										
										
											2019-10-15 20:01:59 +00:00
+								            'fields': 'link,uri',
-												[vimeo] fix album extraction

closes #1933
closes #15704
closes #15855
closes #18967
closes #21986

											
										
										
											2019-08-03 09:29:20 +00:00
+								            'page': api_page,
 								            'per_page': self._PAGE_SIZE,
 								        }
 								        if hashed_pass:
 								            query['_hashed_pass'] = hashed_pass
-												Update to ytdl-commit-7e79ba7

https://github.com/ytdl-org/youtube-dl/commit/7e79ba7dd6e6649dd2ce3a74004b2044f2182881
[vimeo:album] Fix extraction for albums with number of videos multiple to page size

											
										
										
											2021-03-21 18:57:54 +00:00
+								        try:
 								            videos = self._download_json(
 								                'https://api.vimeo.com/albums/%s/videos' % album_id,
 								                album_id, 'Downloading page %d' % api_page, query=query, headers={
 								                    'Authorization': 'jwt ' + authorization,
 								                })['data']
 								        except ExtractorError as e:
 								            if isinstance(e.cause, compat_HTTPError) and e.cause.code == 400:
 								                return
-												[vimeo] fix album extraction

closes #1933
closes #15704
closes #15855
closes #18967
closes #21986

											
										
										
											2019-08-03 09:29:20 +00:00
+								        for video in videos:
 								            link = video.get('link')
 								            if not link:
 								                continue
-												[vimeo] improve album videos id extraction(closes #22599)

											
										
										
											2019-10-15 20:01:59 +00:00
+								            uri = video.get('uri')
 								            video_id = self._search_regex(r'/videos/(\d+)', uri, 'video_id', default=None) if uri else None
 								            yield self.url_result(link, VimeoIE.ie_key(), video_id)
-												[vimeo] Add an extractor for albums (closes #1911)

											
										
										
											2013-12-06 20:47:32 +00:00
 								    def _real_extract(self, url):
-												[vimeo:album] Add support for album passwords (Fixes #4917)

											
										
										
											2015-02-10 03:53:21 +00:00
+								        album_id = self._match_id(url)
-												Merge 'ytdl-org/youtube-dl/master' release 2020.11.19

Old Extractors left behind:
	VLivePlaylistIE
	YoutubeSearchURLIE
	YoutubeShowIE
	YoutubeFavouritesIE

If removing old extractors, make corresponding changes in
	docs/supportedsites.md
	youtube_dlc/extractor/extractors.py

Not merged:
	.github/ISSUE_TEMPLATE/1_broken_site.md
	.github/ISSUE_TEMPLATE/2_site_support_request.md
	.github/ISSUE_TEMPLATE/3_site_feature_request.md
	.github/ISSUE_TEMPLATE/4_bug_report.md
	.github/ISSUE_TEMPLATE/5_feature_request.md
	test/test_all_urls.py
	youtube_dlc/version.py
	Changelog

											
										
										
											2020-11-19 19:22:59 +00:00
+								        viewer = self._download_json(
 								            'https://vimeo.com/_rv/viewer', album_id, fatal=False)
 								        if not viewer:
 								            webpage = self._download_webpage(url, album_id)
 								            viewer = self._parse_json(self._search_regex(
 								                r'bootstrap_data\s*=\s*({.+?})</script>',
 								                webpage, 'bootstrap data'), album_id)['viewer']
-												[vimeo] fix album extraction(closes #23864)

											
										
										
											2020-01-27 22:37:29 +00:00
+								        jwt = viewer['jwt']
 								        album = self._download_json(
 								            'https://api.vimeo.com/albums/' + album_id,
 								            album_id, headers={'Authorization': 'jwt ' + jwt},
 								            query={'fields': 'description,name,privacy'})
 								        hashed_pass = None
 								        if try_get(album, lambda x: x['privacy']['view']) == 'password':
-												[extractor] Add `write_debug` and `get_param`

											
										
										
											2021-05-17 12:23:08 +00:00
+								            password = self.get_param('videopassword')
-												[vimeo] fix album extraction(closes #23864)

											
										
										
											2020-01-27 22:37:29 +00:00
+								            if not password:
 								                raise ExtractorError(
 								                    'This album is protected by a password, use the --video-password option',
 								                    expected=True)
 								            self._set_vimeo_cookie('vuid', viewer['vuid'])
 								            try:
 								                hashed_pass = self._download_json(
 								                    'https://vimeo.com/showcase/%s/auth' % album_id,
 								                    album_id, 'Verifying the password', data=urlencode_postdata({
 								                        'password': password,
 								                        'token': viewer['xsrft'],
 								                    }), headers={
 								                        'X-Requested-With': 'XMLHttpRequest',
 								                    })['hashed_pass']
 								            except ExtractorError as e:
 								                if isinstance(e.cause, compat_HTTPError) and e.cause.code == 401:
 								                    raise ExtractorError('Wrong password', expected=True)
 								                raise
-												[vimeo] fix album extraction

closes #1933
closes #15704
closes #15855
closes #18967
closes #21986

											
										
										
											2019-08-03 09:29:20 +00:00
+								        entries = OnDemandPagedList(functools.partial(
-												[vimeo] fix album extraction(closes #23864)

											
										
										
											2020-01-27 22:37:29 +00:00
+								            self._fetch_page, album_id, jwt, hashed_pass), self._PAGE_SIZE)
 								        return self.playlist_result(
 								            entries, album_id, album.get('name'), album.get('description'))
-												[vimeo] Add an extractor for groups

											
										
										
											2013-12-06 21:01:41 +00:00
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								class VimeoGroupsIE(VimeoChannelIE):
-												[vimeo] Use unicode_literals

											
										
										
											2014-01-06 22:38:16 +00:00
+								    IE_NAME = 'vimeo:group'
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								    _VALID_URL = r'https://vimeo\.com/groups/(?P<id>[^/]+)(?:/(?!videos?/\d+)|$)'
-												[vimeo] Move all testcases to extractors and clean up

Previously, these extractors all defined their own suitable methods.
Now test_all_urls tests that everything is in order, automatically :)

											
										
										
											2014-08-27 09:36:01 +00:00
+								    _TESTS = [{
-												[vimeo] Detect source extension
and misc cleanup

Cherry-picked from #1477
Closes #1402

Authored by: flashdagger

											
										
										
											2021-11-05 20:45:08 +00:00
+								        'url': 'https://vimeo.com/groups/meetup',
-												[vimeo] Move all testcases to extractors and clean up

Previously, these extractors all defined their own suitable methods.
Now test_all_urls tests that everything is in order, automatically :)

											
										
										
											2014-08-27 09:36:01 +00:00
+								        'info_dict': {
-												[vimeo] Detect source extension
and misc cleanup

Cherry-picked from #1477
Closes #1402

Authored by: flashdagger

											
										
										
											2021-11-05 20:45:08 +00:00
+								            'id': 'meetup',
 								            'title': 'Vimeo Meetup!',
-												[vimeo] Move all testcases to extractors and clean up

Previously, these extractors all defined their own suitable methods.
Now test_all_urls tests that everything is in order, automatically :)

											
										
										
											2014-08-27 09:36:01 +00:00
+								        },
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								        'playlist_mincount': 27,
-												[vimeo] Move all testcases to extractors and clean up

Previously, these extractors all defined their own suitable methods.
Now test_all_urls tests that everything is in order, automatically :)

											
										
										
											2014-08-27 09:36:01 +00:00
+								    }]
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								    _BASE_URL_TEMPL = 'https://vimeo.com/groups/%s'
-												[vimeo] Add support for review pages

Since the regexp is already overboarding and review pages have a distinct URL format (with non-trivial stuff after the ID), use a dedicated IE.
Fixes #2106

											
										
										
											2014-01-06 16:31:47 +00:00
-												[vimeo] Fix extraction for VimeoReview videos

											
										
										
											2016-06-11 13:35:08 +00:00
+								class VimeoReviewIE(VimeoBaseInfoExtractor):
-												[vimeo] Use unicode_literals

											
										
										
											2014-01-06 22:38:16 +00:00
+								    IE_NAME = 'vimeo:review'
 								    IE_DESC = 'Review pages on vimeo'
-												[vimeo:review] improve config url extraction and extract original format(closes #20305)

											
										
										
											2019-03-10 14:03:32 +00:00
+								    _VALID_URL = r'(?P<url>https://vimeo\.com/[^/]+/review/(?P<id>[^/]+)/[0-9a-f]{10})'
-												[vimeo] Move test case to where it belongs

											
										
										
											2014-08-27 09:13:42 +00:00
+								    _TESTS = [{
-												[vimeo] Add support for review pages

Since the regexp is already overboarding and review pages have a distinct URL format (with non-trivial stuff after the ID), use a dedicated IE.
Fixes #2106

											
										
										
											2014-01-06 16:31:47 +00:00
+								        'url': 'https://vimeo.com/user21297594/review/75524534/3c257a1b5d',
 								        'md5': 'c507a72f780cacc12b2248bb4006d253',
 								        'info_dict': {
-												[vimeo] Modernize test definition

											
										
										
											2015-02-01 11:12:27 +00:00
+								            'id': '75524534',
 								            'ext': 'mp4',
-												[vimeo] Add support for review pages

Since the regexp is already overboarding and review pages have a distinct URL format (with non-trivial stuff after the ID), use a dedicated IE.
Fixes #2106

											
										
										
											2014-01-06 16:31:47 +00:00
+								            'title': "DICK HARDWICK 'Comedian'",
 								            'uploader': 'Richard Hardwick',
-												[vimeo] Fix extraction for VimeoReview videos

											
										
										
											2016-06-11 13:35:08 +00:00
+								            'uploader_id': 'user21297594',
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								            'description': "Comedian Dick Hardwick's five minute demo filmed in front of a live theater audience.\nEdit by Doug Mattocks",
 								        },
-												[vimeo] Move test case to where it belongs

											
										
										
											2014-08-27 09:13:42 +00:00
+								    }, {
 								        'note': 'video player needs Referer',
-												[vimeo] Use https for all vimeo.com urls

Unfortunately vimeopro.com doesn't support it yet.

											
										
										
											2015-03-12 18:08:16 +00:00
+								        'url': 'https://vimeo.com/user22258446/review/91613211/13f927e053',
-												[vimeo] Move test case to where it belongs

											
										
										
											2014-08-27 09:13:42 +00:00
+								        'md5': '6295fdab8f4bf6a002d058b2c6dce276',
 								        'info_dict': {
 								            'id': '91613211',
 								            'ext': 'mp4',
-												[vimeo:review] Fix test title

											
										
										
											2014-10-26 23:13:40 +00:00
+								            'title': 're:(?i)^Death by dogma versus assembling agile . Sander Hoogendoorn',
-												[vimeo] Move test case to where it belongs

											
										
										
											2014-08-27 09:13:42 +00:00
+								            'uploader': 'DevWeek Events',
 								            'duration': 2773,
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											2017-01-02 12:08:07 +00:00
+								            'thumbnail': r're:^https?://.*\.jpg$',
-												[vimeo] Fix extraction for VimeoReview videos

											
										
										
											2016-06-11 13:35:08 +00:00
+								            'uploader_id': 'user22258446',
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								        },
 								        'skip': 'video gone',
-												[vimeo:review] Fix extraction for password-protected videos

Closes #9853

											
										
										
											2016-06-24 08:48:37 +00:00
+								    }, {
 								        'note': 'Password protected',
 								        'url': 'https://vimeo.com/user37284429/review/138823582/c4d865efde',
 								        'info_dict': {
 								            'id': '138823582',
 								            'ext': 'mp4',
 								            'title': 'EFFICIENT PICKUP MASTERCLASS MODULE 1',
 								            'uploader': 'TMB',
 								            'uploader_id': 'user37284429',
 								        },
 								        'params': {
 								            'videopassword': 'holygrail',
 								        },
-												[vimeo:review] Fix extraction (#10900)

Now Vimeo Review videos uses React. Thanks @davekaro for analyzing the
problem!

											
										
										
											2016-10-11 17:48:06 +00:00
+								        'skip': 'video gone',
-												[vimeo] Move test case to where it belongs

											
										
										
											2014-08-27 09:13:42 +00:00
+								    }]
-												[vimeo] Add support for review pages

Since the regexp is already overboarding and review pages have a distinct URL format (with non-trivial stuff after the ID), use a dedicated IE.
Fixes #2106

											
										
										
											2014-01-06 16:31:47 +00:00
-												[vimeo:review] Fix extraction for password-protected videos

Closes #9853

											
										
										
											2016-06-24 08:48:37 +00:00
+								    def _real_initialize(self):
 								        # Attempt a Vimeo login before any extraction takes place.
 								        # This class does not set `_LOGIN_REQUIRED`, so (assuming the base
 								        # class default of False applies) `_login()` simply returns when no
 								        # credentials are configured instead of raising.
 								        self._login()
-												[vimeo] Add support for review pages

Since the regexp is already overboarding and review pages have a distinct URL format (with non-trivial stuff after the ID), use a dedicated IE.
Fixes #2106

											
										
										
											2014-01-06 16:31:47 +00:00
+								    def _real_extract(self, url):
-												[extractor] Common function `_match_valid_url`

											
										
										
											2021-08-19 01:41:24 +00:00
+								        page_url, video_id = self._match_valid_url(url).groups()
-												Update to ytdl v2021-04-01
https://github.com/ytdl-org/youtube-dl/commit/14f29f087e6097feb46bdb84878924bc410a57eb

Closes #205

											
										
										
											2021-04-01 08:28:33 +00:00
+								        data = self._download_json(
 								            page_url.replace('/review/', '/review/data/'), video_id)
 								        if data.get('isLocked') is True:
 								            video_password = self._get_video_password()
 								            viewer = self._download_json(
 								                'https://vimeo.com/_rv/viewer', video_id)
 								            webpage = self._verify_video_password(
 								                'https://vimeo.com/' + video_id, video_id,
 								                video_password, viewer['xsrft'], viewer['vuid'])
 								            clip_page_config = self._parse_json(self._search_regex(
 								                r'window\.vimeo\.clip_page_config\s*=\s*({.+?});',
 								                webpage, 'clip page config'), video_id)
 								            config_url = clip_page_config['player']['config_url']
 								            clip_data = clip_page_config.get('clip') or {}
 								        else:
 								            clip_data = data['clipData']
 								            config_url = clip_data['configUrl']
-												[vimeo:review] Fix extraction for password-protected videos

Closes #9853

											
										
										
											2016-06-24 08:48:37 +00:00
+								        config = self._download_json(config_url, video_id)
-												[vimeo] Fix extraction for VimeoReview videos

											
										
										
											2016-06-11 13:35:08 +00:00
+								        info_dict = self._parse_config(config, video_id)
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								        source_format = self._extract_original_format(
 								            page_url + '/action', video_id)
-												[vimeo:review] improve config url extraction and extract original format(closes #20305)

											
										
										
											2019-03-10 14:03:32 +00:00
+								        if source_format:
 								            info_dict['formats'].append(source_format)
-												[vimeo] Fix extraction for VimeoReview videos

											
										
										
											2016-06-11 13:35:08 +00:00
+								        self._vimeo_sort_formats(info_dict['formats'])
-												[vimeo] improve extraction

- fix review extraction
- fix ondemand extraction
- make password protected player case as an expected error(closes #22896)
- simplify channel based extractors code

											
										
										
											2019-11-27 12:57:30 +00:00
+								        info_dict['description'] = clean_html(clip_data.get('description'))
-												[vimeo] Fix extraction for VimeoReview videos

											
										
										
											2016-06-11 13:35:08 +00:00
+								        return info_dict
-												[vimeo] Add an extractor for the watch later list (closes #2787)

											
										
										
											2014-04-24 19:51:20 +00:00
-												[vimeo] Fix login (Closes #6488)

											
										
										
											2015-08-10 17:35:08 +00:00
+								class VimeoWatchLaterIE(VimeoChannelIE):
-												[vimeo] Add an extractor for the watch later list (closes #2787)

											
										
										
											2014-04-24 19:51:20 +00:00
+								    IE_NAME = 'vimeo:watchlater'
 								    IE_DESC = 'Vimeo watch later list, "vimeowatchlater" keyword (requires authentication)'
-												[vimeo:watchlater] Fix extraction (Closes #3886)

											
										
										
											2015-08-10 17:58:01 +00:00
+								    _VALID_URL = r'https://vimeo\.com/(?:home/)?watchlater|:vimeowatchlater'
 								    _TITLE = 'Watch Later'
-												[vimeo] Add an extractor for the watch later list (closes #2787)

											
										
										
											2014-04-24 19:51:20 +00:00
+								    _LOGIN_REQUIRED = True
-												[vimeo] Move all testcases to extractors and clean up

Previously, these extractors all defined their own suitable methods.
Now test_all_urls tests that everything is in order, automatically :)

											
										
										
											2014-08-27 09:36:01 +00:00
+								    _TESTS = [{
-												[vimeo:watchlater] Fix extraction (Closes #3886)

											
										
										
											2015-08-10 17:58:01 +00:00
+								        'url': 'https://vimeo.com/watchlater',
-												[vimeo] Move all testcases to extractors and clean up

Previously, these extractors all defined their own suitable methods.
Now test_all_urls tests that everything is in order, automatically :)

											
										
										
											2014-08-27 09:36:01 +00:00
+								        'only_matching': True,
 								    }]
-												[vimeo] Add an extractor for the watch later list (closes #2787)

											
										
										
											2014-04-24 19:51:20 +00:00
 								    def _real_initialize(self):
 								        # The watch later list requires authentication (see IE_DESC).
 								        # Because this class sets `_LOGIN_REQUIRED = True`, `_login()` raises
 								        # an expected ExtractorError when no login info is available.
 								        self._login()
 								    def _page_url(self, base_url, pagenum):
 								        url = '%s/page:%d/' % (base_url, pagenum)
-												Rename compat_urllib_request_Request to sanitized_Request and move to utils

											
										
										
											2015-11-20 14:33:49 +00:00
+								        request = sanitized_Request(url)
-												[vimeo] Add an extractor for the watch later list (closes #2787)

											
										
										
											2014-04-24 19:51:20 +00:00
+								        # Set the header to get a partial html page with the ids,
 								        # the normal page doesn't contain them.
 								        request.add_header('X-Requested-With', 'XMLHttpRequest')
 								        return request
 								    def _real_extract(self, url):
-												[vimeo:watchlater] Fix extraction (Closes #3886)

											
										
										
											2015-08-10 17:58:01 +00:00
+								        return self._extract_videos('watchlater', 'https://vimeo.com/watchlater')
-												[vimeo:likes] Add new extractor (Fixes #3835)

											
										
										
											2014-09-28 10:14:16 +00:00
-												[vimeo:likes] Implement extractor in terms of channel extractor

This allows obtaining videos' ids before extraction (#21493)

											
										
										
											2019-06-22 19:13:46 +00:00
+								class VimeoLikesIE(VimeoChannelIE):
-												[vimeo:likes] Relax _VALID_URL and fix single page likes extraction (closes #16475)

											
										
										
											2018-05-17 16:21:40 +00:00
+								    _VALID_URL = r'https://(?:www\.)?vimeo\.com/(?P<id>[^/]+)/likes/?(?:$|[?#]|sort:)'
-												[vimeo:likes] Add new extractor (Fixes #3835)

											
										
										
											2014-09-28 10:14:16 +00:00
+								    IE_NAME = 'vimeo:likes'
 								    IE_DESC = 'Vimeo user likes'
-												[vimeo:likes] Relax _VALID_URL and fix single page likes extraction (closes #16475)

											
										
										
											2018-05-17 16:21:40 +00:00
+								    _TESTS = [{
-												[vimeo:likes] Support large like lists (Fixes #3847)

											
										
										
											2014-09-28 22:36:06 +00:00
+								        'url': 'https://vimeo.com/user755559/likes/',
 								        'playlist_mincount': 293,
-												[refactor] Single quotes consistency

											
										
										
											2016-02-14 09:37:17 +00:00
+								        'info_dict': {
-												[vimeo:likes] Implement extractor in terms of channel extractor

This allows obtaining videos' ids before extraction (#21493)

											
										
										
											2019-06-22 19:13:46 +00:00
+								            'id': 'user755559',
 								            'title': 'urza’s Likes',
-												[vimeo:likes] Add new extractor (Fixes #3835)

											
										
										
											2014-09-28 10:14:16 +00:00
+								        },
-												[vimeo:likes] Relax _VALID_URL and fix single page likes extraction (closes #16475)

											
										
										
											2018-05-17 16:21:40 +00:00
+								    }, {
 								        'url': 'https://vimeo.com/stormlapse/likes',
 								        'only_matching': True,
 								    }]
-												[vimeo:likes] Add new extractor (Fixes #3835)

											
										
										
											2014-09-28 10:14:16 +00:00
-												[vimeo:likes] Implement extractor in terms of channel extractor

This allows obtaining videos' ids before extraction (#21493)

											
										
										
											2019-06-22 19:13:46 +00:00
+								    def _page_url(self, base_url, pagenum):
 								        # Build the URL of page number `pagenum` by appending a
 								        # `/page:<n>/` suffix to `base_url`; a plain string is returned.
 								        # NOTE(review): presumably consumed by the paging logic inherited
 								        # from VimeoChannelIE - confirm against that class.
 								        return '%s/page:%d/' % (base_url, pagenum)
-												[vimeo:likes] Add new extractor (Fixes #3835)

											
										
										
											2014-09-28 10:14:16 +00:00
+								    def _real_extract(self, url):
 								        user_id = self._match_id(url)
-												[vimeo:likes] Implement extractor in terms of channel extractor

This allows obtaining videos' ids before extraction (#21493)

											
										
										
											2019-06-22 19:13:46 +00:00
+								        return self._extract_videos(user_id, 'https://vimeo.com/%s/likes' % user_id)
-												[vimeo] Add support for VHX(Vimeo OTT)(#14835)

											
										
										
											2018-11-28 18:53:22 +00:00
-												[vimeo] fix VHX embed extraction

											
										
										
											2019-10-14 17:37:35 +00:00
+								class VHXEmbedIE(VimeoBaseInfoExtractor):
-												[vimeo] Add support for VHX(Vimeo OTT)(#14835)

											
										
										
											2018-11-28 18:53:22 +00:00
+								    IE_NAME = 'vhx:embed'
 								    _VALID_URL = r'https?://embed\.vhx\.tv/videos/(?P<id>\d+)'
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 12:26:37 +00:00
+								    @staticmethod
 								    def _extract_url(webpage):
 								        # Look for the first <iframe> in `webpage` whose double-quoted
 								        # `src` attribute points at an embed.vhx.tv video. Return that URL
 								        # with HTML entities unescaped, or None when no such iframe exists.
 								        mobj = re.search(
 								            r'<iframe[^>]+src="(https?://embed\.vhx\.tv/videos/\d+[^"]*)"', webpage)
 								        return unescapeHTML(mobj.group(1)) if mobj else None
-												[vimeo] Add support for VHX(Vimeo OTT)(#14835)

											
										
										
											2018-11-28 18:53:22 +00:00
+								    def _real_extract(self, url):
 								        video_id = self._match_id(url)
 								        webpage = self._download_webpage(url, video_id)
-												[vimeo] fix VHX embed extraction

											
										
										
											2019-10-14 17:37:35 +00:00
+								        config_url = self._parse_json(self._search_regex(
 								            r'window\.OTTData\s*=\s*({.+})', webpage,
 								            'ott data'), video_id, js_to_json)['config_url']
 								        config = self._download_json(config_url, video_id)
 								        info = self._parse_config(config, video_id)
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 12:26:37 +00:00
+								        info['id'] = video_id
-												[vimeo] fix VHX embed extraction

											
										
										
											2019-10-14 17:37:35 +00:00
+								        self._vimeo_sort_formats(info['formats'])
 								        return info