# yt-dlp/yt_dlp/extractor/generic.py

import os
import re
import types
import urllib.parse
import xml.etree.ElementTree

from .common import InfoExtractor  # isort: split
from .commonprotocols import RtmpIE
from .youtube import YoutubeIE
from ..compat import compat_etree_fromstring
from ..utils import (
    KNOWN_EXTENSIONS,
    MEDIA_EXTENSIONS,
    ExtractorError,
    UnsupportedError,
    determine_ext,
    determine_protocol,
    dict_get,
    extract_basic_auth,
    filter_dict,
    format_field,
    int_or_none,
    is_html,
    js_to_json,
    merge_dicts,
    mimetype2ext,
    orderedSet,
    parse_duration,
    parse_resolution,
    smuggle_url,
    str_or_none,
    traverse_obj,
    try_call,
    unescapeHTML,
    unified_timestamp,
    unsmuggle_url,
    update_url_query,
    url_or_none,
    urlhandle_detect_ext,
    urljoin,
    variadic,
    xpath_attr,
    xpath_text,
    xpath_with_ns,
)


class GenericIE(InfoExtractor):
    IE_DESC = 'Generic downloader that works on some sites'
    _VALID_URL = r'.*'
    IE_NAME = 'generic'
    _NETRC_MACHINE = False  # Suppress username warning
    _TESTS = [
        # Direct link to a video
        {
            'url': 'http://media.w3.org/2010/05/sintel/trailer.mp4',
            'md5': '67d406c2bcb6af27fa886f31aa934bbe',
            'info_dict': {
                'id': 'trailer',
                'ext': 'mp4',
                'title': 'trailer',
                'upload_date': '20100513',
                'direct': True,
                'timestamp': 1273772943.0,
            }
        },
        # Direct link to media delivered compressed (until Accept-Encoding is *)
        {
            'url': 'http://calimero.tk/muzik/FictionJunction-Parallel_Hearts.flac',
            'md5': '128c42e68b13950268b648275386fc74',
            'info_dict': {
                'id': 'FictionJunction-Parallel_Hearts',
                'ext': 'flac',
                'title': 'FictionJunction-Parallel_Hearts',
                'upload_date': '20140522',
            },
            'expected_warnings': [
                'URL could be a direct video link, returning it as such.'
            ],
            'skip': 'URL invalid',
        },
        # Direct download with broken HEAD
        {
            'url': 'http://ai-radio.org:8000/radio.opus',
            'info_dict': {
                'id': 'radio',
                'ext': 'opus',
                'title': 'radio',
            },
            'params': {
                'skip_download': True,  # infinite live stream
            },
            'expected_warnings': [
                r'501.*Not Implemented',
                r'400.*Bad Request',
            ],
        },
        # Direct link with incorrect MIME type
        {
            'url': 'http://ftp.nluug.nl/video/nluug/2014-11-20_nj14/zaal-2/5_Lennart_Poettering_-_Systemd.webm',
            'md5': '4ccbebe5f36706d85221f204d7eb5913',
            'info_dict': {
                'url': 'http://ftp.nluug.nl/video/nluug/2014-11-20_nj14/zaal-2/5_Lennart_Poettering_-_Systemd.webm',
                'id': '5_Lennart_Poettering_-_Systemd',
                'ext': 'webm',
                'title': '5_Lennart_Poettering_-_Systemd',
                'upload_date': '20141120',
                'direct': True,
                'timestamp': 1416498816.0,
            },
            'expected_warnings': [
                'URL could be a direct video link, returning it as such.'
            ]
        },
        # RSS feed
        {
            'url': 'http://phihag.de/2014/youtube-dl/rss2.xml',
            'info_dict': {
                'id': 'https://phihag.de/2014/youtube-dl/rss2.xml',
                'title': 'Zero Punctuation',
                'description': 're:.*groundbreaking video review series.*'
            },
            'playlist_mincount': 11,
        },
        # RSS feed with enclosure
        {
            'url': 'http://podcastfeeds.nbcnews.com/audio/podcast/MSNBC-MADDOW-NETCAST-M4V.xml',
            'info_dict': {
                'id': 'http://podcastfeeds.nbcnews.com/nbcnews/video/podcast/MSNBC-MADDOW-NETCAST-M4V.xml',
                'title': 'MSNBC Rachel Maddow (video)',
                'description': 're:.*her unique approach to storytelling.*',
            },
            'playlist': [{
                'info_dict': {
                    'ext': 'mov',
                    'id': 'pdv_maddow_netcast_mov-12-03-2020-223726',
                    'title': 'MSNBC Rachel Maddow (video) - 12-03-2020-223726',
                    'description': 're:.*her unique approach to storytelling.*',
                    'upload_date': '20201204',
                },
            }],
            'skip': 'Dead link',
        },
        # RSS feed with item with description and thumbnails
        {
            'url': 'https://anchor.fm/s/dd00e14/podcast/rss',
            'info_dict': {
                'id': 'https://anchor.fm/s/dd00e14/podcast/rss',
                'title': 're:.*100% Hydrogen.*',
                'description': 're:.*In this episode.*',
            },
            'playlist': [{
                'info_dict': {
                    'ext': 'm4a',
                    'id': '818a5d38-01cd-152f-2231-ee479677fa82',
                    'title': 're:Hydrogen!',
                    'description': 're:.*In this episode we are going.*',
                    'timestamp': 1567977776,
                    'upload_date': '20190908',
                    'duration': 423,
                    'thumbnail': r're:^https?://.*\.jpg$',
                    'episode_number': 1,
                    'season_number': 1,
                    'age_limit': 0,
                    'season': 'Season 1',
                    'direct': True,
                    'episode': 'Episode 1',
                },
            }],
            'params': {
                'skip_download': True,
            },
        },
        # RSS feed with enclosures and unsupported link URLs
        {
            'url': 'http://www.hellointernet.fm/podcast?format=rss',
            'info_dict': {
                'id': 'http://www.hellointernet.fm/podcast?format=rss',
                'description': 'CGP Grey and Brady Haran talk about YouTube, life, work, whatever.',
                'title': 'Hello Internet',
            },
            'playlist_mincount': 100,
        },
        # RSS feed with guid
        {
            'url': 'https://www.omnycontent.com/d/playlist/a7b4f8fe-59d9-4afc-a79a-a90101378abf/bf2c1d80-3656-4449-9d00-a903004e8f84/efbff746-e7c1-463a-9d80-a903004e8f8f/podcast.rss',
            'info_dict': {
                'id': 'https://www.omnycontent.com/d/playlist/a7b4f8fe-59d9-4afc-a79a-a90101378abf/bf2c1d80-3656-4449-9d00-a903004e8f84/efbff746-e7c1-463a-9d80-a903004e8f8f/podcast.rss',
                'description': 'md5:be809a44b63b0c56fb485caf68685520',
                'title': 'The Little Red Podcast',
            },
            'playlist_mincount': 76,
        },
        # SMIL from http://videolectures.net/promogram_igor_mekjavic_eng
        {
            'url': 'http://videolectures.net/promogram_igor_mekjavic_eng/video/1/smil.xml',
            'info_dict': {
                'id': 'smil',
                'ext': 'mp4',
                'title': 'Automatics, robotics and biocybernetics',
                'description': 'md5:815fc1deb6b3a2bff99de2d5325be482',
                'upload_date': '20130627',
                'formats': 'mincount:16',
                'subtitles': 'mincount:1',
            },
            'params': {
                'force_generic_extractor': True,
                'skip_download': True,
            },
        },
        # SMIL from http://www1.wdr.de/mediathek/video/livestream/index.html
        {
            'url': 'http://metafilegenerator.de/WDR/WDR_FS/hds/hds.smil',
            'info_dict': {
                'id': 'hds',
                'ext': 'flv',
                'title': 'hds',
                'formats': 'mincount:1',
            },
            'params': {
                'skip_download': True,
            },
        },
        # SMIL from https://www.restudy.dk/video/play/id/1637
        {
            'url': 'https://www.restudy.dk/awsmedia/SmilDirectory/video_1637.xml',
            'info_dict': {
                'id': 'video_1637',
                'ext': 'flv',
                'title': 'video_1637',
                'formats': 'mincount:3',
            },
            'params': {
                'skip_download': True,
            },
        },
        # SMIL from http://adventure.howstuffworks.com/5266-cool-jobs-iditarod-musher-video.htm
        {
            'url': 'http://services.media.howstuffworks.com/videos/450221/smil-service.smil',
            'info_dict': {
                'id': 'smil-service',
                'ext': 'flv',
                'title': 'smil-service',
                'formats': 'mincount:1',
            },
            'params': {
                'skip_download': True,
            },
        },
        # SMIL from http://new.livestream.com/CoheedandCambria/WebsterHall/videos/4719370
        {
            'url': 'http://api.new.livestream.com/accounts/1570303/events/1585861/videos/4719370.smil',
            'info_dict': {
                'id': '4719370',
                'ext': 'mp4',
                'title': '571de1fd-47bc-48db-abf9-238872a58d1f',
                'formats': 'mincount:3',
            },
            'params': {
                'skip_download': True,
            },
        },
        # XSPF playlist from http://www.telegraaf.nl/tv/nieuws/binnenland/24353229/__Tikibad_ontruimd_wegens_brand__.html
        {
            'url': 'http://www.telegraaf.nl/xml/playlist/2015/8/7/mZlp2ctYIUEB.xspf',
            'info_dict': {
                'id': 'mZlp2ctYIUEB',
                'ext': 'mp4',
                'title': 'Tikibad ontruimd wegens brand',
                'description': 'md5:05ca046ff47b931f9b04855015e163a4',
                'thumbnail': r're:^https?://.*\.jpg$',
                'duration': 33,
            },
            'params': {
                'skip_download': True,
            },
            'skip': '404 Not Found',
        },
        # MPD from http://dash-mse-test.appspot.com/media.html
        {
            'url': 'http://yt-dash-mse-test.commondatastorage.googleapis.com/media/car-20120827-manifest.mpd',
            'md5': '4b57baab2e30d6eb3a6a09f0ba57ef53',
            'info_dict': {
                'id': 'car-20120827-manifest',
                'ext': 'mp4',
                'title': 'car-20120827-manifest',
                'formats': 'mincount:9',
                'upload_date': '20130904',
                'timestamp': 1378272859.0,
            },
        },
        # m3u8 served with Content-Type: audio/x-mpegURL; charset=utf-8
        {
            'url': 'http://once.unicornmedia.com/now/master/playlist/bb0b18ba-64f5-4b1b-a29f-0ac252f06b68/77a785f3-5188-4806-b788-0893a61634ed/93677179-2d99-4ef4-9e17-fe70d49abfbf/content.m3u8',
            'info_dict': {
                'id': 'content',
                'ext': 'mp4',
                'title': 'content',
                'formats': 'mincount:8',
            },
            'params': {
                # m3u8 downloads
                'skip_download': True,
            },
            'skip': 'video gone',
        },
        # m3u8 served with Content-Type: text/plain
        {
            'url': 'http://www.nacentapps.com/m3u8/index.m3u8',
            'info_dict': {
                'id': 'index',
                'ext': 'mp4',
                'title': 'index',
                'upload_date': '20140720',
                'formats': 'mincount:11',
            },
            'params': {
                # m3u8 downloads
                'skip_download': True,
            },
            'skip': 'video gone',
        },
        # google redirect
        {
            'url': 'http://www.google.com/url?sa=t&rct=j&q=&esrc=s&source=web&cd=1&cad=rja&ved=0CCUQtwIwAA&url=http%3A%2F%2Fwww.youtube.com%2Fwatch%3Fv%3DcmQHVoWB5FY&ei=F-sNU-LLCaXk4QT52ICQBQ&usg=AFQjCNEw4hL29zgOohLXvpJ-Bdh2bils1Q&bvm=bv.61965928,d.bGE',
            'info_dict': {
                'id': 'cmQHVoWB5FY',
                'ext': 'mp4',
                'upload_date': '20130224',
                'uploader_id': '@TheVerge',
                'description': r're:^Chris Ziegler takes a look at the\.*',
                'uploader': 'The Verge',
                'title': 'First Firefox OS phones side-by-side',
            },
            'params': {
                'skip_download': False,
            }
        },
        {
            # redirect in Refresh HTTP header
            'url': 'https://www.facebook.com/l.php?u=https%3A%2F%2Fwww.youtube.com%2Fwatch%3Fv%3DpO8h3EaFRdo&h=TAQHsoToz&enc=AZN16h-b6o4Zq9pZkCCdOLNKMN96BbGMNtcFwHSaazus4JHT_MFYkAA-WARTX2kvsCIdlAIyHZjl6d33ILIJU7Jzwk_K3mcenAXoAzBNoZDI_Q7EXGDJnIhrGkLXo_LJ_pAa2Jzbx17UHMd3jAs--6j2zaeto5w9RTn8T_1kKg3fdC5WPX9Dbb18vzH7YFX0eSJmoa6SP114rvlkw6pkS1-T&s=1',
            'info_dict': {
                'id': 'pO8h3EaFRdo',
                'ext': 'mp4',
                'title': 'Tripeo Boiler Room x Dekmantel Festival DJ Set',
                'description': 'md5:6294cc1af09c4049e0652b51a2df10d5',
                'upload_date': '20150917',
                'uploader_id': 'brtvofficial',
                'uploader': 'Boiler Room',
            },
            'params': {
                'skip_download': False,
            },
        },
        {
            'url': 'http://www.hodiho.fr/2013/02/regis-plante-sa-jeep.html',
            'md5': '85b90ccc9d73b4acd9138d3af4c27f89',
            'info_dict': {
                'id': '13601338388002',
                'ext': 'mp4',
                'uploader': 'www.hodiho.fr',
                'title': 'R\u00e9gis plante sa Jeep',
            }
        },
        # bandcamp page with custom domain
        {
            'add_ie': ['Bandcamp'],
            'url': 'http://bronyrock.com/track/the-pony-mash',
            'info_dict': {
                'id': '3235767654',
                'ext': 'mp3',
                'title': 'The Pony Mash',
                'uploader': 'M_Pallante',
            },
            'skip': 'There is a limit of 200 free downloads / month for the test song',
        },
        # embed.ly video
        {
            'url': 'http://www.tested.com/science/weird/460206-tested-grinding-coffee-2000-frames-second/',
            'info_dict': {
                'id': '9ODmcdjQcHQ',
                'ext': 'mp4',
                'title': 'Tested: Grinding Coffee at 2000 Frames Per Second',
                'upload_date': '20140225',
                'description': 'md5:06a40fbf30b220468f1e0957c0f558ff',
                'uploader': 'Tested',
                'uploader_id': 'testedcom',
            },
            # No need to test YoutubeIE here
            'params': {
                'skip_download': True,
            },
        },
        # funnyordie embed
        {
            'url': 'http://www.theguardian.com/world/2014/mar/11/obama-zach-galifianakis-between-two-ferns',
            'info_dict': {
                'id': '18e820ec3f',
                'ext': 'mp4',
                'title': 'Between Two Ferns with Zach Galifianakis: President Barack Obama',
                'description': 'Episode 18: President Barack Obama sits down with Zach Galifianakis for his most memorable interview yet.',
            },
            # HEAD requests lead to endless 301, while GET is OK
            'expected_warnings': ['301'],
        },
        # RUTV embed
        {
            'url': 'http://www.rg.ru/2014/03/15/reg-dfo/anklav-anons.html',
            'info_dict': {
                'id': '776940',
                'ext': 'mp4',
                'title': 'Охотское море стало целиком российским',
                'description': 'md5:5ed62483b14663e2a95ebbe115eb8f43',
            },
            'params': {
                # m3u8 download
                'skip_download': True,
            },
        },
        # TVC embed
        {
            'url': 'http://sch1298sz.mskobr.ru/dou_edu/karamel_ki/filial_galleries/video/iframe_src_http_tvc_ru_video_iframe_id_55304_isplay_false_acc_video_id_channel_brand_id_11_show_episodes_episode_id_32307_frameb/',
            'info_dict': {
                'id': '55304',
                'ext': 'mp4',
                'title': 'Дошкольное воспитание',
            },
        },
        # SportBox embed
        {
            'url': 'http://www.vestifinance.ru/articles/25753',
            'info_dict': {
                'id': '25753',
                'title': 'Прямые трансляции с Форума-выставки "Госзаказ-2013"',
            },
            'playlist': [{
                'info_dict': {
                    'id': '370908',
                    'title': 'Госзаказ. День 3',
                    'ext': 'mp4',
                }
            }, {
                'info_dict': {
                    'id': '370905',
                    'title': 'Госзаказ. День 2',
                    'ext': 'mp4',
                }
            }, {
                'info_dict': {
                    'id': '370902',
                    'title': 'Госзаказ. День 1',
                    'ext': 'mp4',
                }
            }],
            'params': {
                # m3u8 download
                'skip_download': True,
            },
        },
        # Myvi.ru embed
        {
            'url': 'http://www.kinomyvi.tv/news/detail/Pervij-dublirovannij-trejler--Uzhastikov-_nOw1',
            'info_dict': {
                'id': 'f4dafcad-ff21-423d-89b5-146cfd89fa1e',
                'ext': 'mp4',
                'title': 'Ужастики, русский трейлер (2015)',
                'thumbnail': r're:^https?://.*\.jpg$',
                'duration': 153,
            },
            'skip': 'Site dead',
        },
        # XHamster embed
        {
            'url': 'http://www.numisc.com/forum/showthread.php?11696-FM15-which-pumiscer-was-this-%28-vid-%29-%28-alfa-as-fuck-srx-%29&s=711f5db534502e22260dec8c5e2d66d8',
            'info_dict': {
                'id': 'showthread',
                'title': '[NSFL] [FM15] which pumiscer was this ( vid ) ( alfa as fuck srx )',
            },
            'playlist_mincount': 7,
            # This forum no longer allows <iframe> markup in posts;
            # HTML tags are now displayed as-is, so nothing is embedded
            'skip': 'No videos on this page',
        },
        # Embedded TED video
        {
            'url': 'http://en.support.wordpress.com/videos/ted-talks/',
            'md5': '65fdff94098e4a607385a60c5177c638',
            'info_dict': {
                'id': '1969',
                'ext': 'mp4',
                'title': 'Hidden miracles of the natural world',
                'uploader': 'Louie Schwartzberg',
                'description': 'md5:8145d19d320ff3e52f28401f4c4283b9',
            }
        },
        # nowvideo embed hidden behind percent encoding
        {
            'url': 'http://www.waoanime.tv/the-super-dimension-fortress-macross-episode-1/',
            'md5': '2baf4ddd70f697d94b1c18cf796d5107',
            'info_dict': {
                'id': '06e53103ca9aa',
                'ext': 'flv',
                'title': 'Macross Episode 001  Watch Macross Episode 001 onl',
                'description': 'No description',
            },
        },
        # arte embed
        {
            'url': 'http://www.tv-replay.fr/redirection/20-03-14/x-enius-arte-10753389.html',
            'md5': '7653032cbb25bf6c80d80f217055fa43',
            'info_dict': {
                'id': '048195-004_PLUS7-F',
                'ext': 'flv',
                'title': 'X:enius',
                'description': 'md5:d5fdf32ef6613cdbfd516ae658abf168',
                'upload_date': '20140320',
            },
            'params': {
                'skip_download': 'Requires rtmpdump'
            },
            'skip': 'video gone',
        },
        # francetv embed
        {
            'url': 'http://www.tsprod.com/replay-du-concert-alcaline-de-calogero',
            'info_dict': {
                'id': 'EV_30231',
                'ext': 'mp4',
                'title': 'Alcaline, le concert avec Calogero',
                'description': 'md5:61f08036dcc8f47e9cfc33aed08ffaff',
                'upload_date': '20150226',
                'timestamp': 1424989860,
                'duration': 5400,
            },
            'params': {
                # m3u8 downloads
                'skip_download': True,
            },
            'expected_warnings': [
                'Forbidden'
            ]
        },
        # Condé Nast embed
        {
            'url': 'http://www.wired.com/2014/04/honda-asimo/',
            'md5': 'ba0dfe966fa007657bd1443ee672db0f',
            'info_dict': {
                'id': '53501be369702d3275860000',
                'ext': 'mp4',
                'title': 'Honda’s  New Asimo Robot Is More Human Than Ever',
            }
        },
        # Dailymotion embed
        {
            'url': 'http://www.spi0n.com/zap-spi0n-com-n216/',
            'md5': '441aeeb82eb72c422c7f14ec533999cd',
            'info_dict': {
                'id': 'k2mm4bCdJ6CQ2i7c8o2',
                'ext': 'mp4',
                'title': 'Le Zap de Spi0n n°216 - Zapping du Web',
                'description': 'md5:faf028e48a461b8b7fad38f1e104b119',
                'uploader': 'Spi0n',
                'uploader_id': 'xgditw',
                'upload_date': '20140425',
                'timestamp': 1398441542,
            },
            'add_ie': ['Dailymotion'],
        },
        # DailyMail embed
        {
            'url': 'http://www.bumm.sk/krimi/2017/07/05/biztonsagi-kamera-buktatta-le-az-agg-ferfit-utlegelo-apolot',
            'info_dict': {
                'id': '1495629',
                'ext': 'mp4',
                'title': 'Care worker punches elderly dementia patient in head 11 times',
                'description': 'md5:3a743dee84e57e48ec68bf67113199a5',
            },
            'add_ie': ['DailyMail'],
            'params': {
                'skip_download': True,
            },
        },
        # YouTube embed
        {
            'url': 'http://www.badzine.de/ansicht/datum/2014/06/09/so-funktioniert-die-neue-englische-badminton-liga.html',
            'info_dict': {
                'id': 'FXRb4ykk4S0',
                'ext': 'mp4',
                'title': 'The NBL Auction 2014',
                'uploader': 'BADMINTON England',
                'uploader_id': 'BADMINTONEvents',
                'upload_date': '20140603',
                'description': 'md5:9ef128a69f1e262a700ed83edb163a73',
            },
            'add_ie': ['Youtube'],
            'params': {
                'skip_download': True,
            }
        },
        # MTVServices embed
        {
            'url': 'http://www.vulture.com/2016/06/new-key-peele-sketches-released.html',
            'md5': 'ca1aef97695ef2c1d6973256a57e5252',
            'info_dict': {
                'id': '769f7ec0-0692-4d62-9b45-0d88074bffc1',
                'ext': 'mp4',
                'title': 'Key and Peele|October 10, 2012|2|203|Liam Neesons - Uncensored',
                'description': 'Two valets share their love for movie star Liam Neesons.',
                'timestamp': 1349922600,
                'upload_date': '20121011',
            },
        },
        # YouTube embed via <data-embed-url="">
        {
            'url': 'https://play.google.com/store/apps/details?id=com.gameloft.android.ANMP.GloftA8HM',
            'info_dict': {
                'id': '4vAffPZIT44',
                'ext': 'mp4',
                'title': 'Asphalt 8: Airborne - Update - Welcome to Dubai!',
                'uploader': 'Gameloft',
                'uploader_id': 'gameloft',
                'upload_date': '20140828',
                'description': 'md5:c80da9ed3d83ae6d1876c834de03e1c4',
            },
            'params': {
                'skip_download': True,
            }
        },
        # Flowplayer
        {
            'url': 'http://www.handjobhub.com/video/busty-blonde-siri-tit-fuck-while-wank-6313.html',
            'md5': '9d65602bf31c6e20014319c7d07fba27',
            'info_dict': {
                'id': '5123ea6d5e5a7',
                'ext': 'mp4',
                'age_limit': 18,
                'uploader': 'www.handjobhub.com',
                'title': 'Busty Blonde Siri Tit Fuck While Wank at HandjobHub.com',
            }
        },
        # MLB embed
        {
            'url': 'http://umpire-empire.com/index.php/topic/58125-laz-decides-no-thats-low/',
            'md5': '96f09a37e44da40dd083e12d9a683327',
            'info_dict': {
                'id': '33322633',
                'ext': 'mp4',
                'title': 'Ump changes call to ball',
                'description': 'md5:71c11215384298a172a6dcb4c2e20685',
                'duration': 48,
                'timestamp': 1401537900,
                'upload_date': '20140531',
                'thumbnail': r're:^https?://.*\.jpg$',
            },
        },
        # Wistia standard embed (async)
        {
            'url': 'https://www.getdrip.com/university/brennan-dunn-drip-workshop/',
            'info_dict': {
                'id': '807fafadvk',
                'ext': 'mp4',
                'title': 'Drip Brennan Dunn Workshop',
                'description': 'a JV Webinars video from getdrip-1',
                'duration': 4986.95,
                'timestamp': 1463607249,
                'upload_date': '20160518',
            },
            'params': {
                'skip_download': True,
            },
            'skip': 'webpage 404 not found',
        },
        # Soundcloud embed
        {
            'url': 'http://nakedsecurity.sophos.com/2014/10/29/sscc-171-are-you-sure-that-1234-is-a-bad-password-podcast/',
            'info_dict': {
                'id': '174391317',
                'ext': 'mp3',
                'description': 'md5:ff867d6b555488ad3c52572bb33d432c',
                'uploader': 'Sophos Security',
                'title': 'Chet Chat 171 - Oct 29, 2014',
                'upload_date': '20141029',
            }
        },
        # Soundcloud multiple embeds
        {
            'url': 'http://www.guitarplayer.com/lessons/1014/legato-workout-one-hour-to-more-fluid-performance---tab/52809',
            'info_dict': {
                'id': '52809',
                'title': 'Guitar Essentials: Legato Workout—One-Hour to Fluid Performance  | TAB + AUDIO',
            },
            'playlist_mincount': 7,
        },
        # TuneIn station embed
        {
            'url': 'http://radiocnrv.com/promouvoir-radio-cnrv/',
            'info_dict': {
                'id': '204146',
                'ext': 'mp3',
                'title': 'CNRV',
                'location': 'Paris, France',
                'is_live': True,
            },
            'params': {
                # Live stream
                'skip_download': True,
            },
        },
        # Livestream embed
        {
            'url': 'http://www.esa.int/Our_Activities/Space_Science/Rosetta/Philae_comet_touch-down_webcast',
            'info_dict': {
                'id': '67864563',
                'ext': 'flv',
                'upload_date': '20141112',
                'title': 'Rosetta #CometLanding webcast HL 10',
            }
        },
        # Another Livestream embed, without 'new.' in URL
        {
            'url': 'https://www.freespeech.org/',
            'info_dict': {
                'id': '123537347',
                'ext': 'mp4',
                'title': 're:^FSTV [0-9]{4}-[0-9]{2}-[0-9]{2} [0-9]{2}:[0-9]{2}$',
            },
            'params': {
                # Live stream
                'skip_download': True,
            },
        },
        # LazyYT
        {
            'url': 'https://skiplagged.com/',
            'info_dict': {
                'id': 'skiplagged',
                'title': 'Skiplagged: The smart way to find cheap flights',
            },
            'playlist_mincount': 1,
            'add_ie': ['Youtube'],
        },
        # Libsyn embed
        {
            'url': 'http://undergroundwellness.com/podcasts/306-5-steps-to-permanent-gut-healing/',
            'info_dict': {
                'id': '3793998',
                'ext': 'mp3',
                'upload_date': '20141126',
                'title': 'Underground Wellness Radio - Jack Tips: 5 Steps to Permanent Gut Healing',
                'thumbnail': 'https://assets.libsyn.com/secure/item/3793998/?height=90&width=90',
                'duration': 3989.0,
            }
        },
        # Cinerama player
        {
            'url': 'http://www.abc.net.au/7.30/content/2015/s4164797.htm',
            'info_dict': {
                'id': '730m_DandD_1901_512k',
                'ext': 'mp4',
                'uploader': 'www.abc.net.au',
                'title': 'Game of Thrones with dice - Dungeons and Dragons fantasy role-playing game gets new life - 19/01/2015',
            }
        },
        # embedded viddler video
        {
            'url': 'http://deadspin.com/i-cant-stop-watching-john-wall-chop-the-nuggets-with-th-1681801597',
            'info_dict': {
                'id': '4d03aad9',
                'ext': 'mp4',
                'uploader': 'deadspin',
                'title': 'WALL-TO-GORTAT',
                'timestamp': 1422285291,
                'upload_date': '20150126',
            },
            'add_ie': ['Viddler'],
        },
        # Libsyn embed
        {
            'url': 'http://thedailyshow.cc.com/podcast/episodetwelve',
            'info_dict': {
                'id': '3377616',
                'ext': 'mp3',
                'title': "The Daily Show Podcast without Jon Stewart - Episode 12: Bassem Youssef: Egypt's Jon Stewart",
                'description': 'md5:601cb790edd05908957dae8aaa866465',
                'upload_date': '20150220',
            },
            'skip': 'All The Daily Show URLs now redirect to http://www.cc.com/shows/',
        },
        # jwplayer YouTube
        {
            'url': 'http://media.nationalarchives.gov.uk/index.php/webinar-using-discovery-national-archives-online-catalogue/',
            'info_dict': {
                'id': 'Mrj4DVp2zeA',
                'ext': 'mp4',
                'upload_date': '20150212',
                'uploader': 'The National Archives UK',
                'description': 'md5:8078af856dca76edc42910b61273dbbf',
                'uploader_id': 'NationalArchives08',
                'title': 'Webinar: Using Discovery, The National Archives’ online catalogue',
            },
        },
        # jwplayer rtmp
        {
            'url': 'http://www.suffolk.edu/sjc/live.php',
            'info_dict': {
                'id': 'live',
                'ext': 'flv',
                'title': 'Massachusetts Supreme Judicial Court Oral Arguments',
                'uploader': 'www.suffolk.edu',
            },
            'params': {
                'skip_download': True,
            },
            'skip': 'Only has video a few mornings per month, see http://www.suffolk.edu/sjc/',
        },
        # jwplayer with only the json URL
        {
            'url': 'https://www.hollywoodreporter.com/news/general-news/dunkirk-team-reveals-what-christopher-nolan-said-oscar-win-meet-your-oscar-winner-1092454',
            'info_dict': {
                'id': 'TljWkvWH',
                'ext': 'mp4',
                'upload_date': '20180306',
                'title': 'md5:91eb1862f6526415214f62c00b453936',
                'description': 'md5:73048ae50ae953da10549d1d2fe9b3aa',
                'timestamp': 1520367225,
            },
            'params': {
                'skip_download': True,
            },
        },
        # Complex jwplayer
        {
            'url': 'http://www.indiedb.com/games/king-machine/videos',
            'info_dict': {
                'id': 'videos',
                'ext': 'mp4',
                'title': 'king machine trailer 1',
                'description': 'Browse King Machine videos & audio for sweet media. Your eyes will thank you.',
                'thumbnail': r're:^https?://.*\.jpg$',
            },
        },
        {
            # YouTube embed, formerly: Video.js embed, multiple formats
            'url': 'http://ortcam.com/solidworks-урок-6-настройка-чертежа_33f9b7351.html',
            'info_dict': {
                'id': 'yygqldloqIk',
                'ext': 'mp4',
                'title': 'SolidWorks. Урок 6 Настройка чертежа',
                'description': 'md5:baf95267792646afdbf030e4d06b2ab3',
                'upload_date': '20130314',
                'uploader': 'PROстое3D',
                'uploader_id': 'PROstoe3D',
            },
            'params': {
                'skip_download': True,
            },
        },
        {
            # Video.js embed, single format
            'url': 'https://www.vooplayer.com/v3/watch/watch.php?v=NzgwNTg=',
            'info_dict': {
                'id': 'watch',
                'ext': 'mp4',
                'title': 'Step 1 -  Good Foundation',
                'description': 'md5:d1e7ff33a29fc3eb1673d6c270d344f4',
            },
            'params': {
                'skip_download': True,
            },
            'skip': '404 Not Found',
        },
        # rtl.nl embed
        {
            'url': 'http://www.rtlnieuws.nl/nieuws/buitenland/aanslagen-kopenhagen',
            'playlist_mincount': 5,
            'info_dict': {
                'id': 'aanslagen-kopenhagen',
                'title': 'Aanslagen Kopenhagen',
            }
        },
        # Zapiks embed
        {
            'url': 'http://www.skipass.com/news/116090-bon-appetit-s5ep3-baqueira-mi-cor.html',
            'info_dict': {
                'id': '118046',
                'ext': 'mp4',
                'title': 'EP3S5 - Bon Appétit - Baqueira Mi Corazon !',
            }
        },
        # Kaltura embed (different embed code)
        {
            'url': 'http://www.premierchristianradio.com/Shows/Saturday/Unbelievable/Conference-Videos/Os-Guinness-Is-It-Fools-Talk-Unbelievable-Conference-2014',
            'info_dict': {
                'id': '1_a52wc67y',
                'ext': 'flv',
                'upload_date': '20150127',
                'uploader_id': 'PremierMedia',
                'timestamp': int,
                'title': 'Os Guinness // Is It Fools Talk? // Unbelievable? Conference 2014',
            },
        },
        # Kaltura embed with single quotes
        {
            'url': 'http://fod.infobase.com/p_ViewPlaylist.aspx?AssignmentID=NUN8ZY',
            'info_dict': {
                'id': '0_izeg5utt',
                'ext': 'mp4',
                'title': '35871',
                'timestamp': 1355743100,
                'upload_date': '20121217',
                'uploader_id': 'cplapp@learn360.com',
            },
            'add_ie': ['Kaltura'],
        },
        {
            # Kaltura embedded via quoted entry_id
            'url': 'https://www.oreilly.com/ideas/my-cloud-makes-pretty-pictures',
            'info_dict': {
                'id': '0_utuok90b',
                'ext': 'mp4',
                'title': '06_matthew_brender_raj_dutt',
                'timestamp': 1466638791,
                'upload_date': '20160622',
            },
            'add_ie': ['Kaltura'],
            'expected_warnings': [
                'Could not send HEAD request'
            ],
            'params': {
                'skip_download': True,
            }
        },
        {
            # Kaltura embedded, some fileExt broken (#11480)
            'url': 'http://www.cornell.edu/video/nima-arkani-hamed-standard-models-of-particle-physics',
            'info_dict': {
                'id': '1_sgtvehim',
                'ext': 'mp4',
                'title': 'Our "Standard Models" of particle physics and cosmology',
                'description': 'md5:67ea74807b8c4fea92a6f38d6d323861',
                'timestamp': 1321158993,
                'upload_date': '20111113',
                'uploader_id': 'kps1',
            },
            'add_ie': ['Kaltura'],
        },
        {
            # Kaltura iframe embed
            'url': 'http://www.gsd.harvard.edu/event/i-m-pei-a-centennial-celebration/',
            'md5': 'ae5ace8eb09dc1a35d03b579a9c2cc44',
            'info_dict': {
                'id': '0_f2cfbpwy',
                'ext': 'mp4',
                'title': 'I. M. Pei: A Centennial Celebration',
                'description': 'md5:1db8f40c69edc46ca180ba30c567f37c',
                'upload_date': '20170403',
                'uploader_id': 'batchUser',
                'timestamp': 1491232186,
            },
            'add_ie': ['Kaltura'],
        },
        {
            # Kaltura iframe embed, more sophisticated
            'url': 'http://www.cns.nyu.edu/~eero/math-tools/Videos/lecture-05sep2017.html',
            'info_dict': {
                'id': '1_9gzouybz',
                'ext': 'mp4',
                'title': 'lecture-05sep2017',
                'description': 'md5:40f347d91fd4ba047e511c5321064b49',
                'upload_date': '20170913',
                'uploader_id': 'eps2',
                'timestamp': 1505340777,
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': ['Kaltura'],
        },
        {
            # meta twitter:player
            'url': 'http://thechive.com/2017/12/08/all-i-want-for-christmas-is-more-twerk/',
            'info_dict': {
                'id': '0_01b42zps',
                'ext': 'mp4',
                'title': 'Main Twerk (Video)',
                'upload_date': '20171208',
                'uploader_id': 'sebastian.salinas@thechive.com',
                'timestamp': 1512713057,
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': ['Kaltura'],
        },
        # referrer protected EaglePlatform embed
        {
            'url': 'https://tvrain.ru/lite/teleshow/kak_vse_nachinalos/namin-418921/',
            'info_dict': {
                'id': '582306',
                'ext': 'mp4',
                'title': 'Стас Намин: «Мы нарушили девственность Кремля»',
                'thumbnail': r're:^https?://.*\.jpg$',
                'duration': 3382,
                'view_count': int,
            },
            'params': {
                'skip_download': True,
            },
        },
        # ClipYou (EaglePlatform) embed (custom URL)
        {
            'url': 'http://muz-tv.ru/play/7129/',
            # Not checking MD5 as sometimes the direct HTTP link results in 404 and HLS is used
            'info_dict': {
                'id': '12820',
                'ext': 'mp4',
                'title': "'O Sole Mio",
                'thumbnail': r're:^https?://.*\.jpg$',
                'duration': 216,
                'view_count': int,
            },
            'params': {
                'skip_download': True,
            },
            'skip': 'This video is unavailable.',
        },
        # Pladform embed
        {
            'url': 'http://muz-tv.ru/kinozal/view/7400/',
            'info_dict': {
                'id': '100183293',
                'ext': 'mp4',
                'title': 'Тайны перевала Дятлова • 1 серия 2 часть',
                'description': 'Документальный сериал-расследование одной из самых жутких тайн ХХ века',
                'thumbnail': r're:^https?://.*\.jpg$',
                'duration': 694,
                'age_limit': 0,
            },
            'skip': 'HTTP Error 404: Not Found',
        },
        # Playwire embed
        {
            'url': 'http://www.cinemablend.com/new/First-Joe-Dirt-2-Trailer-Teaser-Stupid-Greatness-70874.html',
            'info_dict': {
                'id': '3519514',
                'ext': 'mp4',
                'title': 'Joe Dirt 2 Beautiful Loser Teaser Trailer',
                'thumbnail': r're:^https?://.*\.png$',
                'duration': 45.115,
            },
        },
        # Crooks and Liars embed
        {
            'url': 'http://crooksandliars.com/2015/04/fox-friends-says-protecting-atheists',
            'info_dict': {
                'id': '8RUoRhRi',
                'ext': 'mp4',
                'title': "Fox & Friends Says Protecting Atheists From Discrimination Is Anti-Christian!",
                'description': 'md5:e1a46ad1650e3a5ec7196d432799127f',
                'timestamp': 1428207000,
                'upload_date': '20150405',
                'uploader': 'Heather',
            },
        },
        # Crooks and Liars external embed
        {
            'url': 'http://theothermccain.com/2010/02/02/video-proves-that-bill-kristol-has-been-watching-glenn-beck/comment-page-1/',
            'info_dict': {
                'id': 'MTE3MjUtMzQ2MzA',
                'ext': 'mp4',
                'title': 'md5:5e3662a81a4014d24c250d76d41a08d5',
                'description': 'md5:9b8e9542d6c3c5de42d6451b7d780cec',
                'timestamp': 1265032391,
                'upload_date': '20100201',
                'uploader': 'Heather',
            },
        },
        # NBC Sports vplayer embed
        {
            'url': 'http://www.riderfans.com/forum/showthread.php?121827-Freeman&s=e98fa1ea6dc08e886b1678d35212494a',
            'info_dict': {
                'id': 'ln7x1qSThw4k',
                'ext': 'flv',
                'title': "PFT Live: New leader in the 'new-look' defense",
                'description': 'md5:65a19b4bbfb3b0c0c5768bed1dfad74e',
                'uploader': 'NBCU-SPORTS',
                'upload_date': '20140107',
                'timestamp': 1389118457,
            },
            'skip': 'Invalid Page URL',
        },
        # NBC News embed
        {
            'url': 'http://www.vulture.com/2016/06/letterman-couldnt-care-less-about-late-night.html',
            'md5': '1aa589c675898ae6d37a17913cf68d66',
            'info_dict': {
                'id': 'x_dtl_oa_LettermanliftPR_160608',
                'ext': 'mp4',
                'title': 'David Letterman: A Preview',
                'description': 'A preview of Tom Brokaw\'s interview with David Letterman as part of the On Assignment series powered by Dateline. Airs Sunday June 12 at 7/6c.',
                'upload_date': '20160609',
                'timestamp': 1465431544,
                'uploader': 'NBCU-NEWS',
            },
        },
        # UDN embed
        {
            'url': 'https://video.udn.com/news/300346',
            'md5': 'fd2060e988c326991037b9aff9df21a6',
            'info_dict': {
                'id': '300346',
                'ext': 'mp4',
                'title': '中一中男師變性 全校師生力挺',
                'thumbnail': r're:^https?://.*\.jpg$',
            },
            'params': {
                # m3u8 download
                'skip_download': True,
            },
            'expected_warnings': ['Failed to parse JSON Expecting value'],
        },
        # Kinja embed
        {
            'url': 'http://www.clickhole.com/video/dont-understand-bitcoin-man-will-mumble-explanatio-2537',
            'info_dict': {
                'id': '106351',
                'ext': 'mp4',
                'title': 'Don’t Understand Bitcoin? This Man Will Mumble An Explanation At You',
                'description': 'Migrated from OnionStudios',
                'thumbnail': r're:^https?://.*\.jpe?g$',
                'uploader': 'clickhole',
                'upload_date': '20150527',
                'timestamp': 1432744860,
            }
        },
        # SnagFilms embed
        {
            'url': 'http://whilewewatch.blogspot.ru/2012/06/whilewewatch-whilewewatch-gripping.html',
            'info_dict': {
                'id': '74849a00-85a9-11e1-9660-123139220831',
                'ext': 'mp4',
                'title': '#whilewewatch',
            }
        },
        # AdobeTVVideo embed
        {
            'url': 'https://helpx.adobe.com/acrobat/how-to/new-experience-acrobat-dc.html?set=acrobat--get-started--essential-beginners',
            'md5': '43662b577c018ad707a63766462b1e87',
            'info_dict': {
                'id': '2456',
                'ext': 'mp4',
                'title': 'New experience with Acrobat DC',
                'description': 'New experience with Acrobat DC',
                'duration': 248.667,
            },
        },
        # Another form of arte.tv embed
        {
            'url': 'http://www.tv-replay.fr/redirection/09-04-16/arte-reportage-arte-11508975.html',
            'md5': '850bfe45417ddf221288c88a0cffe2e2',
            'info_dict': {
                'id': '030273-562_PLUS7-F',
                'ext': 'mp4',
                'title': 'ARTE Reportage - Nulle part, en France',
                'description': 'md5:e3a0e8868ed7303ed509b9e3af2b870d',
                'upload_date': '20160409',
            },
        },
        # Duplicated embedded video URLs
        {
            'url': 'http://www.hudl.com/athlete/2538180/highlights/149298443',
            'info_dict': {
                'id': '149298443_480_16c25b74_2',
                'ext': 'mp4',
                'title': 'vs. Blue Orange Spring Game',
                'uploader': 'www.hudl.com',
            },
        },
        # twitter:player:stream embed
        {
            'url': 'http://www.rtl.be/info/video/589263.aspx?CategoryID=288',
            'info_dict': {
                'id': 'master',
                'ext': 'mp4',
                'title': 'Une nouvelle espèce de dinosaure découverte en Argentine',
                'uploader': 'www.rtl.be',
            },
            'params': {
                # m3u8 downloads
                'skip_download': True,
            },
        },
        # twitter:player embed
        {
            'url': 'http://www.theatlantic.com/video/index/484130/what-do-black-holes-sound-like/',
            'md5': 'a3e0df96369831de324f0778e126653c',
            'info_dict': {
                'id': '4909620399001',
                'ext': 'mp4',
                'title': 'What Do Black Holes Sound Like?',
                'description': 'what do black holes sound like',
                'upload_date': '20160524',
                'uploader_id': '29913724001',
                'timestamp': 1464107587,
                'uploader': 'TheAtlantic',
            },
            'skip': 'Private Youtube video',
        },
        # Facebook <iframe> embed
        {
            'url': 'https://www.hostblogger.de/blog/archives/6181-Auto-jagt-Betonmischer.html',
            'md5': 'fbcde74f534176ecb015849146dd3aee',
            'info_dict': {
                'id': '599637780109885',
                'ext': 'mp4',
                'title': 'Facebook video #599637780109885',
            },
        },
        # Facebook <iframe> embed, plugin video
        {
            'url': 'http://5pillarsuk.com/2017/06/07/tariq-ramadan-disagrees-with-pr-exercise-by-imams-refusing-funeral-prayers-for-london-attackers/',
            'info_dict': {
                'id': '1754168231264132',
                'ext': 'mp4',
                'title': 'About the Imams and Religious leaders refusing to perform funeral prayers for...',
                'uploader': 'Tariq Ramadan (official)',
                'timestamp': 1496758379,
                'upload_date': '20170606',
            },
            'params': {
                'skip_download': True,
            },
        },
        # Facebook API embed
        {
            'url': 'http://www.lothype.com/blue-stars-2016-preview-standstill-full-show/',
            'md5': 'a47372ee61b39a7b90287094d447d94e',
            'info_dict': {
                'id': '10153467542406923',
                'ext': 'mp4',
                'title': 'Facebook video #10153467542406923',
            },
        },
        # WordPress "YouTube Video Importer" plugin
        {
            'url': 'http://www.lothype.com/blue-devils-drumline-stanford-lot-2016/',
            'md5': 'd16797741b560b485194eddda8121b48',
            'info_dict': {
                'id': 'HNTXWDXV9Is',
                'ext': 'mp4',
                'title': 'Blue Devils Drumline Stanford lot 2016',
                'upload_date': '20160627',
                'uploader_id': 'GENOCIDE8GENERAL10',
                'uploader': 'cylus cyrus',
            },
        },
        {
            # video stored on custom kaltura server
            'url': 'http://www.expansion.com/multimedia/videos.html?media=EQcM30NHIPv',
            'md5': '537617d06e64dfed891fa1593c4b30cc',
            'info_dict': {
                'id': '0_1iotm5bh',
                'ext': 'mp4',
                'title': 'Elecciones británicas: 5 lecciones para Rajoy',
                'description': 'md5:435a89d68b9760b92ce67ed227055f16',
                'uploader_id': 'videos.expansion@el-mundo.net',
                'upload_date': '20150429',
                'timestamp': 1430303472,
            },
            'add_ie': ['Kaltura'],
        },
        {
            # multiple kaltura embeds, nsfw
            'url': 'https://www.quartier-rouge.be/prive/femmes/kamila-avec-video-jaime-sadomie.html',
            'info_dict': {
                'id': 'kamila-avec-video-jaime-sadomie',
                'title': "Kamila avec vídeo “J'aime sadomie”",
            },
            'playlist_count': 8,
        },
        {
            # Non-standard Vimeo embed
            'url': 'https://openclassrooms.com/courses/understanding-the-web',
            'md5': '64d86f1c7d369afd9a78b38cbb88d80a',
            'info_dict': {
                'id': '148867247',
                'ext': 'mp4',
                'title': 'Understanding the web - Teaser',
                'description': 'This is "Understanding the web - Teaser" by openclassrooms on Vimeo, the home for high quality videos and the people who love them.',
                'upload_date': '20151214',
                'uploader': 'OpenClassrooms',
                'uploader_id': 'openclassrooms',
            },
            'add_ie': ['Vimeo'],
        },
        {
            # generic vimeo embed that requires original URL passed as Referer
            'url': 'http://racing4everyone.eu/2016/07/30/formula-1-2016-round12-germany/',
            'only_matching': True,
        },
        {
            'url': 'https://support.arkena.com/display/PLAY/Ways+to+embed+your+video',
            'md5': 'b96f2f71b359a8ecd05ce4e1daa72365',
            'info_dict': {
                'id': 'b41dda37-d8e7-4d3f-b1b5-9a9db578bdfe',
                'ext': 'mp4',
                'title': 'Big Buck Bunny',
                'description': 'Royalty free test video',
                'timestamp': 1432816365,
                'upload_date': '20150528',
                'is_live': False,
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': ['Arkena'],
        },
        {
            'url': 'http://nova.bg/news/view/2016/08/16/156543/%D0%BD%D0%B0-%D0%BA%D0%BE%D1%81%D1%8A%D0%BC-%D0%BE%D1%82-%D0%B2%D0%B7%D1%80%D0%B8%D0%B2-%D0%BE%D1%82%D1%86%D0%B5%D0%BF%D0%B8%D1%85%D0%B0-%D1%86%D1%8F%D0%BB-%D0%BA%D0%B2%D0%B0%D1%80%D1%82%D0%B0%D0%BB-%D0%B7%D0%B0%D1%80%D0%B0%D0%B4%D0%B8-%D0%B8%D0%B7%D1%82%D0%B8%D1%87%D0%B0%D0%BD%D0%B5-%D0%BD%D0%B0-%D0%B3%D0%B0%D0%B7-%D0%B2-%D0%BF%D0%BB%D0%BE%D0%B2%D0%B4%D0%B8%D0%B2/',
            'info_dict': {
                'id': '1c7141f46c',
                'ext': 'mp4',
                'title': 'НА КОСЪМ ОТ ВЗРИВ: Изтичане на газ на бензиностанция в Пловдив',
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': ['Vbox7'],
        },
        {
            # DBTV embeds
            'url': 'http://www.dagbladet.no/2016/02/23/nyheter/nordlys/ski/troms/ver/43254897/',
            'info_dict': {
                'id': '43254897',
                'title': 'Etter ett års planlegging, klaffet endelig alt: - Jeg måtte ta en liten dans',
            },
            'playlist_mincount': 3,
        },
        {
            # Videa embeds
            'url': 'http://forum.dvdtalk.com/movie-talk/623756-deleted-magic-star-wars-ot-deleted-alt-scenes-docu-style.html',
            'info_dict': {
                'id': '623756-deleted-magic-star-wars-ot-deleted-alt-scenes-docu-style',
                'title': 'Deleted Magic - Star Wars: OT Deleted / Alt. Scenes Docu. Style - DVD Talk Forum',
            },
            'playlist_mincount': 2,
        },
        {
            # 20 minuten embed
            'url': 'http://www.20min.ch/schweiz/news/story/So-kommen-Sie-bei-Eis-und-Schnee-sicher-an-27032552',
            'info_dict': {
                'id': '523629',
                'ext': 'mp4',
                'title': 'So kommen Sie bei Eis und Schnee sicher an',
                'description': 'md5:117c212f64b25e3d95747e5276863f7d',
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': ['TwentyMinuten'],
        },
        {
            # VideoPress embed
            'url': 'https://en.support.wordpress.com/videopress/',
            'info_dict': {
                'id': 'OcobLTqC',
                'ext': 'm4v',
                'title': 'IMG_5786',
                'timestamp': 1435711927,
                'upload_date': '20150701',
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': ['VideoPress'],
        },
        {
            # Rutube embed
            'url': 'http://magazzino.friday.ru/videos/vipuski/kazan-2',
            'info_dict': {
                'id': '9b3d5bee0a8740bf70dfd29d3ea43541',
                'ext': 'flv',
                'title': 'Магаззино: Казань 2',
                'description': 'md5:99bccdfac2269f0e8fdbc4bbc9db184a',
                'uploader': 'Магаззино',
                'upload_date': '20170228',
                'uploader_id': '996642',
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': ['Rutube'],
        },
        {
            # glomex:embed
            'url': 'https://www.skai.gr/news/world/iatrikos-syllogos-tourkias-to-turkovac-aplo-dialyma-erntogan-eiste-apateones-kai-pseytes',
            'info_dict': {
                'id': 'v-ch2nkhcirwc9-sf',
                'ext': 'mp4',
                'title': 'md5:786e1e24e06c55993cee965ef853a0c1',
                'description': 'md5:8b517a61d577efe7e36fde72fd535995',
                'timestamp': 1641885019,
                'upload_date': '20220111',
                'duration': 460000,
                'thumbnail': 'https://i3thumbs.glomex.com/dC1idjJwdndiMjRzeGwvMjAyMi8wMS8xMS8wNy8xMF8zNV82MWRkMmQ2YmU5ZTgyLmpwZw==/profile:player-960x540',
            },
        },
        {
            # megatvcom:embed
            'url': 'https://www.in.gr/2021/12/18/greece/apokalypsi-mega-poios-parelave-tin-ereyna-tsiodra-ek-merous-tis-kyvernisis-o-prothypourgos-telika-gnorize/',
            'info_dict': {
                'id': 'apokalypsi-mega-poios-parelave-tin-ereyna-tsiodra-ek-merous-tis-kyvernisis-o-prothypourgos-telika-gnorize',
                'title': 'md5:5e569cf996ec111057c2764ec272848f',
            },
            'playlist': [{
                'md5': '1afa26064ff00ccb91617957dbc73dc1',
                'info_dict': {
                    'ext': 'mp4',
                    'id': '564916',
                    'display_id': 'md5:6cdf22d3a2e7bacb274b7295089a1770',
                    'title': 'md5:33b9dd39584685b62873043670eb52a6',
                    'description': 'md5:c1db7310f390518ac36dd69d947ef1a1',
                    'timestamp': 1639753145,
                    'upload_date': '20211217',
                    'thumbnail': 'https://www.megatv.com/wp-content/uploads/2021/12/prezerakos-1024x597.jpg',
                },
            }, {
                'md5': '4a1c220695f1ef865a8b7966a53e2474',
                'info_dict': {
                    'ext': 'mp4',
                    'id': '564905',
                    'display_id': 'md5:ead15695e485e649aed2b81ebd699b88',
                    'title': 'md5:2b71fd54249a3ca34609fe39ae31c47b',
                    'description': 'md5:c42e12f638d0a97d6de4508e2c4df982',
                    'timestamp': 1639753047,
                    'upload_date': '20211217',
                    'thumbnail': 'https://www.megatv.com/wp-content/uploads/2021/12/tsiodras-mitsotakis-1024x545.jpg',
                },
            }]
        },
        {
            'url': 'https://www.ertnews.gr/video/manolis-goyalles-o-anthropos-piso-apo-ti-diadiktyaki-vasilopita/',
            'info_dict': {
                'id': '2022/tv/news-themata-ianouarios/20220114-apotis6-gouales-pita.mp4',
                'ext': 'mp4',
                'title': 'md5:df64f5b61c06d0e9556c0cdd5cf14464',
                'thumbnail': 'https://www.ert.gr/themata/photos/2021/20220114-apotis6-gouales-pita.jpg',
            },
        },
        {
            # ThePlatform embed with whitespace in URLs
            'url': 'http://www.golfchannel.com/topics/shows/golftalkcentral.htm',
            'only_matching': True,
        },
        {
            # Senate ISVP iframe https
            'url': 'https://www.hsgac.senate.gov/hearings/canadas-fast-track-refugee-plan-unanswered-questions-and-implications-for-us-national-security',
            'md5': 'fb8c70b0b515e5037981a2492099aab8',
            'info_dict': {
                'id': 'govtaff020316',
                'ext': 'mp4',
                'title': 'Integrated Senate Video Player',
            },
            'add_ie': ['SenateISVP'],
        },
        {
            # Limelight embeds (1 channel embed + 4 media embeds)
            'url': 'http://www.sedona.com/FacilitatorTraining2017',
            'info_dict': {
                'id': 'FacilitatorTraining2017',
                'title': 'Facilitator Training 2017',
            },
            'playlist_mincount': 5,
        },
        {
            # Limelight embed (LimelightPlayerUtil.embed)
            'url': 'https://tv5.ca/videos?v=xuu8qowr291ri',
            'info_dict': {
                'id': '95d035dc5c8a401588e9c0e6bd1e9c92',
                'ext': 'mp4',
                'title': '07448641',
                'timestamp': 1499890639,
                'upload_date': '20170712',
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': ['LimelightMedia'],
        },
        {
            'url': 'http://kron4.com/2017/04/28/standoff-with-walnut-creek-murder-suspect-ends-with-arrest/',
            'info_dict': {
                'id': 'standoff-with-walnut-creek-murder-suspect-ends-with-arrest',
                'title': 'Standoff with Walnut Creek murder suspect ends',
                'description': 'md5:3ccc48a60fc9441eeccfc9c469ebf788',
            },
            'playlist_mincount': 4,
        },
        {
            # WashingtonPost embed
            'url': 'http://www.vanityfair.com/hollywood/2017/04/donald-trump-tv-pitches',
            'info_dict': {
                'id': '8caf6e88-d0ec-11e5-90d3-34c2c42653ac',
                'ext': 'mp4',
                'title': "No one has seen the drama series based on Trump's life \u2014 until now",
                'description': 'Donald Trump wanted a weekly TV drama based on his life. It never aired. But The Washington Post recently obtained a scene from the pilot script — and enlisted actors.',
                'timestamp': 1455216756,
                'uploader': 'The Washington Post',
                'upload_date': '20160211',
            },
            'add_ie': ['WashingtonPost'],
        },
        {
            # JOJ.sk embeds
            'url': 'https://www.noviny.sk/slovensko/238543-slovenskom-sa-prehnala-vlna-silnych-burok',
            'info_dict': {
                'id': '238543-slovenskom-sa-prehnala-vlna-silnych-burok',
                'title': 'Slovenskom sa prehnala vlna silných búrok',
            },
            'playlist_mincount': 5,
            'add_ie': ['Joj'],
        },
        {
            # AMP embed (see https://www.ampproject.org/docs/reference/components/amp-video)
            'url': 'https://tvrain.ru/amp/418921/',
            'md5': 'cc00413936695987e8de148b67d14f1d',
            'info_dict': {
                'id': '418921',
                'ext': 'mp4',
                'title': 'Стас Намин: «Мы нарушили девственность Кремля»',
            },
        },
        {
            # multiple HTML5 videos on one page
            'url': 'https://www.paragon-software.com/home/rk-free/keyscenarios.html',
            'info_dict': {
                'id': 'keyscenarios',
                'title': 'Rescue Kit 14 Free Edition - Getting started',
            },
            'playlist_count': 4,
        },
        {
            # vshare embed
            'url': 'https://youtube-dl-demo.neocities.org/vshare.html',
            'md5': '17b39f55b5497ae8b59f5fbce8e35886',
            'info_dict': {
                'id': '0f64ce6',
                'title': 'vl14062007715967',
                'ext': 'mp4',
            }
        },
        {
            'url': 'http://www.heidelberg-laureate-forum.org/blog/video/lecture-friday-september-23-2016-sir-c-antony-r-hoare/',
            'md5': 'aecd089f55b1cb5a59032cb049d3a356',
            'info_dict': {
                'id': '90227f51a80c4d8f86c345a7fa62bd9a1d',
                'ext': 'mp4',
                'title': 'Lecture: Friday, September 23, 2016 - Sir Tony Hoare',
                'description': 'md5:5a51db84a62def7b7054df2ade403c6c',
                'timestamp': 1474354800,
                'upload_date': '20160920',
            }
        },
        {
            'url': 'http://www.kidzworld.com/article/30935-trolls-the-beat-goes-on-interview-skylar-astin-and-amanda-leighton',
            'info_dict': {
                'id': '1731611',
                'ext': 'mp4',
                'title': 'Official Trailer | TROLLS: THE BEAT GOES ON!',
                'description': 'md5:eb5f23826a027ba95277d105f248b825',
                'timestamp': 1516100691,
                'upload_date': '20180116',
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': ['SpringboardPlatform'],
        },
        {
            'url': 'https://www.yapfiles.ru/show/1872528/690b05d3054d2dbe1e69523aa21bb3b1.mp4.html',
            'info_dict': {
                'id': 'vMDE4NzI1Mjgt690b',
                'ext': 'mp4',
                'title': 'Котята',
            },
            'add_ie': ['YapFiles'],
            'params': {
                'skip_download': True,
            },
        },
        {
            # CloudflareStream embed
            'url': 'https://www.cloudflare.com/products/cloudflare-stream/',
            'info_dict': {
                'id': '31c9291ab41fac05471db4e73aa11717',
                'ext': 'mp4',
                'title': '31c9291ab41fac05471db4e73aa11717',
            },
            'add_ie': ['CloudflareStream'],
            'params': {
                'skip_download': True,
            },
        },
        {
            # PeerTube embed
            'url': 'https://joinpeertube.org/fr/home/',
            'info_dict': {
                'id': 'home',
                'title': 'Reprenez le contrôle de vos vidéos ! #JoinPeertube',
            },
            'playlist_count': 2,
        },
        {
            # Indavideo embed
            'url': 'https://streetkitchen.hu/receptek/igy_kell_otthon_hamburgert_sutni/',
            'info_dict': {
                'id': '1693903',
                'ext': 'mp4',
                'title': 'Így kell otthon hamburgert sütni',
                'description': 'md5:f5a730ecf900a5c852e1e00540bbb0f7',
                'timestamp': 1426330212,
                'upload_date': '20150314',
                'uploader': 'StreetKitchen',
                'uploader_id': '546363',
            },
            'add_ie': ['IndavideoEmbed'],
            'params': {
                'skip_download': True,
            },
        },
        {
            # APA embed via JWPlatform embed
            'url': 'http://www.vol.at/blue-man-group/5593454',
            'info_dict': {
                'id': 'jjv85FdZ',
                'ext': 'mp4',
                'title': '"Blau ist mysteriös": Die Blue Man Group im Interview',
                'description': 'md5:d41d8cd98f00b204e9800998ecf8427e',
                'thumbnail': r're:^https?://.*\.jpg$',
                'duration': 254,
                'timestamp': 1519211149,
                'upload_date': '20180221',
            },
            'params': {
                'skip_download': True,
            },
        },
        {
            'url': 'http://share-videos.se/auto/video/83645793?uid=13',
            'md5': 'b68d276de422ab07ee1d49388103f457',
            'info_dict': {
                'id': '83645793',
                'title': 'Lock up and get excited',
                'ext': 'mp4'
            },
            'skip': 'TODO: fix nested playlists processing in tests',
        },
        {
            # Viqeo embeds
            'url': 'https://viqeo.tv/',
            'info_dict': {
                'id': 'viqeo',
                'title': 'All-new video platform',
            },
            'playlist_count': 6,
        },
        # {
        #     # Zype embed
        #     'url': 'https://www.cookscountry.com/episode/554-smoky-barbecue-favorites',
        #     'info_dict': {
        #         'id': '5b400b834b32992a310622b9',
        #         'ext': 'mp4',
        #         'title': 'Smoky Barbecue Favorites',
        #         'thumbnail': r're:^https?://.*\.jpe?g',
        #         'description': 'md5:5ff01e76316bd8d46508af26dc86023b',
        #         'upload_date': '20170909',
        #         'timestamp': 1504915200,
        #     },
        #     'add_ie': [ZypeIE.ie_key()],
        #     'params': {
        #         'skip_download': True,
        #     },
        # },
        {
            # videojs embed
            'url': 'https://video.sibnet.ru/shell.php?videoid=3422904',
            'info_dict': {
                'id': 'shell',
                'ext': 'mp4',
                'title': 'Доставщик пиццы спросил разрешения сыграть на фортепиано',
                'description': 'md5:89209cdc587dab1e4a090453dbaa2cb1',
                'thumbnail': r're:^https?://.*\.jpg$',
            },
            'params': {
                'skip_download': True,
            },
            'expected_warnings': ['Failed to download MPD manifest'],
        },
        {
            # DailyMotion embed with DM.player
            'url': 'https://www.beinsports.com/us/copa-del-rey/video/the-locker-room-valencia-beat-barca-in-copa/1203804',
            'info_dict': {
                'id': 'k6aKkGHd9FJs4mtJN39',
                'ext': 'mp4',
                'title': 'The Locker Room: Valencia Beat Barca In Copa del Rey Final',
                'description': 'This video is private.',
                'uploader_id': 'x1jf30l',
                'uploader': 'beIN SPORTS USA',
                'upload_date': '20190528',
                'timestamp': 1559062971,
            },
            'params': {
                'skip_download': True,
            },
        },
        {
            # tvopengr:embed
            'url': 'https://www.ethnos.gr/World/article/190604/hparosiaxekinoynoisynomiliessthgeneyhmethskiatoypolemoypanoapothnoykrania',
            'md5': 'eb0c3995d0a6f18f6538c8e057865d7d',
            'info_dict': {
                'id': '101119',
                'ext': 'mp4',
                'display_id': 'oikarpoitondiapragmateyseonhparosias',
                'title': 'md5:b979f4d640c568617d6547035528a149',
                'description': 'md5:e54fc1977c7159b01cc11cd7d9d85550',
                'timestamp': 1641772800,
                'upload_date': '20220110',
                'thumbnail': 'https://opentv-static.siliconweb.com/imgHandler/1920/70bc39fa-895b-4918-a364-c39d2135fc6d.jpg',

            }
        },
        {
            # blogger embed
            'url': 'https://blog.tomeuvizoso.net/2019/01/a-panfrost-milestone.html',
            'md5': 'f1bc19b6ea1b0fd1d81e84ca9ec467ac',
            'info_dict': {
                'id': 'BLOGGER-video-3c740e3a49197e16-796',
                'ext': 'mp4',
                'title': 'Blogger',
                'thumbnail': r're:^https?://.*',
            },
        },
        # {
        #     # TODO: find another test
        #     # http://schema.org/VideoObject
        #     'url': 'https://flipagram.com/f/nyvTSJMKId',
        #     'md5': '888dcf08b7ea671381f00fab74692755',
        #     'info_dict': {
        #         'id': 'nyvTSJMKId',
        #         'ext': 'mp4',
        #         'title': 'Flipagram by sjuria101 featuring Midnight Memories by One Direction',
        #         'description': '#love for cats.',
        #         'timestamp': 1461244995,
        #         'upload_date': '20160421',
        #     },
        #     'params': {
        #         'force_generic_extractor': True,
        #     },
        # },
        {
            # VHX Embed
            'url': 'https://demo.vhx.tv/category-c/videos/file-example-mp4-480-1-5mg-copy',
            'info_dict': {
                'id': '858208',
                'ext': 'mp4',
                'title': 'Untitled',
                'uploader_id': 'user80538407',
                'uploader': 'OTT Videos',
            },
        },
        {
            # ArcPublishing PoWa video player
            'url': 'https://www.adn.com/politics/2020/11/02/video-senate-candidates-campaign-in-anchorage-on-eve-of-election-day/',
            'md5': 'b03b2fac8680e1e5a7cc81a5c27e71b3',
            'info_dict': {
                'id': '8c99cb6e-b29c-4bc9-9173-7bf9979225ab',
                'ext': 'mp4',
                'title': 'Senate candidates wave to voters on Anchorage streets',
                'description': 'md5:91f51a6511f090617353dc720318b20e',
                'timestamp': 1604378735,
                'upload_date': '20201103',
                'duration': 1581,
            },
        },
        {
            # MyChannels SDK embed
            # https://www.24kitchen.nl/populair/deskundige-dit-waarom-sommigen-gevoelig-zijn-voor-voedselallergieen
            'url': 'https://www.demorgen.be/nieuws/burgemeester-rotterdam-richt-zich-in-videoboodschap-tot-relschoppers-voelt-het-goed~b0bcfd741/',
            'md5': '90c0699c37006ef18e198c032d81739c',
            'info_dict': {
                'id': '194165',
                'ext': 'mp4',
                'title': 'Burgemeester Aboutaleb spreekt relschoppers toe',
                'timestamp': 1611740340,
                'upload_date': '20210127',
                'duration': 159,
            },
        },
        {
            # Simplecast player embed
            'url': 'https://www.bio.org/podcast',
            'info_dict': {
                'id': 'podcast',
                'title': 'I AM BIO Podcast | BIO',
            },
            'playlist_mincount': 52,
        }, {
            # WimTv embed player
            'url': 'http://www.msmotor.tv/wearefmi-pt-2-2021/',
            'info_dict': {
                'id': 'wearefmi-pt-2-2021',
                'title': '#WEAREFMI – PT.2 – 2021 – MsMotorTV',
            },
            'playlist_count': 1,
        }, {
            # KVS Player
            'url': 'https://www.kvs-demo.com/videos/105/kelis-4th-of-july/',
            'info_dict': {
                'id': '105',
                'display_id': 'kelis-4th-of-july',
                'ext': 'mp4',
                'title': 'Kelis - 4th Of July',
                'description': 'Kelis - 4th Of July',
                'thumbnail': r're:https://(?:www\.)?kvs-demo.com/contents/videos_screenshots/0/105/preview.jpg',
            },
            'params': {
                'skip_download': True,
            },
            'expected_warnings': ['Untested major version'],
        }, {
            # KVS Player
            'url': 'https://www.kvs-demo.com/embed/105/',
            'info_dict': {
                'id': '105',
                'display_id': 'kelis-4th-of-july',
                'ext': 'mp4',
                'title': 'Kelis - 4th Of July / Embed Player',
                'thumbnail': r're:https://(?:www\.)?kvs-demo.com/contents/videos_screenshots/0/105/preview.jpg',
            },
            'params': {
                'skip_download': True,
            },
        }, {
            'url': 'https://youix.com/video/leningrad-zoj/',
            'md5': '94f96ba95706dc3880812b27b7d8a2b8',
            'info_dict': {
                'id': '18485',
                'display_id': 'leningrad-zoj',
                'ext': 'mp4',
                'title': 'Клип: Ленинград - ЗОЖ скачать, смотреть онлайн | Youix.com',
                'thumbnail': r're:https://youix.com/contents/videos_screenshots/18000/18485/preview(?:_480x320_youix_com.mp4)?\.jpg',
            },
        }, {
            # KVS Player
            'url': 'https://youix.com/embed/18485',
            'md5': '94f96ba95706dc3880812b27b7d8a2b8',
            'info_dict': {
                'id': '18485',
                'display_id': 'leningrad-zoj',
                'ext': 'mp4',
                'title': 'Ленинград - ЗОЖ',
                'thumbnail': r're:https://youix.com/contents/videos_screenshots/18000/18485/preview(?:_480x320_youix_com.mp4)?\.jpg',
            },
        }, {
            # KVS Player
            'url': 'https://bogmedia.org/videos/21217/40-nochey-40-nights-2016/',
            'md5': '94166bdb26b4cb1fb9214319a629fc51',
            'info_dict': {
                'id': '21217',
                'display_id': '40-nochey-2016',
                'ext': 'mp4',
                'title': '40 ночей (2016) - BogMedia.org',
                'description': 'md5:4e6d7d622636eb7948275432eb256dc3',
                'thumbnail': 'https://bogmedia.org/contents/videos_screenshots/21000/21217/preview_480p.mp4.jpg',
            },
        },
        {
            # KVS Player (for sites that serve kt_player.js via non-https urls)
            'url': 'http://www.camhub.world/embed/389508',
            'md5': 'fbe89af4cfb59c8fd9f34a202bb03e32',
            'info_dict': {
                'id': '389508',
                'display_id': 'syren-de-mer-onlyfans-05-07-2020have-a-happy-safe-holiday5f014e68a220979bdb8cd-source',
                'ext': 'mp4',
                'title': 'Syren De Mer onlyfans_05-07-2020Have_a_happy_safe_holiday5f014e68a220979bdb8cd_source / Embed плеер',
                'thumbnail': r're:https?://www\.camhub\.world/contents/videos_screenshots/389000/389508/preview\.mp4\.jpg',
            },
        },
        {
            # Reddit-hosted video that will redirect and be processed by RedditIE
            # Redirects to https://www.reddit.com/r/videos/comments/6rrwyj/that_small_heart_attack/
            'url': 'https://v.redd.it/zv89llsvexdz',
            'md5': '87f5f02f6c1582654146f830f21f8662',
            'info_dict': {
                'id': 'zv89llsvexdz',
                'ext': 'mp4',
                'timestamp': 1501941939.0,
                'title': 'That small heart attack.',
                'upload_date': '20170805',
                'uploader': 'Antw87'
            }
        },
        {
            # 1080p Reddit-hosted video that will redirect and be processed by RedditIE
            'url': 'https://v.redd.it/33hgok7dfbz71/',
            'md5': '7a1d587940242c9bb3bd6eb320b39258',
            'info_dict': {
                'id': '33hgok7dfbz71',
                'ext': 'mp4',
                'title': "The game Didn't want me to Knife that Guy I guess",
                'uploader': 'paraf1ve',
                'timestamp': 1636788683.0,
                'upload_date': '20211113'
            }
        },
        {
            # MainStreaming player
            'url': 'https://www.lactv.it/2021/10/03/lac-news24-la-settimana-03-10-2021/',
            'info_dict': {
                'id': 'EUlZfGWkGpOd',
                'title': 'La Settimana ',
                'description': '03 Ottobre ore 02:00',
                'ext': 'mp4',
                'live_status': 'not_live',
                'thumbnail': r're:https?://[A-Za-z0-9-]*\.msvdn.net/image/\w+/poster',
                'duration': 1512
            }
        },
        {
            # Multiple gfycat iframe embeds
            'url': 'https://www.gezip.net/bbs/board.php?bo_table=entertaine&wr_id=613422',
            'info_dict': {
                'title': '재이, 윤, 세은 황금 드레스를 입고 빛난다',
                'id': 'board'
            },
            'playlist_count': 8,
        },
        {
            # Multiple gfycat gifs (direct links)
            'url': 'https://www.gezip.net/bbs/board.php?bo_table=entertaine&wr_id=612199',
            'info_dict': {
                'title': '옳게 된 크롭 니트 스테이씨 아이사',
                'id': 'board'
            },
            'playlist_count': 6
        },
        {
            # Multiple gfycat embeds, with uppercase "IFR" in urls
            'url': 'https://kkzz.kr/?vid=2295',
            'info_dict': {
                'title': '지방시 앰버서더 에스파 카리나 움짤',
                'id': '?vid=2295'
            },
            'playlist_count': 9
        },
        {
            # Panopto embeds
            'url': 'https://www.monash.edu/learning-teaching/teachhq/learning-technologies/panopto/how-to/insert-a-quiz-into-a-panopto-video',
            'info_dict': {
                'ext': 'mp4',
                'id': '0bd3f16c-824a-436a-8486-ac5900693aef',
                'title': 'Quizzes in Panopto',
            },
        },
        {
            # Ruutu embed
            'url': 'https://www.nelonen.fi/ohjelmat/madventures-suomi/2160731-riku-ja-tunna-lahtevat-peurajahtiin-tv-sta-tutun-biologin-kanssa---metsastysreissu-huipentuu-kasvissyojan-painajaiseen',
            'md5': 'a2513a98d3496099e6eced40f7e6a14b',
            'info_dict': {
                'id': '4044426',
                'ext': 'mp4',
                'title': 'Riku ja Tunna lähtevät peurajahtiin tv:stä tutun biologin kanssa – metsästysreissu huipentuu kasvissyöjän painajaiseen!',
                'thumbnail': r're:^https?://.+\.jpg$',
                'duration': 108,
                'series': 'Madventures Suomi',
                'description': 'md5:aa55b44bd06a1e337a6f1d0b46507381',
                'categories': ['Matkailu', 'Elämäntyyli'],
                'age_limit': 0,
                'upload_date': '20220308',
            },
        },
        {
            # Multiple Ruutu embeds
            'url': 'https://www.hs.fi/kotimaa/art-2000008762560.html',
            'info_dict': {
                'title': 'Koronavirus | Epidemiahuippu voi olla Suomessa ohi, mutta koronaviruksen poistamista yleisvaarallisten tautien joukosta harkitaan vasta syksyllä',
                'id': 'art-2000008762560'
            },
            'playlist_count': 3
        },
        {
            # Ruutu embed in hs.fi with a single video
            'url': 'https://www.hs.fi/kotimaa/art-2000008793421.html',
            'md5': 'f8964e65d8fada6e8a562389bf366bb4',
            'info_dict': {
                'id': '4081841',
                'ext': 'mp4',
                'title': 'Puolustusvoimat siirsi panssariajoneuvoja harjoituksiin Niinisaloon 2.5.2022',
                'thumbnail': r're:^https?://.+\.jpg$',
                'duration': 138,
                'age_limit': 0,
                'upload_date': '20220504',
            },
        },
        {
            # Webpage contains double BOM
            'url': 'https://www.filmarkivet.se/movies/paris-d-moll/',
            'md5': 'df02cadc719dcc63d43288366f037754',
            'info_dict': {
                'id': 'paris-d-moll',
                'ext': 'mp4',
                'upload_date': '20220518',
                'title': 'Paris d-moll',
                'description': 'md5:319e37ea5542293db37e1e13072fe330',
                'thumbnail': 'https://www.filmarkivet.se/wp-content/uploads/parisdmoll2.jpg',
                'timestamp': 1652833414,
                'age_limit': 0,
            }
        },
        {
            'url': 'https://www.mollymovieclub.com/p/interstellar?s=r#details',
            'md5': '198bde8bed23d0b23c70725c83c9b6d9',
            'info_dict': {
                'id': '53602801',
                'ext': 'mpga',
                'title': 'Interstellar',
                'description': 'Listen now | Episode One',
                'thumbnail': 'md5:c30d9c83f738e16d8551d7219d321538',
                'uploader': 'Molly Movie Club',
                'uploader_id': '839621',
            },
        },
        {
            'url': 'https://www.blockedandreported.org/p/episode-117-lets-talk-about-depp?s=r',
            'md5': 'c0cc44ee7415daeed13c26e5b56d6aa0',
            'info_dict': {
                'id': '57962052',
                'ext': 'mpga',
                'title': 'md5:855b2756f0ee10f6723fa00b16266f8d',
                'description': 'md5:fe512a5e94136ad260c80bde00ea4eef',
                'thumbnail': 'md5:2218f27dfe517bb5ac16c47d0aebac59',
                'uploader': 'Blocked and Reported',
                'uploader_id': '500230',
            },
        },
        {
            'url': 'https://www.skimag.com/video/ski-people-1980/',
            'md5': '022a7e31c70620ebec18deeab376ee03',
            'info_dict': {
                'id': 'YTmgRiNU',
                'ext': 'mp4',
                'title': '1980 Ski People',
                'timestamp': 1610407738,
                'description': 'md5:cf9c3d101452c91e141f292b19fe4843',
                'thumbnail': 'https://cdn.jwplayer.com/v2/media/YTmgRiNU/poster.jpg?width=720',
                'duration': 5688.0,
                'upload_date': '20210111',
            }
        },
        {
            'note': 'JSON LD with multiple @type',
            'url': 'https://www.nu.nl/280161/video/hoe-een-bladvlo-dit-verwoestende-japanse-onkruid-moet-vernietigen.html',
            'md5': 'c7949f34f57273013fb7ccb1156393db',
            'info_dict': {
                'id': 'ipy2AcGL',
                'ext': 'mp4',
                'description': 'md5:6a9d644bab0dc2dc06849c2505d8383d',
                'thumbnail': r're:https://media\.nu\.nl/m/.+\.jpg',
                'title': 'Hoe een bladvlo dit verwoestende Japanse onkruid moet vernietigen',
                'timestamp': 1586577474,
                'upload_date': '20200411',
                'age_limit': 0,
                'duration': 111.0,
            }
        },
        {
            'note': 'JSON LD with unexpected data type',
            'url': 'https://www.autoweek.nl/autotests/artikel/porsche-911-gt3-rs-rij-impressie-2/',
            'info_dict': {
                'id': 'porsche-911-gt3-rs-rij-impressie-2',
                'ext': 'mp4',
                'title': 'Test: Porsche 911 GT3 RS',
                'description': 'Je ziet het niet, maar het is er wel. Downforce, hebben we het dan over. En in de nieuwe Porsche 911 GT3 RS is er zelfs heel veel downforce.',
                'timestamp': 1664920902,
                'upload_date': '20221004',
                'thumbnail': r're:^https://media.autoweek.nl/m/.+\.jpg$',
                'age_limit': 0,
                'direct': True,
            }
        },
        {
            'note': 'server returns data in brotli compression by default if `accept-encoding: *` is specified.',
            'url': 'https://www.extra.cz/cauky-lidi-70-dil-babis-predstavil-pohadky-prymulanek-nebo-andrejovy-nove-saty-ac867',
            'info_dict': {
                'id': 'cauky-lidi-70-dil-babis-predstavil-pohadky-prymulanek-nebo-andrejovy-nove-saty-ac867',
                'ext': 'mp4',
                'title': 'čauky lidi 70 finall',
                'description': 'čauky lidi 70 finall',
                'thumbnail': 'h',
                'upload_date': '20220606',
                'timestamp': 1654513791,
                'duration': 318.0,
                'direct': True,
                'age_limit': 0,
            },
        },
        {
            'url': 'https://shooshtime.com/videos/284002/just-out-of-the-shower-joi/',
            'md5': 'e2f0a4c329f7986280b7328e24036d60',
            'info_dict': {
                'id': '284002',
                'display_id': 'just-out-of-the-shower-joi',
                'ext': 'mp4',
                'title': 'Just Out Of The Shower JOI - Shooshtime',
                'thumbnail': 'https://i.shoosh.co/contents/videos_screenshots/284000/284002/preview.mp4.jpg',
                'height': 720,
                'age_limit': 18,
            },
        },
        {
            'note': 'Live HLS direct link',
            'url': 'https://d18j67ugtrocuq.cloudfront.net/out/v1/2767aec339144787926bd0322f72c6e9/index.m3u8',
            'info_dict': {
                'id': 'index',
                'title': r're:index',
                'ext': 'mp4',
                'live_status': 'is_live',
            },
            'params': {
                'skip_download': 'm3u8',
            },
        },
        {
            'note': 'Video.js VOD HLS',
            'url': 'https://gist.githubusercontent.com/bashonly/2aae0862c50f4a4b84f220c315767208/raw/e3380d413749dabbe804c9c2d8fd9a45142475c7/videojs_hls_test.html',
            'info_dict': {
                'id': 'videojs_hls_test',
                'title': 'video',
                'ext': 'mp4',
                'age_limit': 0,
                'duration': 1800,
            },
            'params': {
                'skip_download': 'm3u8',
            },
        },
    ]

    def report_following_redirect(self, new_url):
        """Print a '[redirect]' notice naming the URL that is being followed.

        @param new_url  The redirect target to mention in the message
        """
        message = '[redirect] Following redirect to %s' % new_url
        self._downloader.to_screen(message)

    def report_detected(self, name, num=1, note=None):
        """Write a debug message announcing what was identified.

        @param name  Singular description of the detected thing; an 's' is
                     appended when more than one was found
        @param num   Number of detections. A falsy count (e.g. 0) is not
                     reported at all; a count that is not greater than 1 is
                     reported with the article 'a'
        @param note  Optional extra detail, rendered through format_field
                     with the '; %s' template
        """
        if num > 1:
            quantity, label = num, name + 's'
        elif num:
            quantity, label = 'a', name
        else:
            # Nothing was detected, so there is nothing to report
            return

        suffix = format_field(note, None, "; %s")
        self._downloader.write_debug(f'Identified {quantity} {label}{suffix}')

    def _extra_manifest_info(self, info, manifest_url):
        """Apply manifest-related extractor arguments to `info` (in place).

        Reads the 'fragment_query', 'hls_key', 'variant_query' and 'is_live'
        extractor arguments:
          - 'fragment_query' sets info['extra_param_to_segment_url']
          - 'hls_key' populates info['hls_aes'] (None when nothing valid is given)
          - 'variant_query' is merged into the URL of every format
          - if an 'm3u8_native' format exists, info['live_status'] is either
            forced by 'is_live' or derived from the media playlist duration

        @param info          Info dict to update; modified in place
        @param manifest_url  URL of the manifest; its query string is the
                             fallback when a *_query argument is given empty
        """
        def query_of(value):
            return urllib.parse.urlparse(value).query

        def hex_or_none(value):
            # Only hexadecimal strings (optionally "0x"-prefixed) are accepted
            if re.fullmatch(r'(0x)?[\da-f]+', value, re.IGNORECASE):
                return value
            return None

        fragment_query = self._configuration_arg('fragment_query', [None], casesense=True)[0]
        if fragment_query is not None:
            # The argument may be a full URL, a bare query string, or empty
            # (in which case the manifest's own query is reused)
            info['extra_param_to_segment_url'] = (
                query_of(fragment_query) or fragment_query
                or query_of(manifest_url) or None)

        hls_key_args = self._configuration_arg('hls_key', casesense=True)
        # The first value is tried both as a key URI and as a hex key;
        # the second value, if any, is the IV
        info['hls_aes'] = traverse_obj(hls_key_args, {
            'uri': (0, {url_or_none}),
            'key': (0, {hex_or_none}),
            'iv': (1, {hex_or_none}),
        }) or None

        variant_query = self._configuration_arg('variant_query', [None], casesense=True)[0]
        if variant_query is not None:
            extra_params = urllib.parse.parse_qs(
                query_of(variant_query) or variant_query or query_of(manifest_url))
            for fmt in self._downloader._get_formats(info):
                fmt['url'] = update_url_query(fmt['url'], extra_params)

        # Attempt to detect live HLS or set VOD duration
        m3u8_format = None
        for candidate in self._downloader._get_formats(info):
            if determine_protocol(candidate) == 'm3u8_native':
                m3u8_format = candidate
                break
        if not m3u8_format:
            return

        is_live = self._configuration_arg('is_live', [None])[0]
        if is_live is not None:
            # An explicit user choice wins; no playlist download is needed
            info['live_status'] = 'not_live' if is_live == 'false' else 'is_live'
            return

        headers = m3u8_format.get('http_headers') or info.get('http_headers')
        duration = self._extract_m3u8_vod_duration(
            m3u8_format['url'], info.get('id'), note='Checking m3u8 live status',
            errnote='Failed to download m3u8 media playlist', headers=headers)
        if not duration:
            info['live_status'] = 'is_live'
        info['duration'] = info.get('duration') or duration

    def _extract_rss(self, url, video_id, doc):
        """Turn a parsed RSS document into a playlist of url_transparent entries.

        Each './channel/item' becomes one entry pointing at the 'url'
        attribute of its first <enclosure>, or at its <link> text when the
        item has no <enclosure> at all. Items without a usable URL are
        skipped. An item's <guid>, when present, is smuggled into the entry
        URL as 'force_videoid'.

        @param url       URL of the feed; used as the playlist id
        @param video_id  Unused here
        @param doc       Parsed XML element exposing find()/findall()
        @returns         A '_type': 'playlist' dict
        """
        NS_MAP = {
            'itunes': 'http://www.itunes.com/dtds/podcast-1.0.dtd',
        }
        AGE_LIMITS = {'true': 18, 'yes': 18, 'false': 0, 'no': 0}

        def build_entry(item):
            def itunes(key):
                return xpath_text(item, xpath_with_ns(f'./itunes:{key}', NS_MAP), default=None)

            enclosure_urls = (
                enclosure.attrib.get('url') for enclosure in item.findall('./enclosure'))
            media_url = next(enclosure_urls, xpath_text(item, 'link', fatal=False))
            if not media_url:
                return None

            guid = try_call(lambda: item.find('guid').text)
            if guid:
                media_url = smuggle_url(media_url, {'force_videoid': guid})

            return {
                '_type': 'url_transparent',
                'url': media_url,
                'title': try_call(lambda: item.find('title').text),
                'description': xpath_text(item, 'description', default=None),
                'timestamp': unified_timestamp(xpath_text(item, 'pubDate', default=None)),
                'duration': parse_duration(itunes('duration')),
                'thumbnail': url_or_none(xpath_attr(item, xpath_with_ns('./itunes:image', NS_MAP), 'href')),
                'episode': itunes('title'),
                'episode_number': int_or_none(itunes('episode')),
                'season_number': int_or_none(itunes('season')),
                'age_limit': AGE_LIMITS.get((itunes('explicit') or '').lower()),
            }

        entries = []
        for item in doc.findall('./channel/item'):
            entry = build_entry(item)
            if entry is not None:
                entries.append(entry)

        return {
            '_type': 'playlist',
            'id': url,
            'title': try_call(lambda: doc.find('./channel/title').text),
            'description': try_call(lambda: doc.find('./channel/description').text),
            'entries': entries,
        }

    @classmethod
    def _kvs_get_real_url(cls, video_url, license_code):
        if not video_url.startswith('function/0/'):
            return video_url  # not obfuscated

        parsed = urllib.parse.urlparse(video_url[len('function/0/'):])
        license = cls._kvs_get_license_token(license_code)
        urlparts = parsed.path.split('/')

        HASH_LENGTH = 32
        hash = urlparts[3][:HASH_LENGTH]
        indices = list(range(HASH_LENGTH))

        # Swap indices of hash according to the destination calculated from the license token
        accum = 0
        for src in reversed(range(HASH_LENGTH)):
            accum += license[src]
            dest = (src + accum) % HASH_LENGTH
            indices[src], indices[dest] = indices[dest], indices[src]

        urlparts[3] = ''.join(hash[index] for index in indices) + urlparts[3][HASH_LENGTH:]
        return urllib.parse.urlunparse(parsed._replace(path='/'.join(urlparts)))

    @staticmethod
    def _kvs_get_license_token(license):
        license = license.replace('$', '')
        license_values = [int(char) for char in license]

        modlicense = license.replace('0', '1')
        center = len(modlicense) // 2
        fronthalf = int(modlicense[:center + 1])
        backhalf = int(modlicense[center:])
        modlicense = str(4 * abs(fronthalf - backhalf))[:center + 1]

        return [
            (license_values[index + offset] + current) % 10
            for index, current in enumerate(map(int, modlicense))
            for offset in range(4)
        ]

    def _extract_kvs(self, url, webpage, video_id):
        """Extract video info from a page carrying a KVS player 'flashvars' object.

        @param url       URL of the page; used as Referer and as the base for
                         relative media/thumbnail URLs
        @param webpage   HTML of the page
        @param video_id  Id passed to _search_json while parsing flashvars
        @returns         Info dict with 'id', 'display_id', 'title',
                         'thumbnail' and 'formats'
        """
        flashvars = self._search_json(
            r'(?s:<script\b[^>]*>.*?var\s+flashvars\s*=)',
            webpage, 'flashvars', video_id, transform_source=js_to_json)

        # The display_id is the part after the last / of the canonical URL
        display_id = self._search_regex(
            r'(?:<link href="https?://[^"]+/(.+?)/?" rel="canonical"\s*/?>'
            r'|<link rel="canonical" href="https?://[^"]+/(.+?)/?"\s*/?>)',
            webpage, 'display_id', fatal=False)
        title = self._html_search_regex(r'<(?:h1|title)>(?:Video: )?(.+?)</(?:h1|title)>', webpage, 'title')

        thumbnail = flashvars['preview_url']
        if thumbnail.startswith('//'):
            # Protocol-relative: prepend everything before the first '/' of
            # the page URL (e.g. 'https:')
            thumbnail = url.partition('/')[0] + thumbnail

        is_url_key = re.compile(r'^video_(?:url|alt_url\d*)$').match
        url_keys = [key for key in flashvars.keys() if is_url_key(key)]

        formats = []
        for key in url_keys:
            source = flashvars[key]
            if '/get_file/' not in source:
                continue
            format_id = flashvars.get(f'{key}_text', key)
            fmt = {
                'url': urljoin(url, self._kvs_get_real_url(source, flashvars['license_code'])),
                'format_id': format_id,
                'ext': 'mp4',
                **(parse_resolution(format_id) or parse_resolution(source)),
                'http_headers': {'Referer': url},
            }
            if not fmt.get('height'):
                fmt['quality'] = 1
            formats.append(fmt)

        return {
            'id': flashvars['video_id'],
            'display_id': display_id,
            'title': title,
            'thumbnail': urljoin(url, thumbnail),
            'formats': formats,
        }

    def _real_extract(self, url):
        if url.startswith('//'):
            return self.url_result(self.http_scheme() + url)

        parsed_url = urllib.parse.urlparse(url)
        if not parsed_url.scheme:
            default_search = self.get_param('default_search')
            if default_search is None:
                default_search = 'fixup_error'

            if default_search in ('auto', 'auto_warning', 'fixup_error'):
                if re.match(r'^[^\s/]+\.[^\s/]+/', url):
                    self.report_warning('The url doesn\'t specify the protocol, trying with http')
                    return self.url_result('http://' + url)
                elif default_search != 'fixup_error':
                    if default_search == 'auto_warning':
                        if re.match(r'^(?:url|URL)$', url):
                            raise ExtractorError(
                                'Invalid URL:  %r . Call yt-dlp like this:  yt-dlp -v "https://www.youtube.com/watch?v=BaW_jenozKc"  ' % url,
                                expected=True)
                        else:
                            self.report_warning(
                                'Falling back to youtube search for  %s . Set --default-search "auto" to suppress this warning.' % url)
                    return self.url_result('ytsearch:' + url)

            if default_search in ('error', 'fixup_error'):
                raise ExtractorError(
                    '%r is not a valid URL. '
                    'Set --default-search "ytsearch" (or run  yt-dlp "ytsearch:%s" ) to search YouTube'
                    % (url, url), expected=True)
            else:
                if ':' not in default_search:
                    default_search += ':'
                return self.url_result(default_search + url)

        original_url = url
        url, smuggled_data = unsmuggle_url(url, {})
        force_videoid = None
        is_intentional = smuggled_data.get('to_generic')
        if 'force_videoid' in smuggled_data:
            force_videoid = smuggled_data['force_videoid']
            video_id = force_videoid
        else:
            video_id = self._generic_id(url)

        # Some webservers may serve compressed content of rather big size (e.g. gzipped flac),
        # making it impossible to download only a chunk of the file (yet we need only 512kB to
        # test whether it's HTML or not). With yt-dlp's default Accept-Encoding, this would
        # always result in downloading the whole file, which is not desirable.
        # Therefore, for the extraction pass we have to override Accept-Encoding to 'identity'
        # in order to accept raw bytes and be able to download only a chunk.
        # It would probably be better to solve this by checking Content-Type for
        # application/octet-stream after a HEAD request, but not sure if we can rely on this.
        full_response = self._request_webpage(url, video_id, headers=filter_dict({
            'Accept-Encoding': 'identity',
            'Referer': smuggled_data.get('referer'),
        }))
        new_url = full_response.url
        if new_url != extract_basic_auth(url)[0]:
            self.report_following_redirect(new_url)
            if force_videoid:
                new_url = smuggle_url(new_url, {'force_videoid': force_videoid})
            return self.url_result(new_url)

        info_dict = {
            'id': video_id,
            'title': self._generic_title(url),
            'timestamp': unified_timestamp(full_response.headers.get('Last-Modified'))
        }

        # Check for direct link to a video
        content_type = full_response.headers.get('Content-Type', '').lower()
        m = re.match(r'^(?P<type>audio|video|application(?=/(?:ogg$|(?:vnd\.apple\.|x-)?mpegurl)))/(?P<format_id>[^;\s]+)', content_type)
        if m:
            self.report_detected('direct video link')
            headers = filter_dict({'Referer': smuggled_data.get('referer')})
            format_id = str(m.group('format_id'))
            ext = determine_ext(url, default_ext=None) or urlhandle_detect_ext(full_response)
            subtitles = {}
            if format_id.endswith('mpegurl') or ext == 'm3u8':
                formats, subtitles = self._extract_m3u8_formats_and_subtitles(url, video_id, 'mp4', headers=headers)
            elif format_id.endswith('mpd') or format_id.endswith('dash+xml') or ext == 'mpd':
                formats, subtitles = self._extract_mpd_formats_and_subtitles(url, video_id, headers=headers)
            elif format_id == 'f4m' or ext == 'f4m':
                formats = self._extract_f4m_formats(url, video_id, headers=headers)
            else:
                formats = [{
                    'format_id': format_id,
                    'url': url,
                    'ext': ext,
                    'vcodec': 'none' if m.group('type') == 'audio' else None
                }]
                info_dict['direct'] = True
            info_dict.update({
                'formats': formats,
                'subtitles': subtitles,
                'http_headers': headers or None,
            })
            self._extra_manifest_info(info_dict, url)
            return info_dict

        if not self.get_param('test', False) and not is_intentional:
            force = self.get_param('force_generic_extractor', False)
            self.report_warning('%s generic information extractor' % ('Forcing' if force else 'Falling back on'))

        first_bytes = full_response.read(512)

        # Is it an M3U playlist?
        if first_bytes.startswith(b'#EXTM3U'):
            self.report_detected('M3U playlist')
            info_dict['formats'], info_dict['subtitles'] = self._extract_m3u8_formats_and_subtitles(url, video_id, 'mp4')
            self._extra_manifest_info(info_dict, url)
            return info_dict

        # Maybe it's a direct link to a video?
        # Be careful not to download the whole thing!
        if not is_html(first_bytes):
            self.report_warning(
                'URL could be a direct video link, returning it as such.')
            info_dict.update({
                'direct': True,
                'url': url,
            })
            return info_dict

        webpage = self._webpage_read_content(
            full_response, url, video_id, prefix=first_bytes)

        if '<title>DPG Media Privacy Gate</title>' in webpage:
            webpage = self._download_webpage(url, video_id)

        self.report_extraction(video_id)

        # Is it an RSS feed, a SMIL file, an XSPF playlist or a MPD manifest?
        try:
            try:
                doc = compat_etree_fromstring(webpage)
            except xml.etree.ElementTree.ParseError:
                doc = compat_etree_fromstring(webpage.encode('utf-8'))
            if doc.tag == 'rss':
                self.report_detected('RSS feed')
                return self._extract_rss(url, video_id, doc)
            elif doc.tag == 'SmoothStreamingMedia':
                info_dict['formats'], info_dict['subtitles'] = self._parse_ism_formats_and_subtitles(doc, url)
                self.report_detected('ISM manifest')
                return info_dict
            elif re.match(r'^(?:{[^}]+})?smil$', doc.tag):
                smil = self._parse_smil(doc, url, video_id)
                self.report_detected('SMIL file')
                return smil
            elif doc.tag == '{http://xspf.org/ns/0/}playlist':
                self.report_detected('XSPF playlist')
                return self.playlist_result(
                    self._parse_xspf(
                        doc, video_id, xspf_url=url,
                        xspf_base_url=full_response.url),
                    video_id)
            elif re.match(r'(?i)^(?:{[^}]+})?MPD$', doc.tag):
                info_dict['formats'], info_dict['subtitles'] = self._parse_mpd_formats_and_subtitles(
                    doc,
                    mpd_base_url=full_response.url.rpartition('/')[0],
                    mpd_url=url)
                self._extra_manifest_info(info_dict, url)
                self.report_detected('DASH manifest')
                return info_dict
            elif re.match(r'^{http://ns\.adobe\.com/f4m/[12]\.0}manifest$', doc.tag):
                info_dict['formats'] = self._parse_f4m_formats(doc, url, video_id)
                self.report_detected('F4M manifest')
                return info_dict
        except xml.etree.ElementTree.ParseError:
            pass

        info_dict.update({
            # it's tempting to parse this further, but you would
            # have to take into account all the variations like
            #   Video Title - Site Name
            #   Site Name | Video Title
            #   Video Title - Tagline | Site Name
            # and so on and so forth; it's just not practical
            'title': self._generic_title('', webpage, default='video'),
            'description': self._og_search_description(webpage, default=None),
            'thumbnail': self._og_search_thumbnail(webpage, default=None),
            'age_limit': self._rta_search(webpage),
        })

        self._downloader.write_debug('Looking for embeds')
        embeds = list(self._extract_embeds(original_url, webpage, urlh=full_response, info_dict=info_dict))
        if len(embeds) == 1:
            return merge_dicts(embeds[0], info_dict)
        elif embeds:
            return self.playlist_result(embeds, **info_dict)
        raise UnsupportedError(url)

    def _extract_embeds(self, url, webpage, *, urlh=None, info_dict={}):
        """Return a list of entries for the media embedded in `webpage`.

        Detection is attempted in this order, and the first step that yields
        something wins:
          1. `extract_from_webpage` of every registered extractor
          2. JW Player setup data
          3. video.js `.src(...)` calls
          4. KVS player
          5. JSON-LD
          6. regex heuristics (JW Player variants, Flow Player, Cinerama,
             Twitter card stream, Open Graph)
          7. `<meta http-equiv="refresh">` / `Refresh` header redirects
          8. `twitter:player` iframe

        @param url        URL of the page; may carry smuggled data, of which
                          `block_ies` (extractor keys to skip) is honoured
        @param webpage    Contents of the page as a string
        @param urlh       Optional response handle of the page. Its `url` is used
                          as the Referer of extracted media and its `Refresh`
                          header is checked for redirects
        @param info_dict  Metadata already known about the page. It is only read:
                          `display_id`/`id` give the video id, `title` and
                          `age_limit` are copied into the regex-detected entries
        @returns          A (possibly empty) list of info dicts / url results
        """
        info_dict = types.MappingProxyType(info_dict)  # Prevents accidental mutation
        video_id = traverse_obj(info_dict, 'display_id', 'id') or self._generic_id(url)
        url, smuggled_data = unsmuggle_url(url, {})
        actual_url = urlh.url if urlh else url

        # Sometimes embedded video player is hidden behind percent encoding
        # (e.g. https://github.com/ytdl-org/youtube-dl/issues/2448)
        # Unescaping the whole page allows to handle those cases in a generic way
        # FIXME: unescaping the whole page may break URLs, commenting out for now.
        # There probably should be a second run of generic extractor on unescaped webpage.
        # webpage = urllib.parse.unquote(webpage)

        embeds = []
        for ie in self._downloader._ies.values():
            if ie.ie_key() in smuggled_data.get('block_ies', []):
                continue
            gen = ie.extract_from_webpage(self._downloader, url, webpage)
            current_embeds = []
            try:
                while True:
                    current_embeds.append(next(gen))
            except self.StopExtraction:
                # This extractor claims the page exclusively: drop everything found so far
                self.report_detected(f'{ie.IE_NAME} exclusive embed', len(current_embeds),
                                     embeds and 'discarding other embeds')
                return current_embeds
            except StopIteration:
                self.report_detected(f'{ie.IE_NAME} embed', len(current_embeds))
                embeds.extend(current_embeds)

        if embeds:
            return embeds

        jwplayer_data = self._find_jwplayer_data(
            webpage, video_id, transform_source=js_to_json)
        if jwplayer_data:
            if isinstance(jwplayer_data.get('playlist'), str):
                self.report_detected('JW Player playlist')
                return [self.url_result(jwplayer_data['playlist'], 'JWPlatform')]
            try:
                info = self._parse_jwplayer_data(
                    jwplayer_data, video_id, require_title=False, base_url=url)
                if traverse_obj(info, 'formats', ('entries', ..., 'formats')):
                    self.report_detected('JW Player data')
                    return [info]
            except ExtractorError:
                # See https://github.com/ytdl-org/youtube-dl/pull/16735
                pass

        # Video.js embed
        mobj = re.search(
            r'(?s)\bvideojs\s*\(.+?([a-zA-Z0-9_$]+)\.src\s*\(\s*((?:\[.+?\]|{.+?}))\s*\)\s*;',
            webpage)
        if mobj is not None:
            varname = mobj.group(1)
            sources = variadic(self._parse_json(
                mobj.group(2), video_id, transform_source=js_to_json, fatal=False) or [])
            # manifest_url remembers the last source URL that passed validation, so that
            # a trailing source entry without a usable `src` cannot leak None (or a
            # non-string) into _extra_manifest_info below
            formats, subtitles, manifest_url = [], {}, None
            for source in sources:
                src = source.get('src')
                if not src or not isinstance(src, str):
                    continue
                src = urllib.parse.urljoin(url, src)
                manifest_url = src
                src_type = source.get('type')
                if isinstance(src_type, str):
                    src_type = src_type.lower()
                ext = determine_ext(src).lower()
                if src_type == 'video/youtube':
                    return [self.url_result(src, YoutubeIE.ie_key())]
                if src_type == 'application/dash+xml' or ext == 'mpd':
                    fmts, subs = self._extract_mpd_formats_and_subtitles(
                        src, video_id, mpd_id='dash', fatal=False)
                    formats.extend(fmts)
                    self._merge_subtitles(subs, target=subtitles)
                elif src_type == 'application/x-mpegurl' or ext == 'm3u8':
                    fmts, subs = self._extract_m3u8_formats_and_subtitles(
                        src, video_id, 'mp4', entry_protocol='m3u8_native',
                        m3u8_id='hls', fatal=False)
                    formats.extend(fmts)
                    self._merge_subtitles(subs, target=subtitles)

                if not formats:
                    formats.append({
                        'url': src,
                        # Prefer the extension implied by the MIME type; only fall back to
                        # the URL extension (or 'mp4') when the type gives nothing.
                        # The parentheses matter: a conditional expression binds looser
                        # than `or`, so without them an unknown URL extension would
                        # discard the MIME-derived one
                        'ext': mimetype2ext(src_type) or (ext if ext in KNOWN_EXTENSIONS else 'mp4'),
                        'http_headers': {
                            'Referer': actual_url,
                        },
                    })
            # https://docs.videojs.com/player#addRemoteTextTrack
            # https://html.spec.whatwg.org/multipage/media.html#htmltrackelement
            for sub_match in re.finditer(rf'(?s){re.escape(varname)}' r'\.addRemoteTextTrack\(({.+?})\s*,\s*(?:true|false)\)', webpage):
                sub = self._parse_json(
                    sub_match.group(1), video_id, transform_source=js_to_json, fatal=False) or {}
                sub_src = str_or_none(sub.get('src'))
                if not sub_src:
                    continue
                subtitles.setdefault(dict_get(sub, ('language', 'srclang')) or 'und', []).append({
                    'url': urllib.parse.urljoin(url, sub_src),
                    'name': sub.get('label'),
                    'http_headers': {
                        'Referer': actual_url,
                    },
                })
            if formats or subtitles:
                self.report_detected('video.js embed')
                videojs_info = {'formats': formats, 'subtitles': subtitles}
                if formats:
                    # formats is non-empty only if at least one source was valid,
                    # so manifest_url is a resolved URL string here
                    self._extra_manifest_info(videojs_info, manifest_url)
                return [videojs_info]

        # Look for generic KVS player (before json-ld bc of some urls that break otherwise)
        found = self._search_regex((
            r'<script\b[^>]+?\bsrc\s*=\s*(["\'])https?://(?:(?!\1)[^?#])+/kt_player\.js\?v=(?P<ver>\d+(?:\.\d+)+)\1[^>]*>',
            r'kt_player\s*\(\s*(["\'])(?:(?!\1)[\w\W])+\1\s*,\s*(["\'])https?://(?:(?!\2)[^?#])+/kt_player\.swf\?v=(?P<ver>\d+(?:\.\d+)+)\2\s*,',
        ), webpage, 'KVS player', group='ver', default=False)
        if found:
            self.report_detected('KVS Player')
            if found.split('.')[0] not in ('4', '5', '6'):
                self.report_warning(f'Untested major version ({found}) in player engine - download may fail.')
            return [self._extract_kvs(url, webpage, video_id)]

        # Looking for http://schema.org/VideoObject
        json_ld = self._search_json_ld(webpage, video_id, default={})
        if json_ld.get('url') not in (url, None):
            self.report_detected('JSON LD')
            is_direct = json_ld.get('ext') not in (None, *MEDIA_EXTENSIONS.manifests)
            return [merge_dicts({
                '_type': 'video' if is_direct else 'url_transparent',
                'url': smuggle_url(json_ld['url'], {
                    'force_videoid': video_id,
                    'to_generic': True,
                    'referer': url,
                }),
            }, json_ld)]

        def check_video(vurl):
            """Whether vurl looks like media rather than a player/image/subtitle/script asset"""
            if YoutubeIE.suitable(vurl):
                return True
            if RtmpIE.suitable(vurl):
                return True
            vpath = urllib.parse.urlparse(vurl).path
            vext = determine_ext(vpath, None)
            return vext not in (None, 'swf', 'png', 'jpg', 'srt', 'sbv', 'sub', 'vtt', 'ttml', 'js', 'xml')

        def filter_video(urls):
            return list(filter(check_video, urls))

        # Start with something easy: JW Player in SWFObject
        found = filter_video(re.findall(r'flashvars: [\'"](?:.*&)?file=(http[^\'"&]*)', webpage))
        if found:
            self.report_detected('JW Player in SFWObject')
        else:
            # Look for gorilla-vid style embedding
            found = filter_video(re.findall(r'''(?sx)
                (?:
                    jw_plugins|
                    JWPlayerOptions|
                    jwplayer\s*\(\s*["'][^'"]+["']\s*\)\s*\.setup
                )
                .*?
                ['"]?file['"]?\s*:\s*["\'](.*?)["\']''', webpage))
            if found:
                self.report_detected('JW Player embed')
        if not found:
            # Broaden the search a little bit
            found = filter_video(re.findall(r'[^A-Za-z0-9]?(?:file|source)=(http[^\'"&]*)', webpage))
            if found:
                self.report_detected('video file')
        if not found:
            # Broaden the findall a little bit: JWPlayer JS loader
            found = filter_video(re.findall(
                r'[^A-Za-z0-9]?(?:file|video_url)["\']?:\s*["\'](http(?![^\'"]+\.[0-9]+[\'"])[^\'"]+)["\']', webpage))
            if found:
                self.report_detected('JW Player JS loader')
        if not found:
            # Flow player
            found = filter_video(re.findall(r'''(?xs)
                flowplayer\("[^"]+",\s*
                    \{[^}]+?\}\s*,
                    \s*\{[^}]+? ["']?clip["']?\s*:\s*\{\s*
                        ["']?url["']?\s*:\s*["']([^"']+)["']
            ''', webpage))
            if found:
                self.report_detected('Flow Player')
        if not found:
            # Cinerama player
            found = re.findall(
                r"cinerama\.embedPlayer\(\s*\'[^']+\',\s*'([^']+)'", webpage)
            if found:
                self.report_detected('Cinerama player')
        if not found:
            # Try to find twitter cards info
            # twitter:player:stream should be checked before twitter:player since
            # it is expected to contain a raw stream (see
            # https://dev.twitter.com/cards/types/player#On_twitter.com_via_desktop_browser)
            found = filter_video(re.findall(
                r'<meta (?:property|name)="twitter:player:stream" (?:content|value)="(.+?)"', webpage))
            if found:
                self.report_detected('Twitter card')
        if not found:
            # We look for Open Graph info:
            # We have to match any number spaces between elements, some sites try to align them, e.g.: statigr.am
            # NOTE: this lookup used to sit behind an og:video:type check that compared a
            # re.findall() result against None and therefore always passed. The dead check
            # (and its regex scan) is dropped; the lookup stays unconditional, as it
            # effectively always was
            found = filter_video(re.findall(r'<meta.*?property="og:(?:video|audio)".*?content="(.*?)"', webpage))
            if found:
                self.report_detected('Open Graph video info')
        if not found:
            REDIRECT_REGEX = r'[0-9]{,2};\s*(?:URL|url)=\'?([^\'"]+)'
            found = re.search(
                r'(?i)<meta\s+(?=(?:[a-z-]+="[^"]+"\s+)*http-equiv="refresh")'
                r'(?:[a-z-]+="[^"]+"\s+)*?content="%s' % REDIRECT_REGEX,
                webpage)
            if not found:
                # Look also in Refresh HTTP header
                refresh_header = urlh and urlh.headers.get('Refresh')
                if refresh_header:
                    found = re.search(REDIRECT_REGEX, refresh_header)
            if found:
                new_url = urllib.parse.urljoin(url, unescapeHTML(found.group(1)))
                if new_url != url:
                    self.report_following_redirect(new_url)
                    return [self.url_result(new_url)]
                else:
                    # A refresh to the same page is not a redirect; keep looking
                    found = None

        if not found:
            # twitter:player is a https URL to iframe player that may or may not
            # be supported by yt-dlp thus this is checked the very last (see
            # https://dev.twitter.com/cards/types/player#On_twitter.com_via_desktop_browser)
            embed_url = self._html_search_meta('twitter:player', webpage, default=None)
            if embed_url and embed_url != url:
                self.report_detected('twitter:player iframe')
                return [self.url_result(embed_url)]

        if not found:
            return []

        domain_name = self._search_regex(r'^(?:https?://)?([^/]*)/.*', url, 'video uploader', default=None)

        entries = []
        for video_url in orderedSet(found):
            # The URLs were scraped out of HTML/JS source: undo backslash escapes,
            # HTML entities and escaped slashes before resolving against the page URL
            video_url = video_url.encode().decode('unicode-escape')
            video_url = unescapeHTML(video_url)
            video_url = video_url.replace('\\/', '/')
            video_url = urllib.parse.urljoin(url, video_url)
            video_id = urllib.parse.unquote(os.path.basename(video_url))

            # Sometimes, jwplayer extraction will result in a YouTube URL
            if YoutubeIE.suitable(video_url):
                entries.append(self.url_result(video_url, 'Youtube'))
                continue

            video_id = os.path.splitext(video_id)[0]
            headers = {
                'referer': actual_url
            }

            entry_info_dict = {
                'id': video_id,
                'uploader': domain_name,
                # info_dict defaults to an empty mapping, so these keys may be absent
                'title': info_dict.get('title'),
                'age_limit': info_dict.get('age_limit'),
                'http_headers': headers,
            }

            if RtmpIE.suitable(video_url):
                entry_info_dict.update({
                    '_type': 'url_transparent',
                    'ie_key': RtmpIE.ie_key(),
                    'url': video_url,
                })
                entries.append(entry_info_dict)
                continue

            ext = determine_ext(video_url)
            if ext == 'smil':
                entry_info_dict = {**self._extract_smil_info(video_url, video_id), **entry_info_dict}
            elif ext == 'xspf':
                return [self._extract_xspf_playlist(video_url, video_id)]
            elif ext == 'm3u8':
                entry_info_dict['formats'], entry_info_dict['subtitles'] = self._extract_m3u8_formats_and_subtitles(video_url, video_id, ext='mp4', headers=headers)
                self._extra_manifest_info(entry_info_dict, video_url)
            elif ext == 'mpd':
                entry_info_dict['formats'], entry_info_dict['subtitles'] = self._extract_mpd_formats_and_subtitles(video_url, video_id, headers=headers)
                self._extra_manifest_info(entry_info_dict, video_url)
            elif ext == 'f4m':
                entry_info_dict['formats'] = self._extract_f4m_formats(video_url, video_id, headers=headers)
            elif re.search(r'(?i)\.(?:ism|smil)/manifest', video_url) and video_url != url:
                # Just matching .ism/manifest is not enough to be reliably sure
                # whether it's actually an ISM manifest or some other streaming
                # manifest since there are various streaming URL formats
                # possible (see [1]) as well as some other shenanigans like
                # .smil/manifest URLs that actually serve an ISM (see [2]) and
                # so on.
                # Thus the most reasonable way to solve this is to delegate
                # to generic extractor in order to look into the contents of
                # the manifest itself.
                # 1. https://azure.microsoft.com/en-us/documentation/articles/media-services-deliver-content-overview/#streaming-url-formats
                # 2. https://svs.itworkscdn.net/lbcivod/smil:itwfcdn/lbci/170976.smil/Manifest
                entry_info_dict = self.url_result(
                    smuggle_url(video_url, {'to_generic': True}),
                    GenericIE.ie_key())
            else:
                entry_info_dict['url'] = video_url

            entries.append(entry_info_dict)

        if len(entries) > 1:
            for num, e in enumerate(entries, start=1):
                # 'url' results don't have a title
                if e.get('title') is not None:
                    e['title'] = '%s (%d)' % (e['title'], num)
        return entries
-												Move GenericIE into its own file

											
										
										
											2013-06-23 18:31:45 +00:00
+								import os
 								import re
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2022-10-09 10:39:36 +00:00
+								import types
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 10:54:43 +00:00
+								import urllib.parse
-												[cleanup] Mark some compat variables for removal (#2173)

Authored by fstirlitz, pukkandan

											
										
										
											2022-04-11 20:09:26 +00:00
+								import xml.etree.ElementTree
-												Move GenericIE into its own file

											
										
										
											2013-06-23 18:31:45 +00:00
-												[extractor] Framework for embed detection (#4307)

											
										
										
											2022-08-01 01:22:03 +00:00
+								from .common import InfoExtractor  # isort: split
-												[cleanup] Sort imports

Using https://github.com/PyCQA/isort

    isort -m VERTICAL_HANGING_INDENT --py 36 -l 80 --rr -n --tc .

											
										
										
											2022-04-11 22:32:57 +00:00
+								from .commonprotocols import RtmpIE
-												[youtube] Support jwplayer with YouTube URLs (Closes #2075)

											
										
										
											2014-01-06 00:42:58 +00:00
+								from .youtube import YoutubeIE
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 10:54:43 +00:00
+								from ..compat import compat_etree_fromstring
-												[util] Move compatibility functions out of util

utils is large enough without these compatibility functions.

Everything that is present in newer versions of Python (i.e. with dev Python it's just an import) goes into compat.py .
Everything else (i.e. youtube-dl-specific helpers) goes into utils.py .

											
										
										
											2014-11-02 10:23:40 +00:00
+								from ..utils import (
-												[cleanup] Sort imports

Using https://github.com/PyCQA/isort

    isort -m VERTICAL_HANGING_INDENT --py 36 -l 80 --rr -n --tc .

											
										
										
											2022-04-11 22:32:57 +00:00
+								    KNOWN_EXTENSIONS,
-												[extractor/generic] Fix JSON LD manifest extraction (#5577)

Closes #5572
Authored by: bashonly, pukkandan
											
										
										
											2022-11-18 02:04:03 +00:00
+								    MEDIA_EXTENSIONS,
-												[cleanup] Sort imports

Using https://github.com/PyCQA/isort

    isort -m VERTICAL_HANGING_INDENT --py 36 -l 80 --rr -n --tc .

											
										
										
											2022-04-11 22:32:57 +00:00
+								    ExtractorError,
 								    UnsupportedError,
-												fix up imports

											
										
										
											2014-08-27 23:00:59 +00:00
+								    determine_ext,
-												[extractor/generic] Attempt to detect live HLS (#6775)

* Extract duration for non-live generic HLS videos
* Add extractor-arg `is_live` to bypass live HLS check

Closes #6705
Authored by: bashonly
											
										
										
											2023-04-13 19:36:06 +00:00
+								    determine_protocol,
-												[generic] Extract subtitles from video.js (#3156)

Authored by: Lesmiscore 
											
										
										
											2022-03-23 06:28:53 +00:00
+								    dict_get,
-												[extractor/generic] Handle basic-auth when checking redirects

Closes #6352

											
										
										
											2023-02-26 04:57:04 +00:00
+								    extract_basic_auth,
-												[ie] Do not smuggle `http_headers`

See: https://github.com/yt-dlp/yt-dlp/security/advisories/GHSA-3ch3-jhc6-5r8x

Authored by: coletdjnz

											
										
										
											2023-08-16 23:42:48 +00:00
+								    filter_dict,
-												[extractor] Framework for embed detection (#4307)

											
										
										
											2022-08-01 01:22:03 +00:00
+								    format_field,
-												Preparing for release

											
										
										
											2021-01-07 06:41:05 +00:00
+								    int_or_none,
-												[generic] Add support for BOMs (Fixes #4753)

											
										
										
											2015-01-23 00:21:30 +00:00
+								    is_html,
-												[generic] Try parsing JWPlayer embedded videos (closes #12030)

											
										
										
											2017-02-16 15:42:36 +00:00
+								    js_to_json,
-												[utils] Introduce merge_dicts

											
										
										
											2018-04-27 19:47:17 +00:00
+								    merge_dicts,
-												[generic] Add support for Video.js embeds

											
										
										
											2017-09-27 17:29:42 +00:00
+								    mimetype2ext,
-												[generic] Simplify playlist support (#2948)

											
										
										
											2014-08-22 16:19:56 +00:00
+								    orderedSet,
-												Preparing for release

											
										
										
											2021-01-07 06:41:05 +00:00
+								    parse_duration,
-												[generic] Improve KVS player extraction (#2328)

Closes #2281
Authored by: trassshhub
											
										
										
											2022-01-13 16:51:00 +00:00
+								    parse_resolution,
-												[generic] Support embedded vimeo videos (#1602)

											
										
										
											2013-10-15 10:05:13 +00:00
+								    smuggle_url,
-												[generic] Extract subtitles from video.js (#3156)

Authored by: Lesmiscore 
											
										
										
											2022-03-23 06:28:53 +00:00
+								    str_or_none,
-												[extractor/generic] Don't return JW player without formats

CLoses #4765

											
										
										
											2022-08-27 00:50:48 +00:00
+								    traverse_obj,
-												[generic] Refactor `_extract_rss`

Closes #3738

											
										
										
											2022-05-17 22:44:13 +00:00
+								    try_call,
-												[generic] Support embedded vimeo videos (#1602)

											
										
										
											2013-10-15 10:05:13 +00:00
+								    unescapeHTML,
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 12:26:37 +00:00
+								    unified_timestamp,
-												[ministrygrid] Add extractor (Fixes #2900)

											
										
										
											2014-08-24 02:47:18 +00:00
+								    unsmuggle_url,
-												[extractor/generic] Add extractor-args `hls_key`, `variant_query` (#6567)

Authored by: bashonly
											
										
										
											2023-03-21 23:12:17 +00:00
+								    update_url_query,
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 12:26:37 +00:00
+								    url_or_none,
-												[cleanup] Misc (#8598)

Authored by: bashonly, pukkandan, seproDev, Grub4K

Co-authored-by: bashonly <bashonly@protonmail.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
Co-authored-by: sepro <4618135+seproDev@users.noreply.github.com>
											
										
										
											2023-12-30 21:27:36 +00:00
+								    urlhandle_detect_ext,
-												Update to ytdl-commit-195f22f6

[generic] Improve KVS (etc) extraction
https://github.com/ytdl-org/youtube-dl/commit/195f22f679330549882a8234e7234942893a4902

Closes #3716
Authored by: Grub4k, pukkandan
											
										
										
											2023-01-02 13:45:36 +00:00
+								    urljoin,
-												[cleanup Misc

Closes #5162

											
										
										
											2022-10-18 17:58:57 +00:00
+								    variadic,
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 12:26:37 +00:00
+								    xpath_attr,
-												[generic] Parse RSS enclosure URLs (Fixes #5091)

											
										
										
											2015-03-02 14:21:11 +00:00
+								    xpath_text,
-												Preparing for release

											
										
										
											2021-01-07 06:41:05 +00:00
+								    xpath_with_ns,
-												Move GenericIE into its own file

											
										
										
											2013-06-23 18:31:45 +00:00
+								)
-												[generic] Support double slash URLs (Fixes #1309)

											
										
										
											2013-08-24 20:49:52 +00:00
-												Move GenericIE into its own file

											
										
										
											2013-06-23 18:31:45 +00:00
+								class GenericIE(InfoExtractor):
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											2014-01-06 00:47:52 +00:00
+								    IE_DESC = 'Generic downloader that works on some sites'
-												Move GenericIE into its own file

											
										
										
											2013-06-23 18:31:45 +00:00
+								    _VALID_URL = r'.*'
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											2014-01-06 00:47:52 +00:00
+								    IE_NAME = 'generic'
-												[cleanup] Fix some typos (#4194)

Authored by: crazymoose77756
											
										
										
											2022-06-27 00:50:06 +00:00
+								    _NETRC_MACHINE = False  # Suppress username warning
-												GenericIE: Detect videos from Brightcove

Brightcove videos info is usually found in an <object class="BrightcoveExperience"></object> node, this is passed to a new method of BrightcoveIE that builds a url to extract the video.

											
										
										
											2013-07-10 15:49:11 +00:00
+								    _TESTS = [
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											2015-05-30 20:22:29 +00:00
+								        # Direct link to a video
 								        {
 								            'url': 'http://media.w3.org/2010/05/sintel/trailer.mp4',
 								            'md5': '67d406c2bcb6af27fa886f31aa934bbe',
 								            'info_dict': {
 								                'id': 'trailer',
 								                'ext': 'mp4',
 								                'title': 'trailer',
 								                'upload_date': '20100513',
-												[cleanup] Update extractor tests (#7718)

Authored by: trainman261
											
										
										
											2023-10-06 23:56:19 +00:00
+								                'direct': True,
 								                'timestamp': 1273772943.0,
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											2015-05-30 20:22:29 +00:00
+								            }
 								        },
-												[extractor/generic] Clarify test comment

											
										
										
											2015-05-30 20:36:20 +00:00
+								        # Direct link to media delivered compressed (until Accept-Encoding is *)
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											2015-05-30 20:22:29 +00:00
+								        {
 								            'url': 'http://calimero.tk/muzik/FictionJunction-Parallel_Hearts.flac',
 								            'md5': '128c42e68b13950268b648275386fc74',
 								            'info_dict': {
 								                'id': 'FictionJunction-Parallel_Hearts',
 								                'ext': 'flac',
 								                'title': 'FictionJunction-Parallel_Hearts',
 								                'upload_date': '20140522',
 								            },
 								            'expected_warnings': [
 								                'URL could be a direct video link, returning it as such.'
-												[generic] Update some _TESTS

											
										
										
											2016-08-28 07:46:11 +00:00
+								            ],
 								            'skip': 'URL invalid',
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											2015-05-30 20:22:29 +00:00
+								        },
 								        # Direct download with broken HEAD
 								        {
 								            'url': 'http://ai-radio.org:8000/radio.opus',
 								            'info_dict': {
 								                'id': 'radio',
 								                'ext': 'opus',
 								                'title': 'radio',
 								            },
 								            'params': {
 								                'skip_download': True,  # infinite live stream
 								            },
 								            'expected_warnings': [
-												[generic] Fix test_Generic_2

Now a HEAD request returns 400 Bad Request

											
										
										
											2016-04-16 11:44:12 +00:00
+								                r'501.*Not Implemented',
 								                r'400.*Bad Request',
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											2015-05-30 20:22:29 +00:00
+								            ],
 								        },
 								        # Direct link with incorrect MIME type
 								        {
 								            'url': 'http://ftp.nluug.nl/video/nluug/2014-11-20_nj14/zaal-2/5_Lennart_Poettering_-_Systemd.webm',
 								            'md5': '4ccbebe5f36706d85221f204d7eb5913',
 								            'info_dict': {
 								                'url': 'http://ftp.nluug.nl/video/nluug/2014-11-20_nj14/zaal-2/5_Lennart_Poettering_-_Systemd.webm',
 								                'id': '5_Lennart_Poettering_-_Systemd',
 								                'ext': 'webm',
 								                'title': '5_Lennart_Poettering_-_Systemd',
 								                'upload_date': '20141120',
-												[cleanup] Update extractor tests (#7718)

Authored by: trainman261
											
										
										
											2023-10-06 23:56:19 +00:00
+								                'direct': True,
 								                'timestamp': 1416498816.0,
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											2015-05-30 20:22:29 +00:00
+								            },
 								            'expected_warnings': [
 								                'URL could be a direct video link, returning it as such.'
 								            ]
 								        },
 								        # RSS feed
 								        {
 								            'url': 'http://phihag.de/2014/youtube-dl/rss2.xml',
 								            'info_dict': {
-												[generic] Set rss `guid` as video id (#2741)

Closes #2424
Authored by: Bricio
											
										
										
											2022-02-11 23:32:58 +00:00
+								                'id': 'https://phihag.de/2014/youtube-dl/rss2.xml',
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											2015-05-30 20:22:29 +00:00
+								                'title': 'Zero Punctuation',
 								                'description': 're:.*groundbreaking video review series.*'
 								            },
 								            'playlist_mincount': 11,
 								        },
 								        # RSS feed with enclosure
 								        {
 								            'url': 'http://podcastfeeds.nbcnews.com/audio/podcast/MSNBC-MADDOW-NETCAST-M4V.xml',
 								            'info_dict': {
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 12:26:37 +00:00
+								                'id': 'http://podcastfeeds.nbcnews.com/nbcnews/video/podcast/MSNBC-MADDOW-NETCAST-M4V.xml',
 								                'title': 'MSNBC Rachel Maddow (video)',
 								                'description': 're:.*her unique approach to storytelling.*',
 								            },
 								            'playlist': [{
 								                'info_dict': {
 								                    'ext': 'mov',
 								                    'id': 'pdv_maddow_netcast_mov-12-03-2020-223726',
 								                    'title': 'MSNBC Rachel Maddow (video) - 12-03-2020-223726',
 								                    'description': 're:.*her unique approach to storytelling.*',
 								                    'upload_date': '20201204',
 								                },
 								            }],
-												[cleanup] Update extractor tests (#7718)

Authored by: trainman261
											
										
										
											2023-10-06 23:56:19 +00:00
+								            'skip': 'Dead link',
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 12:26:37 +00:00
+								        },
 								        # RSS feed with item with description and thumbnails
 								        {
 								            'url': 'https://anchor.fm/s/dd00e14/podcast/rss',
 								            'info_dict': {
 								                'id': 'https://anchor.fm/s/dd00e14/podcast/rss',
 								                'title': 're:.*100% Hydrogen.*',
 								                'description': 're:.*In this episode.*',
 								            },
 								            'playlist': [{
 								                'info_dict': {
 								                    'ext': 'm4a',
-												[cleanup] Update extractor tests (#7718)

Authored by: trainman261
											
										
										
											2023-10-06 23:56:19 +00:00
+								                    'id': '818a5d38-01cd-152f-2231-ee479677fa82',
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 12:26:37 +00:00
+								                    'title': 're:Hydrogen!',
 								                    'description': 're:.*In this episode we are going.*',
 								                    'timestamp': 1567977776,
 								                    'upload_date': '20190908',
-												[cleanup] Update extractor tests (#7718)

Authored by: trainman261
											
										
										
											2023-10-06 23:56:19 +00:00
+								                    'duration': 423,
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 12:26:37 +00:00
+								                    'thumbnail': r're:^https?://.*\.jpg$',
 								                    'episode_number': 1,
 								                    'season_number': 1,
 								                    'age_limit': 0,
-												[generic] Set rss `guid` as video id (#2741)

Closes #2424
Authored by: Bricio
											
										
										
											2022-02-11 23:32:58 +00:00
+								                    'season': 'Season 1',
 								                    'direct': True,
 								                    'episode': 'Episode 1',
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 12:26:37 +00:00
+								                },
 								            }],
 								            'params': {
 								                'skip_download': True,
 								            },
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											2015-05-30 20:22:29 +00:00
+								        },
-												[generic] Prefer enclosures over links in RSS feeds


											
										
										
											2018-04-29 15:14:37 +00:00
+								        # RSS feed with enclosures and unsupported link URLs
 								        {
 								            'url': 'http://www.hellointernet.fm/podcast?format=rss',
 								            'info_dict': {
 								                'id': 'http://www.hellointernet.fm/podcast?format=rss',
 								                'description': 'CGP Grey and Brady Haran talk about YouTube, life, work, whatever.',
 								                'title': 'Hello Internet',
 								            },
 								            'playlist_mincount': 100,
 								        },
-												[generic] Set rss `guid` as video id (#2741)

Closes #2424
Authored by: Bricio
											
										
										
											2022-02-11 23:32:58 +00:00
+								        # RSS feed with guid
 								        {
 								            'url': 'https://www.omnycontent.com/d/playlist/a7b4f8fe-59d9-4afc-a79a-a90101378abf/bf2c1d80-3656-4449-9d00-a903004e8f84/efbff746-e7c1-463a-9d80-a903004e8f8f/podcast.rss',
 								            'info_dict': {
 								                'id': 'https://www.omnycontent.com/d/playlist/a7b4f8fe-59d9-4afc-a79a-a90101378abf/bf2c1d80-3656-4449-9d00-a903004e8f84/efbff746-e7c1-463a-9d80-a903004e8f8f/podcast.rss',
 								                'description': 'md5:be809a44b63b0c56fb485caf68685520',
 								                'title': 'The Little Red Podcast',
 								            },
 								            'playlist_mincount': 76,
 								        },
-												[extractor/generic] Add generic SMIL tests

											
										
										
											2015-08-01 19:16:21 +00:00
+								        # SMIL from http://videolectures.net/promogram_igor_mekjavic_eng
 								        {
 								            'url': 'http://videolectures.net/promogram_igor_mekjavic_eng/video/1/smil.xml',
 								            'info_dict': {
 								                'id': 'smil',
 								                'ext': 'mp4',
 								                'title': 'Automatics, robotics and biocybernetics',
 								                'description': 'md5:815fc1deb6b3a2bff99de2d5325be482',
-												[generic] Update test

											
										
										
											2015-10-31 17:05:30 +00:00
+								                'upload_date': '20130627',
-												[extractor/generic] Add generic SMIL tests

											
										
										
											2015-08-01 19:16:21 +00:00
+								                'formats': 'mincount:16',
 								                'subtitles': 'mincount:1',
 								            },
 								            'params': {
 								                'force_generic_extractor': True,
 								                'skip_download': True,
 								            },
 								        },
 								        # SMIL from http://www1.wdr.de/mediathek/video/livestream/index.html
 								        {
 								            'url': 'http://metafilegenerator.de/WDR/WDR_FS/hds/hds.smil',
 								            'info_dict': {
 								                'id': 'hds',
 								                'ext': 'flv',
 								                'title': 'hds',
 								                'formats': 'mincount:1',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
 								        # SMIL from https://www.restudy.dk/video/play/id/1637
 								        {
 								            'url': 'https://www.restudy.dk/awsmedia/SmilDirectory/video_1637.xml',
 								            'info_dict': {
 								                'id': 'video_1637',
 								                'ext': 'flv',
 								                'title': 'video_1637',
 								                'formats': 'mincount:3',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
 								        # SMIL from http://adventure.howstuffworks.com/5266-cool-jobs-iditarod-musher-video.htm
 								        {
 								            'url': 'http://services.media.howstuffworks.com/videos/450221/smil-service.smil',
 								            'info_dict': {
 								                'id': 'smil-service',
 								                'ext': 'flv',
 								                'title': 'smil-service',
 								                'formats': 'mincount:1',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
 								        # SMIL from http://new.livestream.com/CoheedandCambria/WebsterHall/videos/4719370
 								        {
 								            'url': 'http://api.new.livestream.com/accounts/1570303/events/1585861/videos/4719370.smil',
 								            'info_dict': {
 								                'id': '4719370',
 								                'ext': 'mp4',
 								                'title': '571de1fd-47bc-48db-abf9-238872a58d1f',
 								                'formats': 'mincount:3',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[extractor/generic] Add test for xspf playlist

											
										
										
											2015-08-09 13:47:08 +00:00
+								        # XSPF playlist from http://www.telegraaf.nl/tv/nieuws/binnenland/24353229/__Tikibad_ontruimd_wegens_brand__.html
 								        {
 								            'url': 'http://www.telegraaf.nl/xml/playlist/2015/8/7/mZlp2ctYIUEB.xspf',
 								            'info_dict': {
 								                'id': 'mZlp2ctYIUEB',
 								                'ext': 'mp4',
 								                'title': 'Tikibad ontruimd wegens brand',
 								                'description': 'md5:05ca046ff47b931f9b04855015e163a4',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											2017-01-02 12:08:07 +00:00
+								                'thumbnail': r're:^https?://.*\.jpg$',
-												[extractor/generic] Add test for xspf playlist

											
										
										
											2015-08-09 13:47:08 +00:00
+								                'duration': 33,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[cleanup] Update extractor tests (#7718)

Authored by: trainman261
											
										
										
											2023-10-06 23:56:19 +00:00
+								            'skip': '404 Not Found',
-												[extractor/generic] Add test for xspf playlist

											
										
										
											2015-08-09 13:47:08 +00:00
+								        },
-												[extractor/generic] Add direct mpd url test

											
										
										
											2016-02-12 18:36:47 +00:00
+								        # MPD from http://dash-mse-test.appspot.com/media.html
 								        {
 								            'url': 'http://yt-dash-mse-test.commondatastorage.googleapis.com/media/car-20120827-manifest.mpd',
 								            'md5': '4b57baab2e30d6eb3a6a09f0ba57ef53',
 								            'info_dict': {
 								                'id': 'car-20120827-manifest',
 								                'ext': 'mp4',
 								                'title': 'car-20120827-manifest',
 								                'formats': 'mincount:9',
-												[ThePlatform] Fix tests failed since 79ba9140dc8fcf5883b7473596e8f20cba6b479f

											
										
										
											2016-04-24 12:44:52 +00:00
+								                'upload_date': '20130904',
-												[cleanup] Update extractor tests (#7718)

Authored by: trainman261
											
										
										
											2023-10-06 23:56:19 +00:00
+								                'timestamp': 1378272859.0,
-												[extractor/generic] Add direct mpd url test

											
										
										
											2016-02-12 18:36:47 +00:00
+								            },
 								        },
-												[extractor/generic] Add another test for generic m3u8

											
										
										
											2016-03-18 15:54:33 +00:00
+								        # m3u8 served with Content-Type: audio/x-mpegURL; charset=utf-8
 								        {
 								            'url': 'http://once.unicornmedia.com/now/master/playlist/bb0b18ba-64f5-4b1b-a29f-0ac252f06b68/77a785f3-5188-4806-b788-0893a61634ed/93677179-2d99-4ef4-9e17-fe70d49abfbf/content.m3u8',
 								            'info_dict': {
 								                'id': 'content',
 								                'ext': 'mp4',
 								                'title': 'content',
 								                'formats': 'mincount:8',
 								            },
 								            'params': {
 								                # m3u8 downloads
 								                'skip_download': True,
-												[generic] Update some _TESTS

											
										
										
											2016-08-28 07:46:11 +00:00
+								            },
 								            'skip': 'video gone',
-												[extractor/generic] Add another test for generic m3u8

											
										
										
											2016-03-18 15:54:33 +00:00
+								        },
-												[extractor/generic] Add a test for m3u playlist served without proper Content-Type

											
										
										
											2016-03-18 16:49:11 +00:00
+								        # m3u8 served with Content-Type: text/plain
 								        {
 								            'url': 'http://www.nacentapps.com/m3u8/index.m3u8',
 								            'info_dict': {
 								                'id': 'index',
 								                'ext': 'mp4',
 								                'title': 'index',
 								                'upload_date': '20140720',
 								                'formats': 'mincount:11',
 								            },
 								            'params': {
 								                # m3u8 downloads
 								                'skip_download': True,
-												[generic] Update some _TESTS

											
										
										
											2016-08-28 07:46:11 +00:00
+								            },
 								            'skip': 'video gone',
-												[extractor/generic] Add a test for m3u playlist served without proper Content-Type

											
										
										
											2016-03-18 16:49:11 +00:00
+								        },
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											2015-05-30 20:22:29 +00:00
+								        # google redirect
 								        {
 								            'url': 'http://www.google.com/url?sa=t&rct=j&q=&esrc=s&source=web&cd=1&cad=rja&ved=0CCUQtwIwAA&url=http%3A%2F%2Fwww.youtube.com%2Fwatch%3Fv%3DcmQHVoWB5FY&ei=F-sNU-LLCaXk4QT52ICQBQ&usg=AFQjCNEw4hL29zgOohLXvpJ-Bdh2bils1Q&bvm=bv.61965928,d.bGE',
 								            'info_dict': {
 								                'id': 'cmQHVoWB5FY',
 								                'ext': 'mp4',
 								                'upload_date': '20130224',
-												[cleanup] Update extractor tests (#7718)

Authored by: trainman261
											
										
										
											2023-10-06 23:56:19 +00:00
+								                'uploader_id': '@TheVerge',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											2017-01-02 12:08:07 +00:00
+								                'description': r're:^Chris Ziegler takes a look at the\.*',
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											2015-05-30 20:22:29 +00:00
+								                'uploader': 'The Verge',
 								                'title': 'First Firefox OS phones side-by-side',
 								            },
 								            'params': {
 								                'skip_download': False,
 								            }
 								        },
-												[extractor/generic] Fix following redirect in Refresh HTTP header on python 2

											
										
										
											2015-09-20 05:16:12 +00:00
+								        {
 								            # redirect in Refresh HTTP header
 								            'url': 'https://www.facebook.com/l.php?u=https%3A%2F%2Fwww.youtube.com%2Fwatch%3Fv%3DpO8h3EaFRdo&h=TAQHsoToz&enc=AZN16h-b6o4Zq9pZkCCdOLNKMN96BbGMNtcFwHSaazus4JHT_MFYkAA-WARTX2kvsCIdlAIyHZjl6d33ILIJU7Jzwk_K3mcenAXoAzBNoZDI_Q7EXGDJnIhrGkLXo_LJ_pAa2Jzbx17UHMd3jAs--6j2zaeto5w9RTn8T_1kKg3fdC5WPX9Dbb18vzH7YFX0eSJmoa6SP114rvlkw6pkS1-T&s=1',
 								            'info_dict': {
 								                'id': 'pO8h3EaFRdo',
 								                'ext': 'mp4',
 								                'title': 'Tripeo Boiler Room x Dekmantel Festival DJ Set',
 								                'description': 'md5:6294cc1af09c4049e0652b51a2df10d5',
 								                'upload_date': '20150917',
 								                'uploader_id': 'brtvofficial',
 								                'uploader': 'Boiler Room',
 								            },
 								            'params': {
 								                'skip_download': False,
 								            },
 								        },
-												GenericIE: Detect videos from Brightcove

Brightcove videos info is usually found in an <object class="BrightcoveExperience"></object> node, this is passed to a new method of BrightcoveIE that builds a url to extract the video.

											
										
										
											2013-07-10 15:49:11 +00:00
+								        {
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											2014-01-06 00:47:52 +00:00
+								            'url': 'http://www.hodiho.fr/2013/02/regis-plante-sa-jeep.html',
-												[generic] Update test

											
										
										
											2014-04-14 11:51:46 +00:00
+								            'md5': '85b90ccc9d73b4acd9138d3af4c27f89',
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											2014-01-06 00:47:52 +00:00
+								            'info_dict': {
-												[generic] Update test

											
										
										
											2014-04-14 11:51:46 +00:00
+								                'id': '13601338388002',
 								                'ext': 'mp4',
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											2014-01-06 00:47:52 +00:00
+								                'uploader': 'www.hodiho.fr',
 								                'title': 'R\u00e9gis plante sa Jeep',
-												GenericIE: Detect videos from Brightcove

Brightcove videos info is usually found in an <object class="BrightcoveExperience"></object> node, this is passed to a new method of BrightcoveIE that builds a url to extract the video.

											
										
										
											2013-07-10 15:49:11 +00:00
+								            }
 								        },
-												[generic] Detect bandcamp pages that use custom domains (closes #1662)

They embed the original url in the 'og:url' property.

											
										
										
											2013-10-27 13:40:25 +00:00
+								        # bandcamp page with custom domain
 								        {
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											2014-01-06 00:47:52 +00:00
+								            'add_ie': ['Bandcamp'],
 								            'url': 'http://bronyrock.com/track/the-pony-mash',
 								            'info_dict': {
-												[generic] Modernize tests

											
										
										
											2014-04-14 11:56:29 +00:00
+								                'id': '3235767654',
 								                'ext': 'mp3',
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											2014-01-06 00:47:52 +00:00
+								                'title': 'The Pony Mash',
 								                'uploader': 'M_Pallante',
-												[generic] Detect bandcamp pages that use custom domains (closes #1662)

They embed the original url in the 'og:url' property.

											
										
										
											2013-10-27 13:40:25 +00:00
+								            },
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											2014-01-06 00:47:52 +00:00
+								            'skip': 'There is a limit of 200 free downloads / month for the test song',
-												[generic] Detect bandcamp pages that use custom domains (closes #1662)

They embed the original url in the 'og:url' property.

											
										
										
											2013-10-27 13:40:25 +00:00
+								        },
-												Add support for embed.ly

											
										
										
											2014-02-24 00:15:51 +00:00
+								        # embed.ly video
 								        {
 								            'url': 'http://www.tested.com/science/weird/460206-tested-grinding-coffee-2000-frames-second/',
 								            'info_dict': {
 								                'id': '9ODmcdjQcHQ',
 								                'ext': 'mp4',
-												[generic] Add all test attributes for embedly (#2447)

In the future, we may want to not only print something, but throw an error for untested properties.

											
										
										
											2014-03-05 13:05:44 +00:00
+								                'title': 'Tested: Grinding Coffee at 2000 Frames Per Second',
 								                'upload_date': '20140225',
 								                'description': 'md5:06a40fbf30b220468f1e0957c0f558ff',
 								                'uploader': 'Tested',
 								                'uploader_id': 'testedcom',
-												Add support for embed.ly

											
										
										
											2014-02-24 00:15:51 +00:00
+								            },
 								            # No need to test YoutubeIE here
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[generic/funnyordie] Add support for funnyordie embeds (Fixes #2546)

											
										
										
											2014-03-11 15:51:36 +00:00
+								        # funnyordie embed
 								        {
 								            'url': 'http://www.theguardian.com/world/2014/mar/11/obama-zach-galifianakis-between-two-ferns',
 								            'info_dict': {
 								                'id': '18e820ec3f',
 								                'ext': 'mp4',
 								                'title': 'Between Two Ferns with Zach Galifianakis: President Barack Obama',
 								                'description': 'Episode 18: President Barack Obama sits down with Zach Galifianakis for his most memorable interview yet.',
-												[generic] Add support for embedded rutv player

											
										
										
											2014-03-16 19:00:31 +00:00
+								            },
-												[generic] Update some _TESTS

											
										
										
											2016-08-28 07:46:11 +00:00
+								            # HEAD requests lead to endless 301, while GET is OK
 								            'expected_warnings': ['301'],
-												[generic/funnyordie] Add support for funnyordie embeds (Fixes #2546)

											
										
										
											2014-03-11 15:51:36 +00:00
+								        },
-												[generic] Add support for embedded rutv player

											
										
										
											2014-03-16 19:00:31 +00:00
+								        # RUTV embed
 								        {
 								            'url': 'http://www.rg.ru/2014/03/15/reg-dfo/anklav-anons.html',
 								            'info_dict': {
 								                'id': '776940',
 								                'ext': 'mp4',
 								                'title': 'Охотское море стало целиком российским',
 								                'description': 'md5:5ed62483b14663e2a95ebbe115eb8f43',
 								            },
 								            'params': {
 								                # m3u8 download
 								                'skip_download': True,
 								            },
-												[ted] Simplify embed code (#2587)

											
										
										
											2014-03-20 15:33:23 +00:00
+								        },
-												[extractor/generic] Add test for tvc embed

											
										
										
											2015-06-12 10:28:45 +00:00
+								        # TVC embed
 								        {
 								            'url': 'http://sch1298sz.mskobr.ru/dou_edu/karamel_ki/filial_galleries/video/iframe_src_http_tvc_ru_video_iframe_id_55304_isplay_false_acc_video_id_channel_brand_id_11_show_episodes_episode_id_32307_frameb/',
 								            'info_dict': {
 								                'id': '55304',
 								                'ext': 'mp4',
 								                'title': 'Дошкольное воспитание',
 								            },
 								        },
-												[generic] Add test for sportbox embeds

											
										
										
											2015-05-15 17:18:21 +00:00
+								        # SportBox embed
 								        {
 								            'url': 'http://www.vestifinance.ru/articles/25753',
 								            'info_dict': {
 								                'id': '25753',
-												[generic] Fix an MTV test and another test that breaks nosetests

											
										
										
											2016-07-26 03:11:36 +00:00
+								                'title': 'Прямые трансляции с Форума-выставки "Госзаказ-2013"',
-												[generic] Add test for sportbox embeds

											
										
										
											2015-05-15 17:18:21 +00:00
+								            },
 								            'playlist': [{
 								                'info_dict': {
 								                    'id': '370908',
 								                    'title': 'Госзаказ. День 3',
 								                    'ext': 'mp4',
 								                }
 								            }, {
 								                'info_dict': {
 								                    'id': '370905',
 								                    'title': 'Госзаказ. День 2',
 								                    'ext': 'mp4',
 								                }
 								            }, {
 								                'info_dict': {
 								                    'id': '370902',
 								                    'title': 'Госзаказ. День 1',
 								                    'ext': 'mp4',
 								                }
 								            }],
 								            'params': {
 								                # m3u8 download
 								                'skip_download': True,
 								            },
 								        },
-												[extractor/generic] Add test for myvi embed

											
										
										
											2015-07-09 19:15:55 +00:00
+								        # Myvi.ru embed
 								        {
 								            'url': 'http://www.kinomyvi.tv/news/detail/Pervij-dublirovannij-trejler--Uzhastikov-_nOw1',
 								            'info_dict': {
 								                'id': 'f4dafcad-ff21-423d-89b5-146cfd89fa1e',
 								                'ext': 'mp4',
 								                'title': 'Ужастики, русский трейлер (2015)',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											2017-01-02 12:08:07 +00:00
+								                'thumbnail': r're:^https?://.*\.jpg$',
-												[extractor/generic] Add test for myvi embed

											
										
										
											2015-07-09 19:15:55 +00:00
+								                'duration': 153,
-												[cleanup] Remove dead extractors (#8604)

Closes #1609, Closes #3232, Closes #4763, Closes #6026, Closes #6322, Closes #7912
Authored by: seproDev
											
										
										
											2023-11-26 03:09:59 +00:00
+								            },
 								            'skip': 'Site dead',
-												[extractor/generic] Add test for myvi embed

											
										
										
											2015-07-09 19:15:55 +00:00
+								        },
-												[extractor/generic] Add test for xhamster embed

											
										
										
											2015-06-21 17:18:28 +00:00
+								        # XHamster embed
 								        {
 								            'url': 'http://www.numisc.com/forum/showthread.php?11696-FM15-which-pumiscer-was-this-%28-vid-%29-%28-alfa-as-fuck-srx-%29&s=711f5db534502e22260dec8c5e2d66d8',
 								            'info_dict': {
 								                'id': 'showthread',
 								                'title': '[NSFL] [FM15] which pumiscer was this ( vid ) ( alfa as fuck srx )',
 								            },
 								            'playlist_mincount': 7,
-												[generic] Update some _TESTS

											
										
										
											2016-08-28 07:46:11 +00:00
+								            # This forum does not allow <iframe> syntaxes anymore
 								            # Now HTML tags are displayed as-is
 								            'skip': 'No videos on this page',
-												[extractor/generic] Add test for xhamster embed

											
										
										
											2015-06-21 17:18:28 +00:00
+								        },
-												[ted] Simplify embed code (#2587)

											
										
										
											2014-03-20 15:33:23 +00:00
+								        # Embedded TED video
 								        {
 								            'url': 'http://en.support.wordpress.com/videos/ted-talks/',
-												[generic] Fix testcases

											
										
										
											2014-09-29 03:12:57 +00:00
+								            'md5': '65fdff94098e4a607385a60c5177c638',
-												[ted] Simplify embed code (#2587)

											
										
										
											2014-03-20 15:33:23 +00:00
+								            'info_dict': {
-												[generic] Fix testcases

											
										
										
											2014-09-29 03:12:57 +00:00
+								                'id': '1969',
-												[ted] Simplify embed code (#2587)

											
										
										
											2014-03-20 15:33:23 +00:00
+								                'ext': 'mp4',
-												[generic] Fix testcases

											
										
										
											2014-09-29 03:12:57 +00:00
+								                'title': 'Hidden miracles of the natural world',
 								                'uploader': 'Louie Schwartzberg',
 								                'description': 'md5:8145d19d320ff3e52f28401f4c4283b9',
-												[ted] Simplify embed code (#2587)

											
										
										
											2014-03-20 15:33:23 +00:00
+								            }
-												[generic/funnyordie] Add support for funnyordie embeds (Fixes #2546)

											
										
										
											2014-03-11 15:51:36 +00:00
+								        },
-												[generic] Add nowvideo test hidden behind percent encoding

											
										
										
											2014-03-14 21:39:53 +00:00
+								        # nowvideo embed hidden behind percent encoding
 								        {
 								            'url': 'http://www.waoanime.tv/the-super-dimension-fortress-macross-episode-1/',
 								            'md5': '2baf4ddd70f697d94b1c18cf796d5107',
 								            'info_dict': {
 								                'id': '06e53103ca9aa',
 								                'ext': 'flv',
 								                'title': 'Macross Episode 001  Watch Macross Episode 001 onl',
 								                'description': 'No description',
 								            },
-												Merge remote-tracking branch 'dstftw/generic-webpage-unescape'

Conflicts:
	youtube_dl/extractor/generic.py

											
										
										
											2014-03-21 21:14:24 +00:00
+								        },
-												[arte] Add support for embedded videos (Fixes #2620)

											
										
										
											2014-03-24 21:01:47 +00:00
+								        # arte embed
 								        {
 								            'url': 'http://www.tv-replay.fr/redirection/20-03-14/x-enius-arte-10753389.html',
 								            'md5': '7653032cbb25bf6c80d80f217055fa43',
 								            'info_dict': {
 								                'id': '048195-004_PLUS7-F',
 								                'ext': 'flv',
 								                'title': 'X:enius',
 								                'description': 'md5:d5fdf32ef6613cdbfd516ae658abf168',
 								                'upload_date': '20140320',
 								            },
 								            'params': {
 								                'skip_download': 'Requires rtmpdump'
-												[generic] Update some _TESTS

											
										
										
											2016-08-28 07:46:11 +00:00
+								            },
 								            'skip': 'video gone',
-												[arte] Add support for embedded videos (Fixes #2620)

											
										
										
											2014-03-24 21:01:47 +00:00
+								        },
-												[extractor/generic] Add support for francetv embeds

											
										
										
											2015-07-18 16:56:00 +00:00
+								        # francetv embed
 								        {
 								            'url': 'http://www.tsprod.com/replay-du-concert-alcaline-de-calogero',
 								            'info_dict': {
 								                'id': 'EV_30231',
 								                'ext': 'mp4',
 								                'title': 'Alcaline, le concert avec Calogero',
 								                'description': 'md5:61f08036dcc8f47e9cfc33aed08ffaff',
 								                'upload_date': '20150226',
 								                'timestamp': 1424989860,
 								                'duration': 5400,
 								            },
 								            'params': {
 								                # m3u8 downloads
 								                'skip_download': True,
 								            },
 								            'expected_warnings': [
 								                'Forbidden'
 								            ]
 								        },
-												[condenast|generic] Add support for condenast embeds (Fixes #2783)

											
										
										
											2014-04-21 03:47:52 +00:00
+								        # Condé Nast embed
 								        {
 								            'url': 'http://www.wired.com/2014/04/honda-asimo/',
 								            'md5': 'ba0dfe966fa007657bd1443ee672db0f',
 								            'info_dict': {
 								                'id': '53501be369702d3275860000',
 								                'ext': 'mp4',
 								                'title': 'Honda’s  New Asimo Robot Is More Human Than Ever',
 								            }
-												[generic] Add support for protocol-independent URLs (Fixes #2810)

											
										
										
											2014-04-29 23:46:06 +00:00
+								        },
 								        # Dailymotion embed
 								        {
 								            'url': 'http://www.spi0n.com/zap-spi0n-com-n216/',
 								            'md5': '441aeeb82eb72c422c7f14ec533999cd',
 								            'info_dict': {
 								                'id': 'k2mm4bCdJ6CQ2i7c8o2',
 								                'ext': 'mp4',
 								                'title': 'Le Zap de Spi0n n°216 - Zapping du Web',
-												[ThePlatform] Fix tests failed since 79ba9140dc8fcf5883b7473596e8f20cba6b479f

											
										
										
											2016-04-24 12:44:52 +00:00
+								                'description': 'md5:faf028e48a461b8b7fad38f1e104b119',
-												[generic] Add support for protocol-independent URLs (Fixes #2810)

											
										
										
											2014-04-29 23:46:06 +00:00
+								                'uploader': 'Spi0n',
-												[ThePlatform] Fix tests failed since 79ba9140dc8fcf5883b7473596e8f20cba6b479f

											
										
										
											2016-04-24 12:44:52 +00:00
+								                'uploader_id': 'xgditw',
 								                'upload_date': '20140425',
 								                'timestamp': 1398441542,
-												[generic] Add support for protocol-independent URLs (Fixes #2810)

											
										
										
											2014-04-29 23:46:06 +00:00
+								            },
 								            'add_ie': ['Dailymotion'],
-												[generic] Add support for <embed YouTube

											
										
										
											2014-06-09 20:06:45 +00:00
+								        },
-												[dailymail] Add support for embeds

											
										
										
											2017-07-09 13:06:24 +00:00
+								        # DailyMail embed
 								        {
 								            'url': 'http://www.bumm.sk/krimi/2017/07/05/biztonsagi-kamera-buktatta-le-az-agg-ferfit-utlegelo-apolot',
 								            'info_dict': {
 								                'id': '1495629',
 								                'ext': 'mp4',
 								                'title': 'Care worker punches elderly dementia patient in head 11 times',
 								                'description': 'md5:3a743dee84e57e48ec68bf67113199a5',
 								            },
 								            'add_ie': ['DailyMail'],
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[generic] Add support for <embed YouTube

											
										
										
											2014-06-09 20:06:45 +00:00
+								        # YouTube embed
 								        {
 								            'url': 'http://www.badzine.de/ansicht/datum/2014/06/09/so-funktioniert-die-neue-englische-badminton-liga.html',
 								            'info_dict': {
 								                'id': 'FXRb4ykk4S0',
 								                'ext': 'mp4',
 								                'title': 'The NBL Auction 2014',
 								                'uploader': 'BADMINTON England',
 								                'uploader_id': 'BADMINTONEvents',
 								                'upload_date': '20140603',
 								                'description': 'md5:9ef128a69f1e262a700ed83edb163a73',
 								            },
 								            'add_ie': ['Youtube'],
 								            'params': {
 								                'skip_download': True,
 								            }
 								        },
-												Updated to release 2020.11.21.1

											
										
										
											2020-11-21 14:50:42 +00:00
+								        # MTVServices embed
-												[generic] Extract mtvservices embedded videos

											
										
										
											2014-06-22 19:38:04 +00:00
+								        {
-												[generic] Update test_Generic_40

The original link now redirects to a YouTube user channel.

											
										
										
											2016-06-10 08:39:31 +00:00
+								            'url': 'http://www.vulture.com/2016/06/new-key-peele-sketches-released.html',
 								            'md5': 'ca1aef97695ef2c1d6973256a57e5252',
-												[generic] Extract mtvservices embedded videos

											
										
										
											2014-06-22 19:38:04 +00:00
+								            'info_dict': {
-												[generic] Update test_Generic_40

The original link now redirects to a YouTube user channel.

											
										
										
											2016-06-10 08:39:31 +00:00
+								                'id': '769f7ec0-0692-4d62-9b45-0d88074bffc1',
-												[generic] Extract mtvservices embedded videos

											
										
										
											2014-06-22 19:38:04 +00:00
+								                'ext': 'mp4',
-												[generic] Update test_Generic_40

The original link now redirects to a YouTube user channel.

											
										
										
											2016-06-10 08:39:31 +00:00
+								                'title': 'Key and Peele|October 10, 2012|2|203|Liam Neesons - Uncensored',
 								                'description': 'Two valets share their love for movie star Liam Neesons.',
-												[generic] Fix an MTV test and another test that breaks nosetests

											
										
										
											2016-07-26 03:11:36 +00:00
+								                'timestamp': 1349922600,
 								                'upload_date': '20121011',
-												[generic] Extract mtvservices embedded videos

											
										
										
											2014-06-22 19:38:04 +00:00
+								            },
 								        },
-												Add a _TEST_

											
										
										
											2014-05-21 09:55:37 +00:00
+								        # YouTube embed via <data-embed-url="">
 								        {
 								            'url': 'https://play.google.com/store/apps/details?id=com.gameloft.android.ANMP.GloftA8HM',
 								            'info_dict': {
-												[generic] Fix testcases

											
										
										
											2014-09-29 03:12:57 +00:00
+								                'id': '4vAffPZIT44',
-												Add a _TEST_

											
										
										
											2014-05-21 09:55:37 +00:00
+								                'ext': 'mp4',
-												[generic] Fix testcases

											
										
										
											2014-09-29 03:12:57 +00:00
+								                'title': 'Asphalt 8: Airborne - Update - Welcome to Dubai!',
-												[generic] Simplify playlist support (#2948)

											
										
										
											2014-08-22 16:19:56 +00:00
+								                'uploader': 'Gameloft',
 								                'uploader_id': 'gameloft',
-												[generic] Fix testcases

											
										
										
											2014-09-29 03:12:57 +00:00
+								                'upload_date': '20140828',
 								                'description': 'md5:c80da9ed3d83ae6d1876c834de03e1c4',
-												[generic] Simplify playlist support (#2948)

											
										
										
											2014-08-22 16:19:56 +00:00
+								            },
 								            'params': {
 								                'skip_download': True,
-												Add a _TEST_

											
										
										
											2014-05-21 09:55:37 +00:00
+								            }
-												[generic] Add support for camtasia videos (Fixes #3574)

											
										
										
											2014-08-24 00:02:17 +00:00
+								        },
-												[generic] Automatic detection of flow player and age_limit (Fixes #3576)

											
										
										
											2014-08-24 03:31:32 +00:00
+								        # Flowplayer
 								        {
 								            'url': 'http://www.handjobhub.com/video/busty-blonde-siri-tit-fuck-while-wank-6313.html',
 								            'md5': '9d65602bf31c6e20014319c7d07fba27',
 								            'info_dict': {
 								                'id': '5123ea6d5e5a7',
 								                'ext': 'mp4',
 								                'age_limit': 18,
 								                'uploader': 'www.handjobhub.com',
-												[generic] Fix test title

											
										
										
											2014-10-26 23:45:15 +00:00
+								                'title': 'Busty Blonde Siri Tit Fuck While Wank at HandjobHub.com',
-												[generic] Automatic detection of flow player and age_limit (Fixes #3576)

											
										
										
											2014-08-24 03:31:32 +00:00
+								            }
-												[generic] Fix rss under Python 2.x and move test to extractor

											
										
										
											2014-08-25 16:03:01 +00:00
+								        },
-												[mlb] Add support for embedded videos (Closes #3653)

											
										
										
											2014-09-02 13:19:28 +00:00
+								        # MLB embed
 								        {
 								            'url': 'http://umpire-empire.com/index.php/topic/58125-laz-decides-no-thats-low/',
 								            'md5': '96f09a37e44da40dd083e12d9a683327',
 								            'info_dict': {
 								                'id': '33322633',
 								                'ext': 'mp4',
 								                'title': 'Ump changes call to ball',
 								                'description': 'md5:71c11215384298a172a6dcb4c2e20685',
 								                'duration': 48,
 								                'timestamp': 1401537900,
 								                'upload_date': '20140531',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											2017-01-02 12:08:07 +00:00
+								                'thumbnail': r're:^https?://.*\.jpg$',
-												[mlb] Add support for embedded videos (Closes #3653)

											
										
										
											2014-09-02 13:19:28 +00:00
+								            },
 								        },
-												[extractor/generic] Add test for wistia standard embed

											
										
										
											2016-05-20 15:43:36 +00:00
+								        # Wistia standard embed (async)
 								        {
 								            'url': 'https://www.getdrip.com/university/brennan-dunn-drip-workshop/',
 								            'info_dict': {
 								                'id': '807fafadvk',
 								                'ext': 'mp4',
 								                'title': 'Drip Brennan Dunn Workshop',
 								                'description': 'a JV Webinars video from getdrip-1',
 								                'duration': 4986.95,
 								                'timestamp': 1463607249,
-												[extractor/generic] Remove generic id and title from wistia extractionand update tests

											
										
										
											2016-05-20 15:55:35 +00:00
+								                'upload_date': '20160518',
-												[extractor/generic] Add test for wistia standard embed

											
										
										
											2016-05-20 15:43:36 +00:00
+								            },
 								            'params': {
 								                'skip_download': True,
-												[extractor/wistia] Match IDs in embed URLs (#4990)

Closes #4985
Authored by: bashonly
											
										
										
											2022-09-21 20:53:08 +00:00
+								            },
 								            'skip': 'webpage 404 not found',
 								        },
-												[generic] Allow soundcloud embeds with additional attributes

											
										
										
											2014-10-29 19:27:58 +00:00
+								        # Soundcloud embed
 								        {
 								            'url': 'http://nakedsecurity.sophos.com/2014/10/29/sscc-171-are-you-sure-that-1234-is-a-bad-password-podcast/',
 								            'info_dict': {
 								                'id': '174391317',
 								                'ext': 'mp3',
 								                'description': 'md5:ff867d6b555488ad3c52572bb33d432c',
 								                'uploader': 'Sophos Security',
 								                'title': 'Chet Chat 171 - Oct 29, 2014',
 								                'upload_date': '20141029',
 								            }
-												[generic] Add support for livestream embeds (Fixes #4185)

											
										
										
											2014-11-13 15:12:51 +00:00
+								        },
-												[extractor/generic] Add test for #10179

											
										
										
											2016-07-28 15:20:08 +00:00
+								        # Soundcloud multiple embeds
 								        {
 								            'url': 'http://www.guitarplayer.com/lessons/1014/legato-workout-one-hour-to-more-fluid-performance---tab/52809',
 								            'info_dict': {
 								                'id': '52809',
 								                'title': 'Guitar Essentials: Legato Workout—One-Hour to Fluid Performance  | TAB + AUDIO',
 								            },
 								            'playlist_mincount': 7,
 								        },
-												[tunein] Add support for embeds (closes #11579)

											
										
										
											2017-01-02 18:45:59 +00:00
+								        # TuneIn station embed
 								        {
 								            'url': 'http://radiocnrv.com/promouvoir-radio-cnrv/',
 								            'info_dict': {
 								                'id': '204146',
 								                'ext': 'mp3',
 								                'title': 'CNRV',
 								                'location': 'Paris, France',
 								                'is_live': True,
 								            },
 								            'params': {
 								                # Live stream
 								                'skip_download': True,
 								            },
 								        },
-												[generic] Add support for livestream embeds (Fixes #4185)

											
										
										
											2014-11-13 15:12:51 +00:00
+								        # Livestream embed
 								        {
 								            'url': 'http://www.esa.int/Our_Activities/Space_Science/Rosetta/Philae_comet_touch-down_webcast',
 								            'info_dict': {
 								                'id': '67864563',
 								                'ext': 'flv',
 								                'upload_date': '20141112',
 								                'title': 'Rosetta #CometLanding webcast HL 10',
 								            }
 								        },
-												[generic] Improve Livestream detection (closes #2234)

											
										
										
											2016-05-22 17:39:09 +00:00
+								        # Another Livestream embed, without 'new.' in URL
 								        {
 								            'url': 'https://www.freespeech.org/',
 								            'info_dict': {
 								                'id': '123537347',
 								                'ext': 'mp4',
 								                'title': 're:^FSTV [0-9]{4}-[0-9]{2}-[0-9]{2} [0-9]{2}:[0-9]{2}$',
 								            },
 								            'params': {
 								                # Live stream
 								                'skip_download': True,
 								            },
 								        },
-												[generic] Add support for LazyYT embeds (Fixes #4306)

											
										
										
											2014-11-25 13:34:19 +00:00
+								        # LazyYT
 								        {
-												[generic] Replace LazyYT test with skiplagged

discourse.ubuntu.com has gone away; replace it with skiplagged.com.
It would be nice to have a non-frontpage URL that might be more stable,
though I don't have one. Maybe this should move to html
in test/test_InfoExtractor.py?

											
										
										
											2017-03-20 00:52:25 +00:00
+								            'url': 'https://skiplagged.com/',
-												[generic] Add support for LazyYT embeds (Fixes #4306)

											
										
										
											2014-11-25 13:34:19 +00:00
+								            'info_dict': {
-												[generic] Replace LazyYT test with skiplagged

discourse.ubuntu.com has gone away; replace it with skiplagged.com.
It would be nice to have a non-frontpage URL that might be more stable,
though I don't have one. Maybe this should move to html
in test/test_InfoExtractor.py?

											
										
										
											2017-03-20 00:52:25 +00:00
+								                'id': 'skiplagged',
 								                'title': 'Skiplagged: The smart way to find cheap flights',
-												[generic] Add support for LazyYT embeds (Fixes #4306)

											
										
										
											2014-11-25 13:34:19 +00:00
+								            },
-												[generic] Replace LazyYT test with skiplagged

discourse.ubuntu.com has gone away; replace it with skiplagged.com.
It would be nice to have a non-frontpage URL that might be more stable,
though I don't have one. Maybe this should move to html
in test/test_InfoExtractor.py?

											
										
										
											2017-03-20 00:52:25 +00:00
+								            'playlist_mincount': 1,
 								            'add_ie': ['Youtube'],
-												[generic] Detect direct video links (Fixes #4149, #4313)

											
										
										
											2014-11-26 09:44:39 +00:00
+								        },
-												[cleanup] Remove dead extractors (#8604)

Closes #1609, Closes #3232, Closes #4763, Closes #6026, Closes #6322, Closes #7912
Authored by: seproDev
											
										
										
											2023-11-26 03:09:59 +00:00
+								        # Libsyn embed
-												[cinchcast] Add new extractor (Fixes #4428)

											
										
										
											2014-12-12 01:57:36 +00:00
+								        {
 								            'url': 'http://undergroundwellness.com/podcasts/306-5-steps-to-permanent-gut-healing/',
 								            'info_dict': {
-												[cleanup] Remove dead extractors (#8604)

Closes #1609, Closes #3232, Closes #4763, Closes #6026, Closes #6322, Closes #7912
Authored by: seproDev
											
										
										
											2023-11-26 03:09:59 +00:00
+								                'id': '3793998',
-												[cinchcast] Add new extractor (Fixes #4428)

											
										
										
											2014-12-12 01:57:36 +00:00
+								                'ext': 'mp3',
 								                'upload_date': '20141126',
-												[cleanup] Remove dead extractors (#8604)

Closes #1609, Closes #3232, Closes #4763, Closes #6026, Closes #6322, Closes #7912
Authored by: seproDev
											
										
										
											2023-11-26 03:09:59 +00:00
+								                'title': 'Underground Wellness Radio - Jack Tips: 5 Steps to Permanent Gut Healing',
 								                'thumbnail': 'https://assets.libsyn.com/secure/item/3793998/?height=90&width=90',
 								                'duration': 3989.0,
-												[cinchcast] Add new extractor (Fixes #4428)

											
										
										
											2014-12-12 01:57:36 +00:00
+								            }
 								        },
-												[generic] Add support for Cinerama player (Fixes #4752)

											
										
										
											2015-01-23 11:00:25 +00:00
+								        # Cinerama player
 								        {
 								            'url': 'http://www.abc.net.au/7.30/content/2015/s4164797.htm',
 								            'info_dict': {
 								                'id': '730m_DandD_1901_512k',
 								                'ext': 'mp4',
 								                'uploader': 'www.abc.net.au',
 								                'title': 'Game of Thrones with dice - Dungeons and Dragons fantasy role-playing game gets new life - 19/01/2015',
 								            }
-												fixed viddler support - needed a Referer header; also added a viddler
generic extractor

											
										
										
											2015-01-28 05:08:19 +00:00
+								        },
 								        # embedded viddler video
 								        {
 								            'url': 'http://deadspin.com/i-cant-stop-watching-john-wall-chop-the-nuggets-with-th-1681801597',
 								            'info_dict': {
 								                'id': '4d03aad9',
 								                'ext': 'mp4',
 								                'uploader': 'deadspin',
 								                'title': 'WALL-TO-GORTAT',
 								                'timestamp': 1422285291,
 								                'upload_date': '20150126',
 								            },
 								            'add_ie': ['Viddler'],
-												[generic] Add support for jwPlayer YouTube videos

This makes nationalarchives.gov.uk work (Fixes #4907, fixes #4876)

											
										
										
											2015-02-09 09:42:25 +00:00
+								        },
-												[extractor/generic] Add test for Libsyn embed

											
										
										
											2015-03-22 02:20:27 +00:00
+								        # Libsyn embed
 								        {
 								            'url': 'http://thedailyshow.cc.com/podcast/episodetwelve',
 								            'info_dict': {
 								                'id': '3377616',
 								                'ext': 'mp3',
 								                'title': "The Daily Show Podcast without Jon Stewart - Episode 12: Bassem Youssef: Egypt's Jon Stewart",
 								                'description': 'md5:601cb790edd05908957dae8aaa866465',
 								                'upload_date': '20150220',
 								            },
-												[generic] Skip an invalid test

											
										
										
											2016-07-26 05:16:04 +00:00
+								            'skip': 'All The Daily Show URLs now redirect to http://www.cc.com/shows/',
-												[extractor/generic] Add test for Libsyn embed

											
										
										
											2015-03-22 02:20:27 +00:00
+								        },
-												[generic] Add support for jwPlayer YouTube videos

This makes nationalarchives.gov.uk work (Fixes #4907, fixes #4876)

											
										
										
											2015-02-09 09:42:25 +00:00
+								        # jwplayer YouTube
 								        {
 								            'url': 'http://media.nationalarchives.gov.uk/index.php/webinar-using-discovery-national-archives-online-catalogue/',
 								            'info_dict': {
 								                'id': 'Mrj4DVp2zeA',
 								                'ext': 'mp4',
-												[generic] Correct test case

Video has been reuploaded / edited

											
										
										
											2015-02-19 01:00:50 +00:00
+								                'upload_date': '20150212',
-												[generic] Add support for jwPlayer YouTube videos

This makes nationalarchives.gov.uk work (Fixes #4907, fixes #4876)

											
										
										
											2015-02-09 09:42:25 +00:00
+								                'uploader': 'The National Archives UK',
-												[generic] fix some of the tests

											
										
										
											2017-10-12 16:14:43 +00:00
+								                'description': 'md5:8078af856dca76edc42910b61273dbbf',
-												[generic] Add support for jwPlayer YouTube videos

This makes nationalarchives.gov.uk work (Fixes #4907, fixes #4876)

											
										
										
											2015-02-09 09:42:25 +00:00
+								                'uploader_id': 'NationalArchives08',
 								                'title': 'Webinar: Using Discovery, The National Archives’ online catalogue',
 								            },
-												[rtlnl|generic] Add support for rtl.nl embeds (Fixes #4959)

											
										
										
											2015-02-16 14:45:01 +00:00
+								        },
-												[extractor/generic] Add test for #11993 and more metadata for rtmp

											
										
										
											2017-02-06 16:31:58 +00:00
+								        # jwplayer rtmp
 								        {
-												[Generic] Update test 69 (suffolk/sjc)

suffolk.edu/sjc => suffolk.edu/sjc/live.php

Unfortunately it only transmits video a few mornings per month, so
leaving the 'skip' is probably appropriate. Updating the 'skip' to
include the calendar information, though.

											
										
										
											2017-11-22 16:56:47 +00:00
+								            'url': 'http://www.suffolk.edu/sjc/live.php',
-												[extractor/generic] Add test for #11993 and more metadata for rtmp

											
										
										
											2017-02-06 16:31:58 +00:00
+								            'info_dict': {
-												[Generic] Update test 69 (suffolk/sjc)

suffolk.edu/sjc => suffolk.edu/sjc/live.php

Unfortunately it only transmits video a few mornings per month, so
leaving the 'skip' is probably appropriate. Updating the 'skip' to
include the calendar information, though.

											
										
										
											2017-11-22 16:56:47 +00:00
+								                'id': 'live',
-												[extractor/generic] Add test for #11993 and more metadata for rtmp

											
										
										
											2017-02-06 16:31:58 +00:00
+								                'ext': 'flv',
 								                'title': 'Massachusetts Supreme Judicial Court Oral Arguments',
 								                'uploader': 'www.suffolk.edu',
 								            },
 								            'params': {
 								                'skip_download': True,
-												[generic] fix some of the tests

											
										
										
											2017-10-12 16:14:43 +00:00
+								            },
-												[Generic] Update test 69 (suffolk/sjc)

suffolk.edu/sjc => suffolk.edu/sjc/live.php

Unfortunately it only transmits video a few mornings per month, so
leaving the 'skip' is probably appropriate. Updating the 'skip' to
include the calendar information, though.

											
										
										
											2017-11-22 16:56:47 +00:00
+								            'skip': 'Only has video a few mornings per month, see http://www.suffolk.edu/sjc/',
-												[extractor/generic] Add test for #11993 and more metadata for rtmp

											
										
										
											2017-02-06 16:31:58 +00:00
+								        },
-												[generic] parse jwplayer with only the json URL
Closes #1476

											
										
										
											2021-10-29 20:23:28 +00:00
+								        # jwplayer with only the json URL
 								        {
 								            'url': 'https://www.hollywoodreporter.com/news/general-news/dunkirk-team-reveals-what-christopher-nolan-said-oscar-win-meet-your-oscar-winner-1092454',
 								            'info_dict': {
 								                'id': 'TljWkvWH',
 								                'ext': 'mp4',
 								                'upload_date': '20180306',
 								                'title': 'md5:91eb1862f6526415214f62c00b453936',
 								                'description': 'md5:73048ae50ae953da10549d1d2fe9b3aa',
 								                'timestamp': 1520367225,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[generic] Try parsing JWPlayer embedded videos (closes #12030)

											
										
										
											2017-02-16 15:42:36 +00:00
+								        # Complex jwplayer
 								        {
 								            'url': 'http://www.indiedb.com/games/king-machine/videos',
 								            'info_dict': {
 								                'id': 'videos',
 								                'ext': 'mp4',
 								                'title': 'king machine trailer 1',
-												[generic] fix some of the tests

											
										
										
											2017-10-12 16:14:43 +00:00
+								                'description': 'Browse King Machine videos & audio for sweet media. Your eyes will thank you.',
-												[generic] Try parsing JWPlayer embedded videos (closes #12030)

											
										
										
											2017-02-16 15:42:36 +00:00
+								                'thumbnail': r're:^https?://.*\.jpg$',
 								            },
 								        },
-												[generic] Add support for Video.js embeds

											
										
										
											2017-09-27 17:29:42 +00:00
+								        {
-												[extractor/generic] Attempt to detect live HLS (#6775)

* Extract duration for non-live generic HLS videos
* Add extractor-arg `is_live` to bypass live HLS check

Closes #6705
Authored by: bashonly
											
										
										
											2023-04-13 19:36:06 +00:00
+								            # Youtube embed, formerly: Video.js embed, multiple formats
-												[generic] Add support for Video.js embeds

											
										
										
											2017-09-27 17:29:42 +00:00
+								            'url': 'http://ortcam.com/solidworks-урок-6-настройка-чертежа_33f9b7351.html',
 								            'info_dict': {
 								                'id': 'yygqldloqIk',
 								                'ext': 'mp4',
 								                'title': 'SolidWorks. Урок 6 Настройка чертежа',
 								                'description': 'md5:baf95267792646afdbf030e4d06b2ab3',
 								                'upload_date': '20130314',
 								                'uploader': 'PROстое3D',
 								                'uploader_id': 'PROstoe3D',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[generic] Add support for single format Video.js embeds (closes #14371)

											
										
										
											2017-10-01 00:01:21 +00:00
+								        {
 								            # Video.js embed, single format
 								            'url': 'https://www.vooplayer.com/v3/watch/watch.php?v=NzgwNTg=',
 								            'info_dict': {
 								                'id': 'watch',
 								                'ext': 'mp4',
 								                'title': 'Step 1 -  Good Foundation',
 								                'description': 'md5:d1e7ff33a29fc3eb1673d6c270d344f4',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[extractor/generic] Attempt to detect live HLS (#6775)

* Extract duration for non-live generic HLS videos
* Add extractor-arg `is_live` to bypass live HLS check

Closes #6705
Authored by: bashonly
											
										
										
											2023-04-13 19:36:06 +00:00
+								            'skip': '404 Not Found',
-												[generic] Add support for single format Video.js embeds (closes #14371)

											
										
										
											2017-10-01 00:01:21 +00:00
+								        },
-												[rtlnl|generic] Add support for rtl.nl embeds (Fixes #4959)

											
										
										
											2015-02-16 14:45:01 +00:00
+								        # rtl.nl embed
 								        {
 								            'url': 'http://www.rtlnieuws.nl/nieuws/buitenland/aanslagen-kopenhagen',
 								            'playlist_mincount': 5,
 								            'info_dict': {
 								                'id': 'aanslagen-kopenhagen',
-												[generic] fix some of the tests

											
										
										
											2017-10-12 16:14:43 +00:00
+								                'title': 'Aanslagen Kopenhagen',
-												[rtlnl|generic] Add support for rtl.nl embeds (Fixes #4959)

											
										
										
											2015-02-16 14:45:01 +00:00
+								            }
-												[generic] Add support for Zapiks embeds (#5014)

											
										
										
											2015-02-21 19:39:26 +00:00
+								        },
 								        # Zapiks embed
 								        {
 								            'url': 'http://www.skipass.com/news/116090-bon-appetit-s5ep3-baqueira-mi-cor.html',
 								            'info_dict': {
 								                'id': '118046',
 								                'ext': 'mp4',
 								                'title': 'EP3S5 - Bon Appétit - Baqueira Mi Corazon !',
 								            }
 								        },
-												[extractor/generic] Improve kaltura embeds support (Closes #6137)

											
										
										
											2015-07-02 15:39:46 +00:00
+								        # Kaltura embed (different embed code)
 								        {
 								            'url': 'http://www.premierchristianradio.com/Shows/Saturday/Unbelievable/Conference-Videos/Os-Guinness-Is-It-Fools-Talk-Unbelievable-Conference-2014',
 								            'info_dict': {
 								                'id': '1_a52wc67y',
 								                'ext': 'flv',
 								                'upload_date': '20150127',
 								                'uploader_id': 'PremierMedia',
 								                'timestamp': int,
 								                'title': 'Os Guinness // Is It Fools Talk? // Unbelievable? Conference 2014',
 								            },
 								        },
-												[generic] Improve Kaltura detection

Closes #4004

											
										
										
											2016-06-01 10:37:34 +00:00
+								        # Kaltura embed with single quotes
 								        {
 								            'url': 'http://fod.infobase.com/p_ViewPlaylist.aspx?AssignmentID=NUN8ZY',
 								            'info_dict': {
 								                'id': '0_izeg5utt',
 								                'ext': 'mp4',
 								                'title': '35871',
 								                'timestamp': 1355743100,
 								                'upload_date': '20121217',
-												[kaltura] Improve embeds detection (closes #16201)

											
										
										
											2018-04-17 18:24:02 +00:00
+								                'uploader_id': 'cplapp@learn360.com',
-												[generic] Improve Kaltura detection

Closes #4004

											
										
										
											2016-06-01 10:37:34 +00:00
+								            },
 								            'add_ie': ['Kaltura'],
 								        },
-												[extractor/generic] Improve kaltura embed detection (Closes #9911)

											
										
										
											2016-06-26 21:11:53 +00:00
+								        {
 								            # Kaltura embedded via quoted entry_id
 								            'url': 'https://www.oreilly.com/ideas/my-cloud-makes-pretty-pictures',
 								            'info_dict': {
 								                'id': '0_utuok90b',
 								                'ext': 'mp4',
 								                'title': '06_matthew_brender_raj_dutt',
 								                'timestamp': 1466638791,
 								                'upload_date': '20160622',
 								            },
 								            'add_ie': ['Kaltura'],
 								            'expected_warnings': [
 								                'Could not send HEAD request'
 								            ],
 								            'params': {
 								                'skip_download': True,
 								            }
 								        },
-												[kaltura] Improve widget ID extraction (closes #11480)

											
										
										
											2016-12-20 10:45:52 +00:00
+								        {
 								            # Kaltura embedded, some fileExt broken (#11480)
 								            'url': 'http://www.cornell.edu/video/nima-arkani-hamed-standard-models-of-particle-physics',
 								            'info_dict': {
 								                'id': '1_sgtvehim',
 								                'ext': 'mp4',
 								                'title': 'Our "Standard Models" of particle physics and cosmology',
 								                'description': 'md5:67ea74807b8c4fea92a6f38d6d323861',
 								                'timestamp': 1321158993,
 								                'upload_date': '20111113',
 								                'uploader_id': 'kps1',
 								            },
 								            'add_ie': ['Kaltura'],
 								        },
-												[kaltura] Add support for iframe embeds


											
										
										
											2017-04-08 09:40:57 +00:00
+								        {
 								            # Kaltura iframe embed
 								            'url': 'http://www.gsd.harvard.edu/event/i-m-pei-a-centennial-celebration/',
 								            'md5': 'ae5ace8eb09dc1a35d03b579a9c2cc44',
 								            'info_dict': {
 								                'id': '0_f2cfbpwy',
 								                'ext': 'mp4',
 								                'title': 'I. M. Pei: A Centennial Celebration',
 								                'description': 'md5:1db8f40c69edc46ca180ba30c567f37c',
 								                'upload_date': '20170403',
 								                'uploader_id': 'batchUser',
 								                'timestamp': 1491232186,
 								            },
 								            'add_ie': ['Kaltura'],
 								        },
-												[kaltura] Improve iframe embeds detection (closes #16337)

											
										
										
											2018-04-30 20:09:04 +00:00
+								        {
 								            # Kaltura iframe embed, more sophisticated
 								            'url': 'http://www.cns.nyu.edu/~eero/math-tools/Videos/lecture-05sep2017.html',
 								            'info_dict': {
 								                'id': '1_9gzouybz',
 								                'ext': 'mp4',
 								                'title': 'lecture-05sep2017',
 								                'description': 'md5:40f347d91fd4ba047e511c5321064b49',
 								                'upload_date': '20170913',
 								                'uploader_id': 'eps2',
 								                'timestamp': 1505340777,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								            'add_ie': ['Kaltura'],
 								        },
-												[kaltura] Improve embeds detection (closes #16201)

											
										
										
											2018-04-17 18:24:02 +00:00
+								        {
 								            # meta twitter:player
 								            'url': 'http://thechive.com/2017/12/08/all-i-want-for-christmas-is-more-twerk/',
 								            'info_dict': {
 								                'id': '0_01b42zps',
 								                'ext': 'mp4',
 								                'title': 'Main Twerk (Video)',
 								                'upload_date': '20171208',
 								                'uploader_id': 'sebastian.salinas@thechive.com',
 								                'timestamp': 1512713057,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								            'add_ie': ['Kaltura'],
 								        },
-												[generic] Add tests for #13557

											
										
										
											2017-07-09 09:02:38 +00:00
+								        # referrer protected EaglePlatform embed
 								        {
 								            'url': 'https://tvrain.ru/lite/teleshow/kak_vse_nachinalos/namin-418921/',
 								            'info_dict': {
 								                'id': '582306',
 								                'ext': 'mp4',
 								                'title': 'Стас Намин: «Мы нарушили девственность Кремля»',
 								                'thumbnail': r're:^https?://.*\.jpg$',
 								                'duration': 3382,
 								                'view_count': int,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[eagleplatform] Add support for embeds

											
										
										
											2015-03-07 16:22:57 +00:00
+								        },
-												[eagleplatform] Add support for referrer protected videos (closes #13557)

											
										
										
											2017-07-09 08:57:33 +00:00
+								        # ClipYou (EaglePlatform) embed (custom URL)
-												[eagleplatform] Add support for ClipYou embeds

											
										
										
											2015-03-07 16:34:44 +00:00
+								        {
 								            'url': 'http://muz-tv.ru/play/7129/',
-												[eagleplatform] Checking direct HTTP links

Sometimes they fail with 404

											
										
										
											2016-04-25 14:48:17 +00:00
+								            # Not checking MD5 as sometimes the direct HTTP link results in 404 and HLS is used
-												[eagleplatform] Add support for ClipYou embeds

											
										
										
											2015-03-07 16:34:44 +00:00
+								            'info_dict': {
 								                'id': '12820',
 								                'ext': 'mp4',
 								                'title': "'O Sole Mio",
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											2017-01-02 12:08:07 +00:00
+								                'thumbnail': r're:^https?://.*\.jpg$',
-												[eagleplatform] Add support for ClipYou embeds

											
										
										
											2015-03-07 16:34:44 +00:00
+								                'duration': 216,
 								                'view_count': int,
 								            },
-												[generic] Add tests for #13557

											
										
										
											2017-07-09 09:02:38 +00:00
+								            'params': {
 								                'skip_download': True,
 								            },
-												[generic] fix some of the tests

											
										
										
											2017-10-12 16:14:43 +00:00
+								            'skip': 'This video is unavailable.',
-												[eagleplatform] Add support for ClipYou embeds

											
										
										
											2015-03-07 16:34:44 +00:00
+								        },
-												[pladform] Add support for embeds

											
										
										
											2015-03-08 12:07:10 +00:00
+								        # Pladform embed
 								        {
 								            'url': 'http://muz-tv.ru/kinozal/view/7400/',
 								            'info_dict': {
 								                'id': '100183293',
 								                'ext': 'mp4',
-												[generic] Update pladform embed test

											
										
										
											2015-04-16 15:37:15 +00:00
+								                'title': 'Тайны перевала Дятлова • 1 серия 2 часть',
-												[pladform] Add support for embeds

											
										
										
											2015-03-08 12:07:10 +00:00
+								                'description': 'Документальный сериал-расследование одной из самых жутких тайн ХХ века',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											2017-01-02 12:08:07 +00:00
+								                'thumbnail': r're:^https?://.*\.jpg$',
-												[pladform] Add support for embeds

											
										
										
											2015-03-08 12:07:10 +00:00
+								                'duration': 694,
 								                'age_limit': 0,
 								            },
-												[generic] fix some of the tests

											
										
										
											2017-10-12 16:14:43 +00:00
+								            'skip': 'HTTP Error 404: Not Found',
-												[pladform] Add support for embeds

											
										
										
											2015-03-08 12:07:10 +00:00
+								        },
-												[generic] Add test for playwire embed (#5430)

											
										
										
											2015-04-15 16:13:01 +00:00
+								        # Playwire embed
 								        {
 								            'url': 'http://www.cinemablend.com/new/First-Joe-Dirt-2-Trailer-Teaser-Stupid-Greatness-70874.html',
 								            'info_dict': {
 								                'id': '3519514',
 								                'ext': 'mp4',
 								                'title': 'Joe Dirt 2 Beautiful Loser Teaser Trailer',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											2017-01-02 12:08:07 +00:00
+								                'thumbnail': r're:^https?://.*\.png$',
-												[generic] Add test for playwire embed (#5430)

											
										
										
											2015-04-15 16:13:01 +00:00
+								                'duration': 45.115,
 								            },
 								        },
-												[generic] Add tests for Crooks and Liars embeds

											
										
										
											2015-04-11 14:26:42 +00:00
+								        # Crooks and Liars embed
 								        {
 								            'url': 'http://crooksandliars.com/2015/04/fox-friends-says-protecting-atheists',
 								            'info_dict': {
 								                'id': '8RUoRhRi',
 								                'ext': 'mp4',
 								                'title': "Fox & Friends Says Protecting Atheists From Discrimination Is Anti-Christian!",
 								                'description': 'md5:e1a46ad1650e3a5ec7196d432799127f',
 								                'timestamp': 1428207000,
 								                'upload_date': '20150405',
 								                'uploader': 'Heather',
 								            },
 								        },
 								        # Crooks and Liars external embed
 								        {
 								            'url': 'http://theothermccain.com/2010/02/02/video-proves-that-bill-kristol-has-been-watching-glenn-beck/comment-page-1/',
 								            'info_dict': {
 								                'id': 'MTE3MjUtMzQ2MzA',
 								                'ext': 'mp4',
 								                'title': 'md5:5e3662a81a4014d24c250d76d41a08d5',
 								                'description': 'md5:9b8e9542d6c3c5de42d6451b7d780cec',
 								                'timestamp': 1265032391,
 								                'upload_date': '20100201',
 								                'uploader': 'Heather',
 								            },
 								        },
-												[generic] Add working NBC Sports vplayer test

											
										
										
											2015-03-31 14:11:14 +00:00
+								        # NBC Sports vplayer embed
-												[NBC/ThePlatform/Generic] Add a generic detector for NBCSportsVPlayer and enhance error detection in ThePlatformIE

											
										
										
											2015-03-30 19:36:09 +00:00
+								        {
-												[generic] Add working NBC Sports vplayer test

											
										
										
											2015-03-31 14:11:14 +00:00
+								            'url': 'http://www.riderfans.com/forum/showthread.php?121827-Freeman&s=e98fa1ea6dc08e886b1678d35212494a',
-												[NBC/ThePlatform/Generic] Add a generic detector for NBCSportsVPlayer and enhance error detection in ThePlatformIE

											
										
										
											2015-03-30 19:36:09 +00:00
+								            'info_dict': {
-												[generic] Add working NBC Sports vplayer test

											
										
										
											2015-03-31 14:11:14 +00:00
+								                'id': 'ln7x1qSThw4k',
 								                'ext': 'flv',
 								                'title': "PFT Live: New leader in the 'new-look' defense",
 								                'description': 'md5:65a19b4bbfb3b0c0c5768bed1dfad74e',
-												[ThePlatform] Fix tests failed since 79ba9140dc8fcf5883b7473596e8f20cba6b479f

											
										
										
											2016-04-24 12:44:52 +00:00
+								                'uploader': 'NBCU-SPORTS',
 								                'upload_date': '20140107',
 								                'timestamp': 1389118457,
-												[NBC/ThePlatform/Generic] Add a generic detector for NBCSportsVPlayer and enhance error detection in ThePlatformIE

											
										
										
											2015-03-30 19:36:09 +00:00
+								            },
-												[generic] fix some of the tests

											
										
										
											2017-10-12 16:14:43 +00:00
+								            'skip': 'Invalid Page URL',
-												[udn] Add new extractor

											
										
										
											2015-04-08 09:26:51 +00:00
+								        },
-												[generic] Detect NBC News embeds

											
										
										
											2016-06-10 05:32:59 +00:00
+								        # NBC News embed
 								        {
 								            'url': 'http://www.vulture.com/2016/06/letterman-couldnt-care-less-about-late-night.html',
 								            'md5': '1aa589c675898ae6d37a17913cf68d66',
 								            'info_dict': {
-												[generic] fix some of the tests

											
										
										
											2017-10-12 16:14:43 +00:00
+								                'id': 'x_dtl_oa_LettermanliftPR_160608',
-												[generic] Detect NBC News embeds

											
										
										
											2016-06-10 05:32:59 +00:00
+								                'ext': 'mp4',
-												[generic] fix some of the tests

											
										
										
											2017-10-12 16:14:43 +00:00
+								                'title': 'David Letterman: A Preview',
-												[generic] Detect NBC News embeds

											
										
										
											2016-06-10 05:32:59 +00:00
+								                'description': 'A preview of Tom Brokaw\'s interview with David Letterman as part of the On Assignment series powered by Dateline. Airs Sunday June 12 at 7/6c.',
-												[generic] fix some of the tests

											
										
										
											2017-10-12 16:14:43 +00:00
+								                'upload_date': '20160609',
 								                'timestamp': 1465431544,
 								                'uploader': 'NBCU-NEWS',
-												[generic] Detect NBC News embeds

											
										
										
											2016-06-10 05:32:59 +00:00
+								            },
 								        },
-												[udn] Add new extractor

											
										
										
											2015-04-08 09:26:51 +00:00
+								        # UDN embed
 								        {
-												[generic] Update the UDNEmbed test case

											
										
										
											2016-06-01 11:23:44 +00:00
+								            'url': 'https://video.udn.com/news/300346',
-												[generic] Fix test generic_51

The website replaced the original video with a new one

											
										
										
											2015-04-14 05:10:10 +00:00
+								            'md5': 'fd2060e988c326991037b9aff9df21a6',
-												[udn] Add new extractor

											
										
										
											2015-04-08 09:26:51 +00:00
+								            'info_dict': {
-												[generic] Fix test generic_51

The website replaced the original video with a new one

											
										
										
											2015-04-14 05:10:10 +00:00
+								                'id': '300346',
-												[udn] Add new extractor

											
										
										
											2015-04-08 09:26:51 +00:00
+								                'ext': 'mp4',
-												[generic] Fix test generic_51

The website replaced the original video with a new one

											
										
										
											2015-04-14 05:10:10 +00:00
+								                'title': '中一中男師變性 全校師生力挺',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											2017-01-02 12:08:07 +00:00
+								                'thumbnail': r're:^https?://.*\.jpg$',
-												[generic] Update the UDNEmbed test case

											
										
										
											2016-06-01 11:23:44 +00:00
+								            },
 								            'params': {
 								                # m3u8 download
 								                'skip_download': True,
 								            },
-												[generic] fix some of the tests

											
										
										
											2017-10-12 16:14:43 +00:00
+								            'expected_warnings': ['Failed to parse JSON Expecting value'],
-												[generic] Support another type of Ooyala embedded video

											
										
										
											2015-04-14 04:45:43 +00:00
+								        },
-												[kinja] add support for Kinja embeds

closes #5756
closes #11282
closes #22237
closes #22384

											
										
										
											2019-11-06 18:56:10 +00:00
+								        # Kinja embed
-												[extractor/generic] Add test for OnionStudios embeds

											
										
										
											2015-06-24 17:23:16 +00:00
+								        {
 								            'url': 'http://www.clickhole.com/video/dont-understand-bitcoin-man-will-mumble-explanatio-2537',
 								            'info_dict': {
-												[kinja] add support for Kinja embeds

closes #5756
closes #11282
closes #22237
closes #22384

											
										
										
											2019-11-06 18:56:10 +00:00
+								                'id': '106351',
-												[extractor/generic] Add test for OnionStudios embeds

											
										
										
											2015-06-24 17:23:16 +00:00
+								                'ext': 'mp4',
 								                'title': 'Don’t Understand Bitcoin? This Man Will Mumble An Explanation At You',
-												[kinja] add support for Kinja embeds

closes #5756
closes #11282
closes #22237
closes #22384

											
										
										
											2019-11-06 18:56:10 +00:00
+								                'description': 'Migrated from OnionStudios',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											2017-01-02 12:08:07 +00:00
+								                'thumbnail': r're:^https?://.*\.jpe?g$',
-												[kinja] add support for Kinja embeds

closes #5756
closes #11282
closes #22237
closes #22384

											
										
										
											2019-11-06 18:56:10 +00:00
+								                'uploader': 'clickhole',
 								                'upload_date': '20150527',
 								                'timestamp': 1432744860,
-												[extractor/generic] Add test for OnionStudios embeds

											
										
										
											2015-06-24 17:23:16 +00:00
+								            }
 								        },
-												[extractor/generic] Add test for snagfilms embeds

											
										
										
											2015-06-27 12:28:10 +00:00
+								        # SnagFilms embed
 								        {
 								            'url': 'http://whilewewatch.blogspot.ru/2012/06/whilewewatch-whilewewatch-gripping.html',
 								            'info_dict': {
 								                'id': '74849a00-85a9-11e1-9660-123139220831',
 								                'ext': 'mp4',
 								                'title': '#whilewewatch',
 								            }
 								        },
-												[generic/adobetv] Support AdobeTVVideo embeds (#6039)

											
										
										
											2015-06-22 07:02:53 +00:00
+								        # AdobeTVVideo embed
 								        {
 								            'url': 'https://helpx.adobe.com/acrobat/how-to/new-experience-acrobat-dc.html?set=acrobat--get-started--essential-beginners',
 								            'md5': '43662b577c018ad707a63766462b1e87',
 								            'info_dict': {
 								                'id': '2456',
 								                'ext': 'mp4',
 								                'title': 'New experience with Acrobat DC',
 								                'description': 'New experience with Acrobat DC',
 								                'duration': 248.667,
 								            },
-												[generic] Add test for screenwavemedia embed

											
										
										
											2015-08-29 13:12:38 +00:00
+								        },
-												[arte.tv:embed] Extended support (#2620)

											
										
										
											2016-04-11 11:17:11 +00:00
+								        # Another form of arte.tv embed
 								        {
 								            'url': 'http://www.tv-replay.fr/redirection/09-04-16/arte-reportage-arte-11508975.html',
 								            'md5': '850bfe45417ddf221288c88a0cffe2e2',
 								            'info_dict': {
 								                'id': '030273-562_PLUS7-F',
 								                'ext': 'mp4',
 								                'title': 'ARTE Reportage - Nulle part, en France',
 								                'description': 'md5:e3a0e8868ed7303ed509b9e3af2b870d',
 								                'upload_date': '20160409',
 								            },
 								        },
-												[generic] Eliminate duplicated video URLs (closes #6562)

											
										
										
											2016-05-22 14:22:27 +00:00
+								        # Duplicated embedded video URLs
 								        {
 								            'url': 'http://www.hudl.com/athlete/2538180/highlights/149298443',
 								            'info_dict': {
 								                'id': '149298443_480_16c25b74_2',
 								                'ext': 'mp4',
 								                'title': 'vs. Blue Orange Spring Game',
 								                'uploader': 'www.hudl.com',
 								            },
 								        },
-												[extractor/generic] Change twitter:player embeds priority to lowest (Closes #10090)

											
										
										
											2016-07-16 08:59:43 +00:00
+								        # twitter:player:stream embed
 								        {
 								            'url': 'http://www.rtl.be/info/video/589263.aspx?CategoryID=288',
 								            'info_dict': {
 								                'id': 'master',
 								                'ext': 'mp4',
 								                'title': 'Une nouvelle espèce de dinosaure découverte en Argentine',
 								                'uploader': 'www.rtl.be',
 								            },
 								            'params': {
 								                # m3u8 downloads
 								                'skip_download': True,
 								            },
 								        },
-												[generic] add generic support for twitter:player embeds

											
										
										
											2016-06-30 11:01:30 +00:00
+								        # twitter:player embed
 								        {
 								            'url': 'http://www.theatlantic.com/video/index/484130/what-do-black-holes-sound-like/',
 								            'md5': 'a3e0df96369831de324f0778e126653c',
 								            'info_dict': {
 								                'id': '4909620399001',
 								                'ext': 'mp4',
 								                'title': 'What Do Black Holes Sound Like?',
 								                'description': 'what do black holes sound like',
 								                'upload_date': '20160524',
 								                'uploader_id': '29913724001',
 								                'timestamp': 1464107587,
 								                'uploader': 'TheAtlantic',
 								            },
-												[extractor/brightcove] Add `BrightcoveNewBaseIE` and fix embed extraction (#5558)

* Move Brightcove embed extraction and tests into the IEs
* Split `BrightcoveNewBaseIE` from `BrightcoveNewIE`
* Fix bug in ade1fa70cbaaaadaa4772e5f0564870cea3167ef with the "wrong" spelling of `referrer` being smuggled

Closes #5539
											
										
										
											2022-11-17 19:11:35 +00:00
+								            'skip': 'Private Youtube video',
-												[facebook] Improve Facebook embedded detection

Related to #9938.

Another example comes from 9834872bf63b4e03b66c5e3b8f306556e735d8c5.

											
										
										
											2016-07-02 13:33:23 +00:00
+								        },
 								        # Facebook <iframe> embed
 								        {
 								            'url': 'https://www.hostblogger.de/blog/archives/6181-Auto-jagt-Betonmischer.html',
-												[generic] Add MD5 checksums

											
										
										
											2016-07-02 13:57:06 +00:00
+								            'md5': 'fbcde74f534176ecb015849146dd3aee',
-												[facebook] Improve Facebook embedded detection

Related to #9938.

Another example comes from 9834872bf63b4e03b66c5e3b8f306556e735d8c5.

											
										
										
											2016-07-02 13:33:23 +00:00
+								            'info_dict': {
 								                'id': '599637780109885',
 								                'ext': 'mp4',
 								                'title': 'Facebook video #599637780109885',
 								            },
 								        },
-												[facebook] Add test for plugin video embed (#13493)

											
										
										
											2017-06-27 15:36:54 +00:00
+								        # Facebook <iframe> embed, plugin video
 								        {
 								            'url': 'http://5pillarsuk.com/2017/06/07/tariq-ramadan-disagrees-with-pr-exercise-by-imams-refusing-funeral-prayers-for-london-attackers/',
 								            'info_dict': {
 								                'id': '1754168231264132',
 								                'ext': 'mp4',
 								                'title': 'About the Imams and Religious leaders refusing to perform funeral prayers for...',
 								                'uploader': 'Tariq Ramadan (official)',
 								                'timestamp': 1496758379,
 								                'upload_date': '20170606',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[facebook] Improve Facebook embedded detection

Related to #9938.

Another example comes from 9834872bf63b4e03b66c5e3b8f306556e735d8c5.

											
										
										
											2016-07-02 13:33:23 +00:00
+								        # Facebook API embed
 								        {
 								            'url': 'http://www.lothype.com/blue-stars-2016-preview-standstill-full-show/',
-												[generic] Add MD5 checksums

											
										
										
											2016-07-02 13:57:06 +00:00
+								            'md5': 'a47372ee61b39a7b90287094d447d94e',
-												[facebook] Improve Facebook embedded detection

Related to #9938.

Another example comes from 9834872bf63b4e03b66c5e3b8f306556e735d8c5.

											
										
										
											2016-07-02 13:33:23 +00:00
+								            'info_dict': {
 								                'id': '10153467542406923',
 								                'ext': 'mp4',
 								                'title': 'Facebook video #10153467542406923',
 								            },
-												[generic] Support Wordpress "YouTube Video Importer" plugin

Closes #9938

											
										
										
											2016-07-02 13:50:17 +00:00
+								        },
 								        # Wordpress "YouTube Video Importer" plugin
 								        {
 								            'url': 'http://www.lothype.com/blue-devils-drumline-stanford-lot-2016/',
-												[generic] Add MD5 checksums

											
										
										
											2016-07-02 13:57:06 +00:00
+								            'md5': 'd16797741b560b485194eddda8121b48',
-												[generic] Support Wordpress "YouTube Video Importer" plugin

Closes #9938

											
										
										
											2016-07-02 13:50:17 +00:00
+								            'info_dict': {
 								                'id': 'HNTXWDXV9Is',
 								                'ext': 'mp4',
 								                'title': 'Blue Devils Drumline Stanford lot 2016',
 								                'upload_date': '20160627',
 								                'uploader_id': 'GENOCIDE8GENERAL10',
 								                'uploader': 'cylus cyrus',
 								            },
 								        },
-												[kaltura] add support videos stored on custom kaltura servers(closes #5557)

											
										
										
											2016-07-04 16:57:44 +00:00
+								        {
 								            # video stored on custom kaltura server
 								            'url': 'http://www.expansion.com/multimedia/videos.html?media=EQcM30NHIPv',
 								            'md5': '537617d06e64dfed891fa1593c4b30cc',
 								            'info_dict': {
 								                'id': '0_1iotm5bh',
 								                'ext': 'mp4',
 								                'title': 'Elecciones británicas: 5 lecciones para Rajoy',
 								                'description': 'md5:435a89d68b9760b92ce67ed227055f16',
 								                'uploader_id': 'videos.expansion@el-mundo.net',
 								                'upload_date': '20150429',
 								                'timestamp': 1430303472,
 								            },
 								            'add_ie': ['Kaltura'],
 								        },
-												[kaltura] Add support for multiple embeds on a webpage (closes #25523)

											
										
										
											2020-06-05 19:14:35 +00:00
+								        {
 								            # multiple kaltura embeds, nsfw
 								            'url': 'https://www.quartier-rouge.be/prive/femmes/kamila-avec-video-jaime-sadomie.html',
 								            'info_dict': {
 								                'id': 'kamila-avec-video-jaime-sadomie',
 								                'title': "Kamila avec vídeo “J'aime sadomie”",
 								            },
 								            'playlist_count': 8,
 								        },
-												[generic] Add the test. Closes #1638

											
										
										
											2016-07-09 06:39:01 +00:00
+								        {
 								            # Non-standard Vimeo embed
 								            'url': 'https://openclassrooms.com/courses/understanding-the-web',
 								            'md5': '64d86f1c7d369afd9a78b38cbb88d80a',
 								            'info_dict': {
 								                'id': '148867247',
 								                'ext': 'mp4',
 								                'title': 'Understanding the web - Teaser',
 								                'description': 'This is "Understanding the web - Teaser" by openclassrooms on Vimeo, the home for high quality videos and the people who love them.',
 								                'upload_date': '20151214',
 								                'uploader': 'OpenClassrooms',
 								                'uploader_id': 'openclassrooms',
 								            },
 								            'add_ie': ['Vimeo'],
 								        },
-												[extractor/generic] Add vimeo embed that requires Referer passed

											
										
										
											2016-09-12 14:49:31 +00:00
+								        {
 								            # generic vimeo embed that requires original URL passed as Referer
 								            'url': 'http://racing4everyone.eu/2016/07/30/formula-1-2016-round12-germany/',
 								            'only_matching': True,
 								        },
-												[extractor/generic] Add support for arkena embeds

											
										
										
											2016-07-23 10:56:48 +00:00
+								        {
 								            'url': 'https://support.arkena.com/display/PLAY/Ways+to+embed+your+video',
 								            'md5': 'b96f2f71b359a8ecd05ce4e1daa72365',
 								            'info_dict': {
 								                'id': 'b41dda37-d8e7-4d3f-b1b5-9a9db578bdfe',
 								                'ext': 'mp4',
 								                'title': 'Big Buck Bunny',
 								                'description': 'Royalty free test video',
 								                'timestamp': 1432816365,
 								                'upload_date': '20150528',
 								                'is_live': False,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2022-08-01 01:23:25 +00:00
+								            'add_ie': ['Arkena'],
-												[extractor/generic] Add support for arkena embeds

											
										
										
											2016-07-23 10:56:48 +00:00
+								        },
-												[vbox7:generic] Add support for vbox7 embeds

											
										
										
											2016-08-16 18:02:59 +00:00
+								        {
 								            'url': 'http://nova.bg/news/view/2016/08/16/156543/%D0%BD%D0%B0-%D0%BA%D0%BE%D1%81%D1%8A%D0%BC-%D0%BE%D1%82-%D0%B2%D0%B7%D1%80%D0%B8%D0%B2-%D0%BE%D1%82%D1%86%D0%B5%D0%BF%D0%B8%D1%85%D0%B0-%D1%86%D1%8F%D0%BB-%D0%BA%D0%B2%D0%B0%D1%80%D1%82%D0%B0%D0%BB-%D0%B7%D0%B0%D1%80%D0%B0%D0%B4%D0%B8-%D0%B8%D0%B7%D1%82%D0%B8%D1%87%D0%B0%D0%BD%D0%B5-%D0%BD%D0%B0-%D0%B3%D0%B0%D0%B7-%D0%B2-%D0%BF%D0%BB%D0%BE%D0%B2%D0%B4%D0%B8%D0%B2/',
 								            'info_dict': {
 								                'id': '1c7141f46c',
 								                'ext': 'mp4',
 								                'title': 'НА КОСЪМ ОТ ВЗРИВ: Изтичане на газ на бензиностанция в Пловдив',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2022-08-01 01:23:25 +00:00
+								            'add_ie': ['Vbox7'],
-												[vbox7:generic] Add support for vbox7 embeds

											
										
										
											2016-08-16 18:02:59 +00:00
+								        },
-												[DBTV:generic] Add support for embeds

											
										
										
											2016-08-17 10:45:24 +00:00
+								        {
 								            # DBTV embeds
 								            'url': 'http://www.dagbladet.no/2016/02/23/nyheter/nordlys/ski/troms/ver/43254897/',
-												[generic] Fix dbtv test (Closes #10364)

											
										
										
											2016-08-18 14:35:41 +00:00
+								            'info_dict': {
 								                'id': '43254897',
 								                'title': 'Etter ett års planlegging, klaffet endelig alt: - Jeg måtte ta en liten dans',
 								            },
-												[DBTV:generic] Add support for embeds

											
										
										
											2016-08-17 10:45:24 +00:00
+								            'playlist_mincount': 3,
 								        },
-												[videa] Add support for videa embeds

											
										
										
											2016-12-31 15:04:29 +00:00
+								        {
 								            # Videa embeds
 								            'url': 'http://forum.dvdtalk.com/movie-talk/623756-deleted-magic-star-wars-ot-deleted-alt-scenes-docu-style.html',
 								            'info_dict': {
 								                'id': '623756-deleted-magic-star-wars-ot-deleted-alt-scenes-docu-style',
 								                'title': 'Deleted Magic - Star Wars: OT Deleted / Alt. Scenes Docu. Style - DVD Talk Forum',
 								            },
 								            'playlist_mincount': 2,
 								        },
-												[extractor/generic] Add support for 20 minuten embeds (closes #11683, closes #11751)

											
										
										
											2017-01-18 15:08:31 +00:00
+								        {
 								            # 20 minuten embed
 								            'url': 'http://www.20min.ch/schweiz/news/story/So-kommen-Sie-bei-Eis-und-Schnee-sicher-an-27032552',
 								            'info_dict': {
 								                'id': '523629',
 								                'ext': 'mp4',
 								                'title': 'So kommen Sie bei Eis und Schnee sicher an',
 								                'description': 'md5:117c212f64b25e3d95747e5276863f7d',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2022-08-01 01:23:25 +00:00
+								            'add_ie': ['TwentyMinuten'],
-												[videopress] Add extractor

											
										
										
											2017-02-05 06:37:27 +00:00
+								        },
 								        {
 								            # VideoPress embed
 								            'url': 'https://en.support.wordpress.com/videopress/',
 								            'info_dict': {
 								                'id': 'OcobLTqC',
 								                'ext': 'm4v',
 								                'title': 'IMG_5786',
 								                'timestamp': 1435711927,
 								                'upload_date': '20150701',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2022-08-01 01:23:25 +00:00
+								            'add_ie': ['VideoPress'],
-												[theplatform] Recognize URLs with whitespaces (closes #12044)

											
										
										
											2017-02-17 15:13:51 +00:00
+								        },
-												[generic] Add support for rutube embeds

											
										
										
											2017-03-03 17:46:33 +00:00
+								        {
 								            # Rutube embed
 								            'url': 'http://magazzino.friday.ru/videos/vipuski/kazan-2',
 								            'info_dict': {
 								                'id': '9b3d5bee0a8740bf70dfd29d3ea43541',
 								                'ext': 'flv',
 								                'title': 'Магаззино: Казань 2',
 								                'description': 'md5:99bccdfac2269f0e8fdbc4bbc9db184a',
 								                'uploader': 'Магаззино',
 								                'upload_date': '20170228',
 								                'uploader_id': '996642',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2022-08-01 01:23:25 +00:00
+								            'add_ie': ['Rutube'],
-												[generic] Add support for rutube embeds

											
										
										
											2017-03-03 17:46:33 +00:00
+								        },
-												[glomex] Add new extractors (#1979)

Original PR: https://github.com/ytdl-org/youtube-dl/pull/30212
Authored by: zmousm
											
										
										
											2022-01-13 21:09:52 +00:00
+								        {
-												[glomex] Minor fixes (#2357)

Authored by: zmousm
											
										
										
											2022-01-16 12:38:31 +00:00
+								            # glomex:embed
-												[glomex] Add new extractors (#1979)

Original PR: https://github.com/ytdl-org/youtube-dl/pull/30212
Authored by: zmousm
											
										
										
											2022-01-13 21:09:52 +00:00
+								            'url': 'https://www.skai.gr/news/world/iatrikos-syllogos-tourkias-to-turkovac-aplo-dialyma-erntogan-eiste-apateones-kai-pseytes',
 								            'info_dict': {
 								                'id': 'v-ch2nkhcirwc9-sf',
 								                'ext': 'mp4',
 								                'title': 'md5:786e1e24e06c55993cee965ef853a0c1',
 								                'description': 'md5:8b517a61d577efe7e36fde72fd535995',
 								                'timestamp': 1641885019,
 								                'upload_date': '20220111',
 								                'duration': 460000,
-												[megatvcom] Add embed test (#2362)

Authored by: zmousm
											
										
										
											2022-01-19 13:43:51 +00:00
+								                'thumbnail': 'https://i3thumbs.glomex.com/dC1idjJwdndiMjRzeGwvMjAyMi8wMS8xMS8wNy8xMF8zNV82MWRkMmQ2YmU5ZTgyLmpwZw==/profile:player-960x540',
-												[glomex] Add new extractors (#1979)

Original PR: https://github.com/ytdl-org/youtube-dl/pull/30212
Authored by: zmousm
											
										
										
											2022-01-13 21:09:52 +00:00
+								            },
 								        },
-												[megatvcom] Add embed test (#2362)

Authored by: zmousm
											
										
										
											2022-01-19 13:43:51 +00:00
+								        {
 								            # megatvcom:embed
 								            'url': 'https://www.in.gr/2021/12/18/greece/apokalypsi-mega-poios-parelave-tin-ereyna-tsiodra-ek-merous-tis-kyvernisis-o-prothypourgos-telika-gnorize/',
 								            'info_dict': {
 								                'id': 'apokalypsi-mega-poios-parelave-tin-ereyna-tsiodra-ek-merous-tis-kyvernisis-o-prothypourgos-telika-gnorize',
 								                'title': 'md5:5e569cf996ec111057c2764ec272848f',
 								            },
 								            'playlist': [{
 								                'md5': '1afa26064ff00ccb91617957dbc73dc1',
 								                'info_dict': {
 								                    'ext': 'mp4',
 								                    'id': '564916',
 								                    'display_id': 'md5:6cdf22d3a2e7bacb274b7295089a1770',
 								                    'title': 'md5:33b9dd39584685b62873043670eb52a6',
 								                    'description': 'md5:c1db7310f390518ac36dd69d947ef1a1',
 								                    'timestamp': 1639753145,
 								                    'upload_date': '20211217',
 								                    'thumbnail': 'https://www.megatv.com/wp-content/uploads/2021/12/prezerakos-1024x597.jpg',
 								                },
 								            }, {
 								                'md5': '4a1c220695f1ef865a8b7966a53e2474',
 								                'info_dict': {
 								                    'ext': 'mp4',
 								                    'id': '564905',
 								                    'display_id': 'md5:ead15695e485e649aed2b81ebd699b88',
 								                    'title': 'md5:2b71fd54249a3ca34609fe39ae31c47b',
 								                    'description': 'md5:c42e12f638d0a97d6de4508e2c4df982',
 								                    'timestamp': 1639753047,
 								                    'upload_date': '20211217',
 								                    'thumbnail': 'https://www.megatv.com/wp-content/uploads/2021/12/tsiodras-mitsotakis-1024x545.jpg',
 								                },
 								            }]
 								        },
-												[ertgr] Add new extractors (#2338)

Authored-by: zmousm, dirkf
											
										
										
											2022-02-01 07:32:13 +00:00
+								        {
 								            'url': 'https://www.ertnews.gr/video/manolis-goyalles-o-anthropos-piso-apo-ti-diadiktyaki-vasilopita/',
 								            'info_dict': {
 								                'id': '2022/tv/news-themata-ianouarios/20220114-apotis6-gouales-pita.mp4',
 								                'ext': 'mp4',
 								                'title': 'md5:df64f5b61c06d0e9556c0cdd5cf14464',
 								                'thumbnail': 'https://www.ert.gr/themata/photos/2021/20220114-apotis6-gouales-pita.jpg',
 								            },
 								        },
-												[theplatform] Recognize URLs with whitespaces (closes #12044)

											
										
										
											2017-02-17 15:13:51 +00:00
+								        {
 								            # ThePlatform embedded with whitespaces in URLs
 								            'url': 'http://www.golfchannel.com/topics/shows/golftalkcentral.htm',
 								            'only_matching': True,
 								        },
-												[generic] Add test for Senate ISVP iframe embed


											
										
										
											2017-03-21 17:12:14 +00:00
+								        {
 								            # Senate ISVP iframe https
 								            'url': 'https://www.hsgac.senate.gov/hearings/canadas-fast-track-refugee-plan-unanswered-questions-and-implications-for-us-national-security',
 								            'md5': 'fb8c70b0b515e5037981a2492099aab8',
 								            'info_dict': {
 								                'id': 'govtaff020316',
 								                'ext': 'mp4',
 								                'title': 'Integrated Senate Video Player',
 								            },
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2022-08-01 01:23:25 +00:00
+								            'add_ie': ['SenateISVP'],
-												[generic] Add test for Senate ISVP iframe embed


											
										
										
											2017-03-21 17:12:14 +00:00
+								        },
-												[extractor/generic] Add test for #12761

											
										
										
											2017-04-16 17:36:59 +00:00
+								        {
 								            # Limelight embeds (1 channel embed + 4 media embeds)
 								            'url': 'http://www.sedona.com/FacilitatorTraining2017',
 								            'info_dict': {
 								                'id': 'FacilitatorTraining2017',
 								                'title': 'Facilitator Training 2017',
 								            },
 								            'playlist_mincount': 5,
 								        },
-												[generic] Add test for #13895

											
										
										
											2017-08-12 18:11:27 +00:00
+								        {
 								            # Limelight embed (LimelightPlayerUtil.embed)
 								            'url': 'https://tv5.ca/videos?v=xuu8qowr291ri',
 								            'info_dict': {
 								                'id': '95d035dc5c8a401588e9c0e6bd1e9c92',
 								                'ext': 'mp4',
 								                'title': '07448641',
 								                'timestamp': 1499890639,
 								                'upload_date': '20170712',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								            'add_ie': ['LimelightMedia'],
 								        },
-												[anvato] Improve extraction (closes #12913)
* Promote to regular shortcut based extractor
* Add mcp to access key mapping table
* Add support for embeds extraction
* Add support for anvato embeds in generic extractor

											
										
										
											2017-04-29 12:49:04 +00:00
+								        {
 								            'url': 'http://kron4.com/2017/04/28/standoff-with-walnut-creek-murder-suspect-ends-with-arrest/',
 								            'info_dict': {
 								                'id': 'standoff-with-walnut-creek-murder-suspect-ends-with-arrest',
 								                'title': 'Standoff with Walnut Creek murder suspect ends',
 								                'description': 'md5:3ccc48a60fc9441eeccfc9c469ebf788',
 								            },
 								            'playlist_mincount': 4,
 								        },
-												[washingtonpost] Add support for embeds (closes #12699)

											
										
										
											2017-04-10 05:09:10 +00:00
+								        {
 								            # WashingtonPost embed
 								            'url': 'http://www.vanityfair.com/hollywood/2017/04/donald-trump-tv-pitches',
 								            'info_dict': {
 								                'id': '8caf6e88-d0ec-11e5-90d3-34c2c42653ac',
 								                'ext': 'mp4',
 								                'title': "No one has seen the drama series based on Trump's life \u2014 until now",
 								                'description': 'Donald Trump wanted a weekly TV drama based on his life. It never aired. But The Washington Post recently obtained a scene from the pilot script — and enlisted actors.',
 								                'timestamp': 1455216756,
 								                'uploader': 'The Washington Post',
 								                'upload_date': '20160211',
 								            },
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2022-08-01 01:23:25 +00:00
+								            'add_ie': ['WashingtonPost'],
-												[washingtonpost] Add support for embeds (closes #12699)

											
										
										
											2017-04-10 05:09:10 +00:00
+								        },
-												[joj] Rewrite and add support for generic embeds (closes #13268)

											
										
										
											2017-07-09 12:05:18 +00:00
+								        {
 								            # JOJ.sk embeds
 								            'url': 'https://www.noviny.sk/slovensko/238543-slovenskom-sa-prehnala-vlna-silnych-burok',
 								            'info_dict': {
 								                'id': '238543-slovenskom-sa-prehnala-vlna-silnych-burok',
 								                'title': 'Slovenskom sa prehnala vlna silných búrok',
 								            },
 								            'playlist_mincount': 5,
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2022-08-01 01:23:25 +00:00
+								            'add_ie': ['Joj'],
-												[joj] Rewrite and add support for generic embeds (closes #13268)

											
										
										
											2017-07-09 12:05:18 +00:00
+								        },
-												[extractor/common] Add support for AMP tags in _parse_html5_media_entries

											
										
										
											2017-07-09 09:29:52 +00:00
+								        {
 								            # AMP embed (see https://www.ampproject.org/docs/reference/components/amp-video)
 								            'url': 'https://tvrain.ru/amp/418921/',
 								            'md5': 'cc00413936695987e8de148b67d14f1d',
 								            'info_dict': {
 								                'id': '418921',
 								                'ext': 'mp4',
 								                'title': 'Стас Намин: «Мы нарушили девственность Кремля»',
 								            },
 								        },
-												[generic] Fix support for multiple HTML5 videos on one page (closes #14080)


											
										
										
											2017-09-22 22:49:48 +00:00
+								        {
 								            # multiple HTML5 videos on one page
 								            'url': 'https://www.paragon-software.com/home/rk-free/keyscenarios.html',
 								            'info_dict': {
 								                'id': 'keyscenarios',
 								                'title': 'Rescue Kit 14 Free Edition - Getting started',
 								            },
 								            'playlist_count': 4,
-												[vshare] Fix extraction (closes #14473)


											
										
										
											2017-11-14 15:34:45 +00:00
+								        },
 								        {
 								            # vshare embed
-												Completely change project name to yt-dlp (#85)

* All modules and binary names are changed
* All documentation references changed
* yt-dlp no longer loads youtube-dlc config files
* All URLs changed to point to organization account

Co-authored-by: Pccode66
Co-authored-by: pukkandan
											
										
										
											2021-02-24 18:45:56 +00:00
+								            'url': 'https://youtube-dl-demo.neocities.org/vshare.html',
-												[vshare] Fix extraction (closes #14473)


											
										
										
											2017-11-14 15:34:45 +00:00
+								            'md5': '17b39f55b5497ae8b59f5fbce8e35886',
 								            'info_dict': {
 								                'id': '0f64ce6',
 								                'title': 'vl14062007715967',
 								                'ext': 'mp4',
 								            }
-												[mediasite] Improve extraction and code style, add support for DASH (closes #11185, closes #14343, refs #5428)

											
										
										
											2017-12-30 00:28:18 +00:00
+								        },
 								        {
 								            'url': 'http://www.heidelberg-laureate-forum.org/blog/video/lecture-friday-september-23-2016-sir-c-antony-r-hoare/',
 								            'md5': 'aecd089f55b1cb5a59032cb049d3a356',
 								            'info_dict': {
 								                'id': '90227f51a80c4d8f86c345a7fa62bd9a1d',
 								                'ext': 'mp4',
 								                'title': 'Lecture: Friday, September 23, 2016 - Sir Tony Hoare',
 								                'description': 'md5:5a51db84a62def7b7054df2ade403c6c',
 								                'timestamp': 1474354800,
 								                'upload_date': '20160920',
 								            }
-												[springboardplatform] Add extractor

											
										
										
											2018-01-19 17:33:45 +00:00
+								        },
 								        {
 								            'url': 'http://www.kidzworld.com/article/30935-trolls-the-beat-goes-on-interview-skylar-astin-and-amanda-leighton',
 								            'info_dict': {
 								                'id': '1731611',
 								                'ext': 'mp4',
 								                'title': 'Official Trailer | TROLLS: THE BEAT GOES ON!',
 								                'description': 'md5:eb5f23826a027ba95277d105f248b825',
 								                'timestamp': 1516100691,
 								                'upload_date': '20180116',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2022-08-01 01:23:25 +00:00
+								            'add_ie': ['SpringboardPlatform'],
-												[youtube] Handle shared URLs with generic extractor (closes #14303)

											
										
										
											2018-02-15 15:33:11 +00:00
+								        },
-												[yapfiles] Add extractor (closes #15726, refs #11085)

											
										
										
											2018-03-02 18:24:36 +00:00
+								        {
 								            'url': 'https://www.yapfiles.ru/show/1872528/690b05d3054d2dbe1e69523aa21bb3b1.mp4.html',
 								            'info_dict': {
 								                'id': 'vMDE4NzI1Mjgt690b',
 								                'ext': 'mp4',
 								                'title': 'Котята',
 								            },
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2022-08-01 01:23:25 +00:00
+								            'add_ie': ['YapFiles'],
-												[yapfiles] Add extractor (closes #15726, refs #11085)

											
										
										
											2018-03-02 18:24:36 +00:00
+								            'params': {
 								                'skip_download': True,
 								            },
-												[generic] Add support for share-videos.se embeds (closes #16089)


											
										
										
											2018-04-08 17:19:23 +00:00
+								        },
-												[cloudflarestream] Add support for cloudflare streams (closes #16375)

											
										
										
											2018-05-04 18:21:52 +00:00
+								        {
 								            # CloudflareStream embed
 								            'url': 'https://www.cloudflare.com/products/cloudflare-stream/',
 								            'info_dict': {
 								                'id': '31c9291ab41fac05471db4e73aa11717',
 								                'ext': 'mp4',
 								                'title': '31c9291ab41fac05471db4e73aa11717',
 								            },
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2022-08-01 01:23:25 +00:00
+								            'add_ie': ['CloudflareStream'],
-												[cloudflarestream] Add support for cloudflare streams (closes #16375)

											
										
										
											2018-05-04 18:21:52 +00:00
+								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[peertube] Add support for generic embeds

											
										
										
											2018-05-25 17:28:30 +00:00
+								        {
 								            # PeerTube embed
 								            'url': 'https://joinpeertube.org/fr/home/',
 								            'info_dict': {
 								                'id': 'home',
 								                'title': 'Reprenez le contrôle de vos vidéos ! #JoinPeertube',
 								            },
 								            'playlist_count': 2,
 								        },
-												[indavideo] Add support for generic embeds (closes #11989)

											
										
										
											2018-05-25 18:25:40 +00:00
+								        {
 								            # Indavideo embed
 								            'url': 'https://streetkitchen.hu/receptek/igy_kell_otthon_hamburgert_sutni/',
 								            'info_dict': {
 								                'id': '1693903',
 								                'ext': 'mp4',
 								                'title': 'Így kell otthon hamburgert sütni',
 								                'description': 'md5:f5a730ecf900a5c852e1e00540bbb0f7',
 								                'timestamp': 1426330212,
 								                'upload_date': '20150314',
 								                'uploader': 'StreetKitchen',
 								                'uploader_id': '546363',
 								            },
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now.

Note: Tests have not been migrated

											
										
										
											2022-08-01 01:23:25 +00:00
+								            'add_ie': ['IndavideoEmbed'],
-												[indavideo] Add support for generic embeds (closes #11989)

											
										
										
											2018-05-25 18:25:40 +00:00
+								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[apa] Add extractor (closes #15041, closes #15672)

											
										
										
											2018-05-27 11:24:37 +00:00
+								        {
 								            # APA embed via JWPlatform embed
 								            'url': 'http://www.vol.at/blue-man-group/5593454',
 								            'info_dict': {
 								                'id': 'jjv85FdZ',
 								                'ext': 'mp4',
 								                'title': '"Blau ist mysteriös": Die Blue Man Group im Interview',
 								                'description': 'md5:d41d8cd98f00b204e9800998ecf8427e',
 								                'thumbnail': r're:^https?://.*\.jpg$',
 								                'duration': 254,
 								                'timestamp': 1519211149,
 								                'upload_date': '20180221',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[generic] Add support for share-videos.se embeds (closes #16089)


											
										
										
											2018-04-08 17:19:23 +00:00
+								        {
 								            'url': 'http://share-videos.se/auto/video/83645793?uid=13',
 								            'md5': 'b68d276de422ab07ee1d49388103f457',
 								            'info_dict': {
 								                'id': '83645793',
 								                'title': 'Lock up and get excited',
 								                'ext': 'mp4'
-												[generic] Restrict share-videos.se embeds regex to filter bogus URLs (#16115)

											
										
										
											2018-04-08 17:25:44 +00:00
+								            },
 								            'skip': 'TODO: fix nested playlists processing in tests',
 								        },
-												[viqeo] Add extractor (closes #17066)

											
										
										
											2018-07-29 20:05:36 +00:00
+								        {
 								            # Viqeo embeds
 								            'url': 'https://viqeo.tv/',
 								            'info_dict': {
 								                'id': 'viqeo',
 								                'title': 'All-new video platform',
 								            },
 								            'playlist_count': 6,
 								        },
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 12:26:37 +00:00
+								        # {
 								        #     # Zype embed
 								        #     'url': 'https://www.cookscountry.com/episode/554-smoky-barbecue-favorites',
 								        #     'info_dict': {
 								        #         'id': '5b400b834b32992a310622b9',
 								        #         'ext': 'mp4',
 								        #         'title': 'Smoky Barbecue Favorites',
 								        #         'thumbnail': r're:^https?://.*\.jpe?g',
 								        #         'description': 'md5:5ff01e76316bd8d46508af26dc86023b',
 								        #         'upload_date': '20170909',
 								        #         'timestamp': 1504915200,
 								        #     },
 								        #     'add_ie': [ZypeIE.ie_key()],
 								        #     'params': {
 								        #         'skip_download': True,
 								        #     },
 								        # },
-												[generic] Allow relative src for videojs embeds (closes #17324)

											
										
										
											2018-08-24 16:12:53 +00:00
+								        {
 								            # videojs embed
 								            'url': 'https://video.sibnet.ru/shell.php?videoid=3422904',
 								            'info_dict': {
 								                'id': 'shell',
 								                'ext': 'mp4',
 								                'title': 'Доставщик пиццы спросил разрешения сыграть на фортепиано',
 								                'description': 'md5:89209cdc587dab1e4a090453dbaa2cb1',
 								                'thumbnail': r're:^https?://.*\.jpg$',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								            'expected_warnings': ['Failed to download MPD manifest'],
 								        },
-												[dailymotion] add support embed with DM.player js call

											
										
										
											2019-07-01 07:37:21 +00:00
+								        {
 								            # DailyMotion embed with DM.player
 								            'url': 'https://www.beinsports.com/us/copa-del-rey/video/the-locker-room-valencia-beat-barca-in-copa/1203804',
 								            'info_dict': {
 								                'id': 'k6aKkGHd9FJs4mtJN39',
 								                'ext': 'mp4',
 								                'title': 'The Locker Room: Valencia Beat Barca In Copa del Rey Final',
 								                'description': 'This video is private.',
 								                'uploader_id': 'x1jf30l',
 								                'uploader': 'beIN SPORTS USA',
 								                'upload_date': '20190528',
 								                'timestamp': 1559062971,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[tvopengr] Add extractors (#2297)

Authored by: zmousm
											
										
										
											2022-01-19 20:43:02 +00:00
+								        {
 								            # tvopengr:embed
 								            'url': 'https://www.ethnos.gr/World/article/190604/hparosiaxekinoynoisynomiliessthgeneyhmethskiatoypolemoypanoapothnoykrania',
 								            'md5': 'eb0c3995d0a6f18f6538c8e057865d7d',
 								            'info_dict': {
 								                'id': '101119',
 								                'ext': 'mp4',
 								                'display_id': 'oikarpoitondiapragmateyseonhparosias',
 								                'title': 'md5:b979f4d640c568617d6547035528a149',
 								                'description': 'md5:e54fc1977c7159b01cc11cd7d9d85550',
 								                'timestamp': 1641772800,
 								                'upload_date': '20220110',
 								                'thumbnail': 'https://opentv-static.siliconweb.com/imgHandler/1920/70bc39fa-895b-4918-a364-c39d2135fc6d.jpg',
 								            }
 								        },
-												[blogger] Add extractor (#1629)

Authored by: pabs3
											
										
										
											2021-11-18 22:15:41 +00:00
+								        {
 								            # blogger embed
 								            'url': 'https://blog.tomeuvizoso.net/2019/01/a-panfrost-milestone.html',
 								            'md5': 'f1bc19b6ea1b0fd1d81e84ca9ec467ac',
 								            'info_dict': {
 								                'id': 'BLOGGER-video-3c740e3a49197e16-796',
 								                'ext': 'mp4',
 								                'title': 'Blogger',
 								                'thumbnail': r're:^https?://.*',
 								            },
 								        },
-												[extractor/generic] Properly comment out a test

											
										
										
											2016-07-09 01:32:55 +00:00
+								        # {
 								        #     # TODO: find another test
 								        #     # http://schema.org/VideoObject
 								        #     'url': 'https://flipagram.com/f/nyvTSJMKId',
 								        #     'md5': '888dcf08b7ea671381f00fab74692755',
 								        #     'info_dict': {
 								        #         'id': 'nyvTSJMKId',
 								        #         'ext': 'mp4',
 								        #         'title': 'Flipagram by sjuria101 featuring Midnight Memories by One Direction',
 								        #         'description': '#love for cats.',
 								        #         'timestamp': 1461244995,
 								        #         'upload_date': '20160421',
 								        #     },
 								        #     'params': {
 								        #         'force_generic_extractor': True,
 								        #     },
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 12:26:37 +00:00
+								        # },
 								        {
 								            # VHX Embed
 								            'url': 'https://demo.vhx.tv/category-c/videos/file-example-mp4-480-1-5mg-copy',
 								            'info_dict': {
 								                'id': '858208',
 								                'ext': 'mp4',
 								                'title': 'Untitled',
 								                'uploader_id': 'user80538407',
 								                'uploader': 'OTT Videos',
 								            },
 								        },
 								        {
 								            # ArcPublishing PoWa video player
 								            'url': 'https://www.adn.com/politics/2020/11/02/video-senate-candidates-campaign-in-anchorage-on-eve-of-election-day/',
 								            'md5': 'b03b2fac8680e1e5a7cc81a5c27e71b3',
 								            'info_dict': {
 								                'id': '8c99cb6e-b29c-4bc9-9173-7bf9979225ab',
 								                'ext': 'mp4',
 								                'title': 'Senate candidates wave to voters on Anchorage streets',
 								                'description': 'md5:91f51a6511f090617353dc720318b20e',
 								                'timestamp': 1604378735,
 								                'upload_date': '20201103',
 								                'duration': 1581,
 								            },
 								        },
-												Update to ytdl-2021.02.04.1 except youtube

											
										
										
											2021-02-04 07:56:01 +00:00
+								        {
 								            # MyChannels SDK embed
 								            # https://www.24kitchen.nl/populair/deskundige-dit-waarom-sommigen-gevoelig-zijn-voor-voedselallergieen
 								            'url': 'https://www.demorgen.be/nieuws/burgemeester-rotterdam-richt-zich-in-videoboodschap-tot-relschoppers-voelt-het-goed~b0bcfd741/',
 								            'md5': '90c0699c37006ef18e198c032d81739c',
 								            'info_dict': {
 								                'id': '194165',
 								                'ext': 'mp4',
 								                'title': 'Burgemeester Aboutaleb spreekt relschoppers toe',
 								                'timestamp': 1611740340,
 								                'upload_date': '20210127',
 								                'duration': 159,
 								            },
 								        },
-												Update to ytdl-commit-cf2dbec
https://github.com/ytdl-org/youtube-dl/commit/cf2dbec6301177a1fddf72862de05fa912d9869d

Except: [kakao] improve info extraction and detect geo restriction
https://github.com/ytdl-org/youtube-dl/commit/d8085580f63ad3b146a31712ff76cf41d5a4558a

											
										
										
											2021-02-19 20:44:36 +00:00
+								        {
 								            # Simplecast player embed
 								            'url': 'https://www.bio.org/podcast',
 								            'info_dict': {
 								                'id': 'podcast',
 								                'title': 'I AM BIO Podcast | BIO',
 								            },
 								            'playlist_mincount': 52,
-												Update to ytdl-commit-dfbbe29

[redbulltv] fix embed data extraction
https://github.com/ytdl-org/youtube-dl/commit/dfbbe2902fc67f0f93ee47a8077c148055c67a9b

											
										
										
											2021-05-20 15:38:49 +00:00
+								        }, {
-												[wimtv] Add extractor (#161)

Added support for VODs, live and embeds

Authored by: nixxo
											
										
										
											2021-03-11 07:58:51 +00:00
+								            # WimTv embed player
 								            'url': 'http://www.msmotor.tv/wearefmi-pt-2-2021/',
 								            'info_dict': {
 								                'id': 'wearefmi-pt-2-2021',
 								                'title': '#WEAREFMI – PT.2 – 2021 – MsMotorTV',
 								            },
 								            'playlist_count': 1,
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											2021-07-29 04:03:01 +00:00
+								        }, {
 								            # KVS Player
 								            'url': 'https://www.kvs-demo.com/videos/105/kelis-4th-of-july/',
 								            'info_dict': {
 								                'id': '105',
 								                'display_id': 'kelis-4th-of-july',
 								                'ext': 'mp4',
 								                'title': 'Kelis - 4th Of July',
-												Update to ytdl-commit-195f22f6

[generic] Improve KVS (etc) extraction
https://github.com/ytdl-org/youtube-dl/commit/195f22f679330549882a8234e7234942893a4902

Closes #3716
Authored by: Grub4k, pukkandan
											
										
										
											2023-01-02 13:45:36 +00:00
+								                'description': 'Kelis - 4th Of July',
 								                'thumbnail': r're:https://(?:www\.)?kvs-demo.com/contents/videos_screenshots/0/105/preview.jpg',
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											2021-07-29 04:03:01 +00:00
+								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												Update to ytdl-commit-195f22f6

[generic] Improve KVS (etc) extraction
https://github.com/ytdl-org/youtube-dl/commit/195f22f679330549882a8234e7234942893a4902

Closes #3716
Authored by: Grub4k, pukkandan
											
										
										
											2023-01-02 13:45:36 +00:00
+								            'expected_warnings': ['Untested major version'],
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											2021-07-29 04:03:01 +00:00
+								        }, {
 								            # KVS Player
 								            'url': 'https://www.kvs-demo.com/embed/105/',
 								            'info_dict': {
 								                'id': '105',
 								                'display_id': 'kelis-4th-of-july',
 								                'ext': 'mp4',
 								                'title': 'Kelis - 4th Of July / Embed Player',
-												Update to ytdl-commit-195f22f6

[generic] Improve KVS (etc) extraction
https://github.com/ytdl-org/youtube-dl/commit/195f22f679330549882a8234e7234942893a4902

Closes #3716
Authored by: Grub4k, pukkandan
											
										
										
											2023-01-02 13:45:36 +00:00
+								                'thumbnail': r're:https://(?:www\.)?kvs-demo.com/contents/videos_screenshots/0/105/preview.jpg',
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											2021-07-29 04:03:01 +00:00
+								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        }, {
 								            'url': 'https://youix.com/video/leningrad-zoj/',
 								            'md5': '94f96ba95706dc3880812b27b7d8a2b8',
 								            'info_dict': {
 								                'id': '18485',
 								                'display_id': 'leningrad-zoj',
 								                'ext': 'mp4',
 								                'title': 'Клип: Ленинград - ЗОЖ скачать, смотреть онлайн | Youix.com',
-												Update to ytdl-commit-195f22f6

[generic] Improve KVS (etc) extraction
https://github.com/ytdl-org/youtube-dl/commit/195f22f679330549882a8234e7234942893a4902

Closes #3716
Authored by: Grub4k, pukkandan
											
										
										
											2023-01-02 13:45:36 +00:00
+								                'thumbnail': r're:https://youix.com/contents/videos_screenshots/18000/18485/preview(?:_480x320_youix_com.mp4)?\.jpg',
 								            },
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											2021-07-29 04:03:01 +00:00
+								        }, {
 								            # KVS Player
 								            'url': 'https://youix.com/embed/18485',
 								            'md5': '94f96ba95706dc3880812b27b7d8a2b8',
 								            'info_dict': {
 								                'id': '18485',
 								                'display_id': 'leningrad-zoj',
 								                'ext': 'mp4',
 								                'title': 'Ленинград - ЗОЖ',
-												Update to ytdl-commit-195f22f6

[generic] Improve KVS (etc) extraction
https://github.com/ytdl-org/youtube-dl/commit/195f22f679330549882a8234e7234942893a4902

Closes #3716
Authored by: Grub4k, pukkandan
											
										
										
											2023-01-02 13:45:36 +00:00
+								                'thumbnail': r're:https://youix.com/contents/videos_screenshots/18000/18485/preview(?:_480x320_youix_com.mp4)?\.jpg',
 								            },
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											2021-07-29 04:03:01 +00:00
+								        }, {
 								            # KVS Player
 								            'url': 'https://bogmedia.org/videos/21217/40-nochey-40-nights-2016/',
 								            'md5': '94166bdb26b4cb1fb9214319a629fc51',
 								            'info_dict': {
 								                'id': '21217',
-												Update to ytdl-commit-195f22f6

[generic] Improve KVS (etc) extraction
https://github.com/ytdl-org/youtube-dl/commit/195f22f679330549882a8234e7234942893a4902

Closes #3716
Authored by: Grub4k, pukkandan
											
										
										
											2023-01-02 13:45:36 +00:00
+								                'display_id': '40-nochey-2016',
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											2021-07-29 04:03:01 +00:00
+								                'ext': 'mp4',
 								                'title': '40 ночей (2016) - BogMedia.org',
-												Update to ytdl-commit-195f22f6

[generic] Improve KVS (etc) extraction
https://github.com/ytdl-org/youtube-dl/commit/195f22f679330549882a8234e7234942893a4902

Closes #3716
Authored by: Grub4k, pukkandan
											
										
										
											2023-01-02 13:45:36 +00:00
+								                'description': 'md5:4e6d7d622636eb7948275432eb256dc3',
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											2021-07-29 04:03:01 +00:00
+								                'thumbnail': 'https://bogmedia.org/contents/videos_screenshots/21000/21217/preview_480p.mp4.jpg',
-												Update to ytdl-commit-195f22f6

[generic] Improve KVS (etc) extraction
https://github.com/ytdl-org/youtube-dl/commit/195f22f679330549882a8234e7234942893a4902

Closes #3716
Authored by: Grub4k, pukkandan
											
										
										
											2023-01-02 13:45:36 +00:00
+								            },
-												[wimtv] Add extractor (#161)

Added support for VODs, live and embeds

Authored by: nixxo
											
										
										
											2021-03-11 07:58:51 +00:00
+								        },
-												[generic] Fix HTTP KVS Player (#2111)

Authored by: git-anony-mouse
											
										
										
											2021-12-25 03:18:19 +00:00
+								        {
 								            # KVS Player (for sites that serve kt_player.js via non-https urls)
 								            'url': 'http://www.camhub.world/embed/389508',
 								            'md5': 'fbe89af4cfb59c8fd9f34a202bb03e32',
 								            'info_dict': {
 								                'id': '389508',
 								                'display_id': 'syren-de-mer-onlyfans-05-07-2020have-a-happy-safe-holiday5f014e68a220979bdb8cd-source',
 								                'ext': 'mp4',
-												Update to ytdl-commit-195f22f6

[generic] Improve KVS (etc) extraction
https://github.com/ytdl-org/youtube-dl/commit/195f22f679330549882a8234e7234942893a4902

Closes #3716
Authored by: Grub4k, pukkandan
											
										
										
											2023-01-02 13:45:36 +00:00
+								                'title': 'Syren De Mer onlyfans_05-07-2020Have_a_happy_safe_holiday5f014e68a220979bdb8cd_source / Embed плеер',
 								                'thumbnail': r're:https?://www\.camhub\.world/contents/videos_screenshots/389000/389508/preview\.mp4\.jpg',
 								            },
-												[generic] Fix HTTP KVS Player (#2111)

Authored by: git-anony-mouse
											
										
										
											2021-12-25 03:18:19 +00:00
+								        },
-												[Reddit] Add support for 1080p videos (#1682)

Fixes: https://github.com/ytdl-org/youtube-dl/issues/29565

Authored by: xenova
											
										
										
											2021-11-18 22:48:48 +00:00
+								        {
 								            # Reddit-hosted video that will redirect and be processed by RedditIE
 								            # Redirects to https://www.reddit.com/r/videos/comments/6rrwyj/that_small_heart_attack/
 								            'url': 'https://v.redd.it/zv89llsvexdz',
 								            'md5': '87f5f02f6c1582654146f830f21f8662',
 								            'info_dict': {
 								                'id': 'zv89llsvexdz',
 								                'ext': 'mp4',
 								                'timestamp': 1501941939.0,
 								                'title': 'That small heart attack.',
 								                'upload_date': '20170805',
 								                'uploader': 'Antw87'
 								            }
 								        },
 								        {
 								            # 1080p Reddit-hosted video that will redirect and be processed by RedditIE
 								            'url': 'https://v.redd.it/33hgok7dfbz71/',
 								            'md5': '7a1d587940242c9bb3bd6eb320b39258',
 								            'info_dict': {
 								                'id': '33hgok7dfbz71',
 								                'ext': 'mp4',
 								                'title': "The game Didn't want me to Knife that Guy I guess",
 								                'uploader': 'paraf1ve',
 								                'timestamp': 1636788683.0,
 								                'upload_date': '20211113'
 								            }
-												[gfycat] Support embeds (#2229)

Closes #2214
Authored by: coletdjnz
											
										
										
											2022-01-05 08:39:24 +00:00
+								        },
-												[MainStreaming] Add extractor (#2180)

Closes #1183, https://github.com/ytdl-org/youtube-dl/issues/29615

Authored by: coletdjnz
											
										
										
											2022-01-05 08:48:17 +00:00
+								        {
 								            # MainStreaming player
 								            'url': 'https://www.lactv.it/2021/10/03/lac-news24-la-settimana-03-10-2021/',
 								            'info_dict': {
 								                'id': 'EUlZfGWkGpOd',
 								                'title': 'La Settimana ',
 								                'description': '03 Ottobre ore 02:00',
 								                'ext': 'mp4',
 								                'live_status': 'not_live',
 								                'thumbnail': r're:https?://[A-Za-z0-9-]*\.msvdn.net/image/\w+/poster',
 								                'duration': 1512
 								            }
 								        },
-												[gfycat] Support embeds (#2229)

Closes #2214
Authored by: coletdjnz
											
										
										
											2022-01-05 08:39:24 +00:00
+								        {
 								            # Multiple gfycat iframe embeds
 								            'url': 'https://www.gezip.net/bbs/board.php?bo_table=entertaine&wr_id=613422',
 								            'info_dict': {
 								                'title': '재이, 윤, 세은 황금 드레스를 입고 빛난다',
 								                'id': 'board'
 								            },
 								            'playlist_count': 8,
 								        },
 								        {
 								            # Multiple gfycat gifs (direct links)
 								            'url': 'https://www.gezip.net/bbs/board.php?bo_table=entertaine&wr_id=612199',
 								            'info_dict': {
 								                'title': '옳게 된 크롭 니트 스테이씨 아이사',
 								                'id': 'board'
 								            },
 								            'playlist_count': 6
 								        },
 								        {
 								            # Multiple gfycat embeds, with uppercase "IFR" in urls
 								            'url': 'https://kkzz.kr/?vid=2295',
 								            'info_dict': {
 								                'title': '지방시 앰버서더 에스파 카리나 움짤',
 								                'id': '?vid=2295'
 								            },
 								            'playlist_count': 9
-												[panopto] Add extractors (#2908)

Based on https://github.com/ytdl-org/youtube-dl/pull/13449
Closes #1946
Authored by: coletdjnz, kmark
											
										
										
											2022-03-08 21:00:57 +00:00
+								        },
 								        {
 								            # Panopto embeds
 								            'url': 'https://www.monash.edu/learning-teaching/teachhq/learning-technologies/panopto/how-to/insert-a-quiz-into-a-panopto-video',
 								            'info_dict': {
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now.

Note: Tests have not been migrated

											
										
										
											2022-08-01 01:23:25 +00:00
+								                'ext': 'mp4',
 								                'id': '0bd3f16c-824a-436a-8486-ac5900693aef',
 								                'title': 'Quizzes in Panopto',
-												[panopto] Add extractors (#2908)

Based on https://github.com/ytdl-org/youtube-dl/pull/13449
Closes #1946
Authored by: coletdjnz, kmark
											
										
										
											2022-03-08 21:00:57 +00:00
+								            },
-												[ruutu] Detect embeds (#3294)

Authored by: tpikonen
											
										
										
											2022-04-05 12:15:47 +00:00
+								        },
 								        {
 								            # Ruutu embed
 								            'url': 'https://www.nelonen.fi/ohjelmat/madventures-suomi/2160731-riku-ja-tunna-lahtevat-peurajahtiin-tv-sta-tutun-biologin-kanssa---metsastysreissu-huipentuu-kasvissyojan-painajaiseen',
 								            'md5': 'a2513a98d3496099e6eced40f7e6a14b',
 								            'info_dict': {
 								                'id': '4044426',
 								                'ext': 'mp4',
 								                'title': 'Riku ja Tunna lähtevät peurajahtiin tv:stä tutun biologin kanssa – metsästysreissu huipentuu kasvissyöjän painajaiseen!',
 								                'thumbnail': r're:^https?://.+\.jpg$',
 								                'duration': 108,
-												[cleanup] Misc fixes

Closes https://github.com/yt-dlp/yt-dlp/pull/3213, Closes https://github.com/yt-dlp/yt-dlp/pull/3117

Related: https://github.com/yt-dlp/yt-dlp/issues/3146#issuecomment-1077323114, https://github.com/yt-dlp/yt-dlp/pull/3277#discussion_r841019671, https://github.com/yt-dlp/yt-dlp/commit/a825ffbffa0bea322e3ccb44c6f8e01d8d9572fb#commitcomment-68538986, https://github.com/yt-dlp/yt-dlp/issues/2360, https://github.com/yt-dlp/yt-dlp/commit/5fa3c9a88f597625296981a4a26be723e65d4842#r70393519, https://github.com/yt-dlp/yt-dlp/commit/5fa3c9a88f597625296981a4a26be723e65d4842#r70393254

											
										
										
											2022-03-27 02:20:43 +00:00
+								                'series': 'Madventures Suomi',
-												[ruutu] Detect embeds (#3294)

Authored by: tpikonen
											
										
										
											2022-04-05 12:15:47 +00:00
+								                'description': 'md5:aa55b44bd06a1e337a6f1d0b46507381',
 								                'categories': ['Matkailu', 'Elämäntyyli'],
 								                'age_limit': 0,
 								                'upload_date': '20220308',
 								            },
 								        },
-												[ruutu] Support hs.fi embeds (#3547)

Authored by: tpikonen, pukkandan
											
										
										
											2022-05-07 11:24:41 +00:00
+								        {
 								            # Multiple Ruutu embeds
 								            'url': 'https://www.hs.fi/kotimaa/art-2000008762560.html',
 								            'info_dict': {
 								                'title': 'Koronavirus | Epidemiahuippu voi olla Suomessa ohi, mutta koronaviruksen poistamista yleisvaarallisten tautien joukosta harkitaan vasta syksyllä',
 								                'id': 'art-2000008762560'
 								            },
 								            'playlist_count': 3
 								        },
 								        {
 								            # Ruutu embed in hs.fi with a single video
 								            'url': 'https://www.hs.fi/kotimaa/art-2000008793421.html',
 								            'md5': 'f8964e65d8fada6e8a562389bf366bb4',
 								            'info_dict': {
 								                'id': '4081841',
 								                'ext': 'mp4',
 								                'title': 'Puolustusvoimat siirsi panssariajoneuvoja harjoituksiin Niinisaloon 2.5.2022',
 								                'thumbnail': r're:^https?://.+\.jpg$',
 								                'duration': 138,
 								                'age_limit': 0,
 								                'upload_date': '20220504',
 								            },
 								        },
-												[utils] `is_html`: Handle double BOM

Closes #2885

											
										
										
											2022-05-18 01:12:43 +00:00
+								        {
 								            # Webpage contains double BOM
 								            'url': 'https://www.filmarkivet.se/movies/paris-d-moll/',
 								            'md5': 'df02cadc719dcc63d43288366f037754',
 								            'info_dict': {
 								                'id': 'paris-d-moll',
 								                'ext': 'mp4',
 								                'upload_date': '20220518',
 								                'title': 'Paris d-moll',
 								                'description': 'md5:319e37ea5542293db37e1e13072fe330',
 								                'thumbnail': 'https://www.filmarkivet.se/wp-content/uploads/parisdmoll2.jpg',
 								                'timestamp': 1652833414,
 								                'age_limit': 0,
 								            }
-												[extractor/substack] Add extractor (#4011)

Closes #3722
Authored by: elyse0
											
										
										
											2022-06-19 00:08:53 +00:00
+								        },
 								        {
 								            'url': 'https://www.mollymovieclub.com/p/interstellar?s=r#details',
 								            'md5': '198bde8bed23d0b23c70725c83c9b6d9',
 								            'info_dict': {
 								                'id': '53602801',
 								                'ext': 'mpga',
 								                'title': 'Interstellar',
 								                'description': 'Listen now | Episode One',
 								                'thumbnail': 'md5:c30d9c83f738e16d8551d7219d321538',
 								                'uploader': 'Molly Movie Club',
 								                'uploader_id': '839621',
 								            },
 								        },
 								        {
 								            'url': 'https://www.blockedandreported.org/p/episode-117-lets-talk-about-depp?s=r',
 								            'md5': 'c0cc44ee7415daeed13c26e5b56d6aa0',
 								            'info_dict': {
 								                'id': '57962052',
 								                'ext': 'mpga',
 								                'title': 'md5:855b2756f0ee10f6723fa00b16266f8d',
 								                'description': 'md5:fe512a5e94136ad260c80bde00ea4eef',
 								                'thumbnail': 'md5:2218f27dfe517bb5ac16c47d0aebac59',
 								                'uploader': 'Blocked and Reported',
 								                'uploader_id': '500230',
 								            },
 								        },
 								        {
-												[extractor/jwplatform] Look for `data-video-jw-id`

Closes #3821

											
										
										
											2022-06-11 21:55:55 +00:00
+								            'url': 'https://www.skimag.com/video/ski-people-1980/',
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because it's subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2022-08-01 01:23:25 +00:00
+								            'md5': '022a7e31c70620ebec18deeab376ee03',
-												[extractor/jwplatform] Look for `data-video-jw-id`

Closes #3821

											
										
										
											2022-06-11 21:55:55 +00:00
+								            'info_dict': {
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because it's subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2022-08-01 01:23:25 +00:00
+								                'id': 'YTmgRiNU',
 								                'ext': 'mp4',
 								                'title': '1980 Ski People',
 								                'timestamp': 1610407738,
 								                'description': 'md5:cf9c3d101452c91e141f292b19fe4843',
 								                'thumbnail': 'https://cdn.jwplayer.com/v2/media/YTmgRiNU/poster.jpg?width=720',
 								                'duration': 5688.0,
 								                'upload_date': '20210111',
 								            }
-												[extractor/jwplatform] Look for `data-video-jw-id`

Closes #3821

											
										
										
											2022-06-11 21:55:55 +00:00
+								        },
-												[extractor] Handle `json_ld` with multiple `@type`s

Closes: #4022

											
										
										
											2022-06-13 13:09:58 +00:00
+								        {
 								            'note': 'JSON LD with multiple @type',
 								            'url': 'https://www.nu.nl/280161/video/hoe-een-bladvlo-dit-verwoestende-japanse-onkruid-moet-vernietigen.html',
 								            'md5': 'c7949f34f57273013fb7ccb1156393db',
 								            'info_dict': {
 								                'id': 'ipy2AcGL',
 								                'ext': 'mp4',
 								                'description': 'md5:6a9d644bab0dc2dc06849c2505d8383d',
 								                'thumbnail': r're:https://media\.nu\.nl/m/.+\.jpg',
 								                'title': 'Hoe een bladvlo dit verwoestende Japanse onkruid moet vernietigen',
 								                'timestamp': 1586577474,
 								                'upload_date': '20200411',
 								                'age_limit': 0,
 								                'duration': 111.0,
 								            }
 								        },
-												[extractor/common] Fix `json_ld` type checks (#5145)

Closes #5144, #5143
Authored by: Grub4K
											
										
										
											2022-10-09 03:17:58 +00:00
+								        {
 								            'note': 'JSON LD with unexpected data type',
 								            'url': 'https://www.autoweek.nl/autotests/artikel/porsche-911-gt3-rs-rij-impressie-2/',
 								            'info_dict': {
 								                'id': 'porsche-911-gt3-rs-rij-impressie-2',
 								                'ext': 'mp4',
 								                'title': 'Test: Porsche 911 GT3 RS',
 								                'description': 'Je ziet het niet, maar het is er wel. Downforce, hebben we het dan over. En in de nieuwe Porsche 911 GT3 RS is er zelfs heel veel downforce.',
 								                'timestamp': 1664920902,
 								                'upload_date': '20221004',
 								                'thumbnail': r're:^https://media.autoweek.nl/m/.+\.jpg$',
 								                'age_limit': 0,
 								                'direct': True,
 								            }
-												[extractor/generic] Decode unicode-escaped embed URLs (#5919)

Authored by: bashonly
Closes #5854
											
										
										
											2023-01-02 14:06:01 +00:00
+								        },
 								        {
-												[extractor/generic] Use `Accept-Encoding: identity` for initial request

The existing comment seems to imply this was the desired behavior from the beginning.

Partial fix for https://github.com/yt-dlp/yt-dlp/issues/5855, https://github.com/yt-dlp/yt-dlp/issues/5851, https://github.com/yt-dlp/yt-dlp/issues/4748

											
										
										
											2023-01-01 05:40:26 +00:00
+								            'note': 'server returns data in brotli compression by default if `accept-encoding: *` is specified.',
 								            'url': 'https://www.extra.cz/cauky-lidi-70-dil-babis-predstavil-pohadky-prymulanek-nebo-andrejovy-nove-saty-ac867',
 								            'info_dict': {
 								                'id': 'cauky-lidi-70-dil-babis-predstavil-pohadky-prymulanek-nebo-andrejovy-nove-saty-ac867',
 								                'ext': 'mp4',
 								                'title': 'čauky lidi 70 finall',
 								                'description': 'čauky lidi 70 finall',
 								                'thumbnail': 'h',
 								                'upload_date': '20220606',
 								                'timestamp': 1654513791,
 								                'duration': 318.0,
 								                'direct': True,
 								                'age_limit': 0,
-												[extractor/generic] Decode unicode-escaped embed URLs (#5919)

Authored by: bashonly
Closes #5854
											
										
										
											2023-01-02 14:06:01 +00:00
+								            },
 								        },
-												Update to ytdl-commit-195f22f6

[generic] Improve KVS (etc) extraction
https://github.com/ytdl-org/youtube-dl/commit/195f22f679330549882a8234e7234942893a4902

Closes #3716
Authored by: Grub4k, pukkandan
											
										
										
											2023-01-02 13:45:36 +00:00
+								        {
 								            'url': 'https://shooshtime.com/videos/284002/just-out-of-the-shower-joi/',
 								            'md5': 'e2f0a4c329f7986280b7328e24036d60',
 								            'info_dict': {
 								                'id': '284002',
 								                'display_id': 'just-out-of-the-shower-joi',
 								                'ext': 'mp4',
 								                'title': 'Just Out Of The Shower JOI - Shooshtime',
 								                'thumbnail': 'https://i.shoosh.co/contents/videos_screenshots/284000/284002/preview.mp4.jpg',
 								                'height': 720,
 								                'age_limit': 18,
 								            },
 								        },
-												[extractor/generic] Attempt to detect live HLS (#6775)

* Extract duration for non-live generic HLS videos
* Add extractor-arg `is_live` to bypass live HLS check

Closes #6705
Authored by: bashonly
											
										
										
											2023-04-13 19:36:06 +00:00
+								        {
 								            'note': 'Live HLS direct link',
 								            'url': 'https://d18j67ugtrocuq.cloudfront.net/out/v1/2767aec339144787926bd0322f72c6e9/index.m3u8',
 								            'info_dict': {
 								                'id': 'index',
 								                'title': r're:index',
 								                'ext': 'mp4',
 								                'live_status': 'is_live',
 								            },
 								            'params': {
 								                'skip_download': 'm3u8',
 								            },
 								        },
 								        {
 								            'note': 'Video.js VOD HLS',
 								            'url': 'https://gist.githubusercontent.com/bashonly/2aae0862c50f4a4b84f220c315767208/raw/e3380d413749dabbe804c9c2d8fd9a45142475c7/videojs_hls_test.html',
 								            'info_dict': {
 								                'id': 'videojs_hls_test',
 								                'title': 'video',
 								                'ext': 'mp4',
 								                'age_limit': 0,
 								                'duration': 1800,
 								            },
 								            'params': {
 								                'skip_download': 'm3u8',
 								            },
 								        },
-												GenericIE: Detect videos from Brightcove

Brightcove videos info is usually found in an <object class="BrightcoveExperience"></object> node, this is passed to a new method of BrightcoveIE that builds a url to extract the video.

											
										
										
											2013-07-10 15:49:11 +00:00
+								    ]
-												Move GenericIE into its own file

											
										
										
											2013-06-23 18:31:45 +00:00
 								    def report_following_redirect(self, new_url):
 								        """Report information extraction."""
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											2014-01-06 00:47:52 +00:00
+								        self._downloader.to_screen('[redirect] Following redirect to %s' % new_url)
-												Move GenericIE into its own file

											
										
										
											2013-06-23 18:31:45 +00:00
-												[extractor] Framework for embed detection (#4307)

											
										
										
											2022-08-01 01:22:03 +00:00
+								    def report_detected(self, name, num=1, note=None):
 								        if num > 1:
 								            name += 's'
 								        elif not num:
 								            return
 								        else:
 								            num = 'a'
 								        self._downloader.write_debug(f'Identified {num} {name}{format_field(note, None, "; %s")}')
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											2021-11-09 22:49:33 +00:00
-												[extractor/generic] Add extractor-args `hls_key`, `variant_query` (#6567)

Authored by: bashonly
											
										
										
											2023-03-21 23:12:17 +00:00
+								    def _extra_manifest_info(self, info, manifest_url):
-												[extractor/generic] Accept values for `fragment_query`, `variant_query` (#6600)

Closes #6593
Authored by: bashonly
											
										
										
											2023-03-23 16:28:23 +00:00
+								        fragment_query = self._configuration_arg('fragment_query', [None], casesense=True)[0]
 								        if fragment_query is not None:
 								            info['extra_param_to_segment_url'] = (
 								                urllib.parse.urlparse(fragment_query).query or fragment_query
 								                or urllib.parse.urlparse(manifest_url).query or None)
-												[extractor/generic] Add extractor-args `hls_key`, `variant_query` (#6567)

Authored by: bashonly
											
										
										
											2023-03-21 23:12:17 +00:00
 								        hex_or_none = lambda x: x if re.fullmatch(r'(0x)?[\da-f]+', x, re.IGNORECASE) else None
-												[extractor/generic] Accept values for `fragment_query`, `variant_query` (#6600)

Closes #6593
Authored by: bashonly
											
										
										
											2023-03-23 16:28:23 +00:00
+								        info['hls_aes'] = traverse_obj(self._configuration_arg('hls_key', casesense=True), {
-												[extractor/generic] Add extractor-args `hls_key`, `variant_query` (#6567)

Authored by: bashonly
											
										
										
											2023-03-21 23:12:17 +00:00
+								            'uri': (0, {url_or_none}), 'key': (0, {hex_or_none}), 'iv': (1, {hex_or_none}),
 								        }) or None
-												[extractor/generic] Accept values for `fragment_query`, `variant_query` (#6600)

Closes #6593
Authored by: bashonly
											
										
										
											2023-03-23 16:28:23 +00:00
+								        variant_query = self._configuration_arg('variant_query', [None], casesense=True)[0]
 								        if variant_query is not None:
 								            query = urllib.parse.parse_qs(
 								                urllib.parse.urlparse(variant_query).query or variant_query
 								                or urllib.parse.urlparse(manifest_url).query)
-												[extractor/generic] Add extractor-args `hls_key`, `variant_query` (#6567)

Authored by: bashonly
											
										
										
											2023-03-21 23:12:17 +00:00
+								            for fmt in self._downloader._get_formats(info):
 								                fmt['url'] = update_url_query(fmt['url'], query)
-												[extractor/generic] Add `fragment_query` extractor arg for DASH and HLS (#5528)

* `fragment_query`: passthrough any query in generic mpd/m3u8 manifest URLs to their fragments
* Add support for `extra_param_to_segment_url` to DASH downloader
Authored by: bashonly, pukkandan
											
										
										
											2022-11-21 00:51:45 +00:00
-												[extractor/generic] Attempt to detect live HLS (#6775)

* Extract duration for non-live generic HLS videos
* Add extractor-arg `is_live` to bypass live HLS check

Closes #6705
Authored by: bashonly
											
										
										
											2023-04-13 19:36:06 +00:00
+								        # Attempt to detect live HLS or set VOD duration
 								        m3u8_format = next((f for f in self._downloader._get_formats(info)
 								                            if determine_protocol(f) == 'm3u8_native'), None)
 								        if m3u8_format:
 								            is_live = self._configuration_arg('is_live', [None])[0]
 								            if is_live is not None:
 								                info['live_status'] = 'not_live' if is_live == 'false' else 'is_live'
 								                return
 								            headers = m3u8_format.get('http_headers') or info.get('http_headers')
 								            duration = self._extract_m3u8_vod_duration(
 								                m3u8_format['url'], info.get('id'), note='Checking m3u8 live status',
 								                errnote='Failed to download m3u8 media playlist', headers=headers)
 								            if not duration:
 								                info['live_status'] = 'is_live'
 								            info['duration'] = info.get('duration') or duration
-												[generic] Add support for RSS feeds (Fixes #667)

											
										
										
											2014-02-20 12:14:05 +00:00
+								    def _extract_rss(self, url, video_id, doc):
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 12:26:37 +00:00
+								        NS_MAP = {
 								            'itunes': 'http://www.itunes.com/dtds/podcast-1.0.dtd',
 								        }
-												[generic] Parse RSS enclosure URLs (Fixes #5091)

											
										
										
											2015-03-02 14:21:11 +00:00
+								        entries = []
 								        for it in doc.findall('./channel/item'):
-												[generic] Refactor `_extract_rss`

Closes #3738

											
										
										
											2022-05-17 22:44:13 +00:00
+								            next_url = next(
 								                (e.attrib.get('url') for e in it.findall('./enclosure')),
 								                xpath_text(it, 'link', fatal=False))
-												[generic] Parse RSS enclosure URLs (Fixes #5091)

											
										
										
											2015-03-02 14:21:11 +00:00
+								            if not next_url:
 								                continue
-												[generic] Refactor `_extract_rss`

Closes #3738

											
										
										
											2022-05-17 22:44:13 +00:00
+								            guid = try_call(lambda: it.find('guid').text)
 								            if guid:
 								                next_url = smuggle_url(next_url, {'force_videoid': guid})
-												[generic] Set rss `guid` as video id (#2741)

Closes #2424
Authored by: Bricio
											
										
										
											2022-02-11 23:32:58 +00:00
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 12:26:37 +00:00
+								            def itunes(key):
-												[generic] Refactor `_extract_rss`

Closes #3738

											
										
										
											2022-05-17 22:44:13 +00:00
+								                return xpath_text(it, xpath_with_ns(f'./itunes:{key}', NS_MAP), default=None)
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 12:26:37 +00:00
-												[generic] Parse RSS enclosure URLs (Fixes #5091)

											
										
										
											2015-03-02 14:21:11 +00:00
+								            entries.append({
-												[extractor/generic] Extract RSS entries as url_transparent (#11163)

											
										
										
											2017-04-15 17:52:15 +00:00
+								                '_type': 'url_transparent',
-												[generic] Parse RSS enclosure URLs (Fixes #5091)

											
										
										
											2015-03-02 14:21:11 +00:00
+								                'url': next_url,
-												[generic] Refactor `_extract_rss`

Closes #3738

											
										
										
											2022-05-17 22:44:13 +00:00
+								                'title': try_call(lambda: it.find('title').text),
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 12:26:37 +00:00
+								                'description': xpath_text(it, 'description', default=None),
-												[generic] Refactor `_extract_rss`

Closes #3738

											
										
										
											2022-05-17 22:44:13 +00:00
+								                'timestamp': unified_timestamp(xpath_text(it, 'pubDate', default=None)),
 								                'duration': parse_duration(itunes('duration')),
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 12:26:37 +00:00
+								                'thumbnail': url_or_none(xpath_attr(it, xpath_with_ns('./itunes:image', NS_MAP), 'href')),
 								                'episode': itunes('title'),
 								                'episode_number': int_or_none(itunes('episode')),
 								                'season_number': int_or_none(itunes('season')),
-												[generic] Refactor `_extract_rss`

Closes #3738

											
										
										
											2022-05-17 22:44:13 +00:00
+								                'age_limit': {'true': 18, 'yes': 18, 'false': 0, 'no': 0}.get((itunes('explicit') or '').lower()),
-												[generic] Parse RSS enclosure URLs (Fixes #5091)

											
										
										
											2015-03-02 14:21:11 +00:00
+								            })
-												[generic] Add support for RSS feeds (Fixes #667)

											
										
										
											2014-02-20 12:14:05 +00:00
 								        return {
 								            '_type': 'playlist',
 								            'id': url,
-												[generic] Refactor `_extract_rss`

Closes #3738

											
										
										
											2022-05-17 22:44:13 +00:00
+								            'title': try_call(lambda: doc.find('./channel/title').text),
 								            'description': try_call(lambda: doc.find('./channel/description').text),
-												[generic] Add support for RSS feeds (Fixes #667)

											
										
										
											2014-02-20 12:14:05 +00:00
+								            'entries': entries,
 								        }
-												Update to ytdl-commit-195f22f6

[generic] Improve KVS (etc) extraction
https://github.com/ytdl-org/youtube-dl/commit/195f22f679330549882a8234e7234942893a4902

Closes #3716
Authored by: Grub4k, pukkandan
											
										
										
											2023-01-02 13:45:36 +00:00
+								    @classmethod
 								    def _kvs_get_real_url(cls, video_url, license_code):
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											2021-07-29 04:03:01 +00:00
+								        if not video_url.startswith('function/0/'):
 								            return video_url  # not obfuscated
-												Update to ytdl-commit-195f22f6

[generic] Improve KVS (etc) extraction
https://github.com/ytdl-org/youtube-dl/commit/195f22f679330549882a8234e7234942893a4902

Closes #3716
Authored by: Grub4k, pukkandan
											
										
										
											2023-01-02 13:45:36 +00:00
+								        parsed = urllib.parse.urlparse(video_url[len('function/0/'):])
 								        license = cls._kvs_get_license_token(license_code)
 								        urlparts = parsed.path.split('/')
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											2021-07-29 04:03:01 +00:00
-												Update to ytdl-commit-195f22f6

[generic] Improve KVS (etc) extraction
https://github.com/ytdl-org/youtube-dl/commit/195f22f679330549882a8234e7234942893a4902

Closes #3716
Authored by: Grub4k, pukkandan
											
										
										
											2023-01-02 13:45:36 +00:00
+								        HASH_LENGTH = 32
 								        hash = urlparts[3][:HASH_LENGTH]
 								        indices = list(range(HASH_LENGTH))
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											2021-07-29 04:03:01 +00:00
-												Update to ytdl-commit-195f22f6

[generic] Improve KVS (etc) extraction
https://github.com/ytdl-org/youtube-dl/commit/195f22f679330549882a8234e7234942893a4902

Closes #3716
Authored by: Grub4k, pukkandan
											
										
										
											2023-01-02 13:45:36 +00:00
+								        # Swap indices of hash according to the destination calculated from the license token
 								        accum = 0
 								        for src in reversed(range(HASH_LENGTH)):
 								            accum += license[src]
 								            dest = (src + accum) % HASH_LENGTH
 								            indices[src], indices[dest] = indices[dest], indices[src]
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											2021-07-29 04:03:01 +00:00
-												Update to ytdl-commit-195f22f6

[generic] Improve KVS (etc) extraction
https://github.com/ytdl-org/youtube-dl/commit/195f22f679330549882a8234e7234942893a4902

Closes #3716
Authored by: Grub4k, pukkandan
											
										
										
											2023-01-02 13:45:36 +00:00
+								        urlparts[3] = ''.join(hash[index] for index in indices) + urlparts[3][HASH_LENGTH:]
 								        return urllib.parse.urlunparse(parsed._replace(path='/'.join(urlparts)))
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											2021-07-29 04:03:01 +00:00
-												Update to ytdl-commit-195f22f6

[generic] Improve KVS (etc) extraction
https://github.com/ytdl-org/youtube-dl/commit/195f22f679330549882a8234e7234942893a4902

Closes #3716
Authored by: Grub4k, pukkandan
											
										
										
											2023-01-02 13:45:36 +00:00
+								    @staticmethod
 								    def _kvs_get_license_token(license):
 								        license = license.replace('$', '')
 								        license_values = [int(char) for char in license]
 								        modlicense = license.replace('0', '1')
 								        center = len(modlicense) // 2
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											2021-07-29 04:03:01 +00:00
+								        fronthalf = int(modlicense[:center + 1])
 								        backhalf = int(modlicense[center:])
-												Update to ytdl-commit-195f22f6

[generic] Improve KVS (etc) extraction
https://github.com/ytdl-org/youtube-dl/commit/195f22f679330549882a8234e7234942893a4902

Closes #3716
Authored by: Grub4k, pukkandan
											
										
										
											2023-01-02 13:45:36 +00:00
+								        modlicense = str(4 * abs(fronthalf - backhalf))[:center + 1]
 								        return [
 								            (license_values[index + offset] + current) % 10
 								            for index, current in enumerate(map(int, modlicense))
 								            for offset in range(4)
 								        ]
 								    def _extract_kvs(self, url, webpage, video_id):
 								        flashvars = self._search_json(
 								            r'(?s:<script\b[^>]*>.*?var\s+flashvars\s*=)',
 								            webpage, 'flashvars', video_id, transform_source=js_to_json)
 								        # extract the part after the last / as the display_id from the
 								        # canonical URL.
 								        display_id = self._search_regex(
 								            r'(?:<link href="https?://[^"]+/(.+?)/?" rel="canonical"\s*/?>'
 								            r'|<link rel="canonical" href="https?://[^"]+/(.+?)/?"\s*/?>)',
 								            webpage, 'display_id', fatal=False)
 								        title = self._html_search_regex(r'<(?:h1|title)>(?:Video: )?(.+?)</(?:h1|title)>', webpage, 'title')
 								        thumbnail = flashvars['preview_url']
 								        if thumbnail.startswith('//'):
 								            protocol, _, _ = url.partition('/')
 								            thumbnail = protocol + thumbnail
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											2021-07-29 04:03:01 +00:00
-												Update to ytdl-commit-195f22f6

[generic] Improve KVS (etc) extraction
https://github.com/ytdl-org/youtube-dl/commit/195f22f679330549882a8234e7234942893a4902

Closes #3716
Authored by: Grub4k, pukkandan
											
										
										
											2023-01-02 13:45:36 +00:00
+								        url_keys = list(filter(re.compile(r'^video_(?:url|alt_url\d*)$').match, flashvars.keys()))
 								        formats = []
 								        for key in url_keys:
 								            if '/get_file/' not in flashvars[key]:
 								                continue
 								            format_id = flashvars.get(f'{key}_text', key)
 								            formats.append({
 								                'url': urljoin(url, self._kvs_get_real_url(flashvars[key], flashvars['license_code'])),
 								                'format_id': format_id,
 								                'ext': 'mp4',
 								                **(parse_resolution(format_id) or parse_resolution(flashvars[key])),
 								                'http_headers': {'Referer': url},
 								            })
 								            if not formats[-1].get('height'):
 								                formats[-1]['quality'] = 1
 								        return {
 								            'id': flashvars['video_id'],
 								            'display_id': display_id,
 								            'title': title,
-												[ie/generic] Fix KVS thumbnail extraction

Closes #8045
Authored by: bashonly

											
										
										
											2023-09-16 21:20:34 +00:00
+								            'thumbnail': urljoin(url, thumbnail),
-												Update to ytdl-commit-195f22f6

[generic] Improve KVS (etc) extraction
https://github.com/ytdl-org/youtube-dl/commit/195f22f679330549882a8234e7234942893a4902

Closes #3716
Authored by: Grub4k, pukkandan
											
										
										
											2023-01-02 13:45:36 +00:00
+								            'formats': formats,
 								        }
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											2021-07-29 04:03:01 +00:00
-												Move GenericIE into its own file

											
										
										
											2013-06-23 18:31:45 +00:00
+								    def _real_extract(self, url):
-												[generic] Add support for protocol-independent URLs (Fixes #2810)

											
										
										
											2014-04-29 23:46:06 +00:00
+								        if url.startswith('//'):
-												Refactor code to use url_result


											
										
										
											2019-01-01 16:56:05 +00:00
+								            return self.url_result(self.http_scheme() + url)
-												[generic] Add support for protocol-independent URLs (Fixes #2810)

											
										
										
											2014-04-29 23:46:06 +00:00
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 10:54:43 +00:00
+								        parsed_url = urllib.parse.urlparse(url)
-												[generic] If the url doesn't specify the protocol, then try to extract prepending 'http://'

											
										
										
											2013-09-06 16:39:35 +00:00
+								        if not parsed_url.scheme:
-												[extractor] Add `write_debug` and `get_param`

											
										
										
											2021-05-17 12:23:08 +00:00
+								            default_search = self.get_param('default_search')
-												Add new --default-search option (#2193)

											
										
										
											2014-01-22 13:16:43 +00:00
+								            if default_search is None:
-												[generic] Add --default-search fixup_error

This restores the ability to enter URLs without a scheme (and default to http), but still fail if the input is a search term.

											
										
										
											2014-07-29 15:17:43 +00:00
+								                default_search = 'fixup_error'
-												Add new --default-search option (#2193)

											
										
										
											2014-01-22 13:16:43 +00:00
-												[generic] Add --default-search fixup_error

This restores the ability to enter URLs without a scheme (and default to http), but still fail if the input is a search term.

											
										
										
											2014-07-29 15:17:43 +00:00
+								            if default_search in ('auto', 'auto_warning', 'fixup_error'):
-												[extractor/generic] Restrict --default-search schemeless URLs detection pattern (closes #21842)

											
										
										
											2019-07-20 16:08:26 +00:00
+								                if re.match(r'^[^\s/]+\.[^\s/]+/', url):
-												Fix inconsistent use of `report_warning`

											
										
										
											2021-04-16 10:01:10 +00:00
+								                    self.report_warning('The url doesn\'t specify the protocol, trying with http')
-												Add new --default-search option (#2193)

											
										
										
											2014-01-22 13:16:43 +00:00
+								                    return self.url_result('http://' + url)
-												[generic] Add --default-search fixup_error

This restores the ability to enter URLs without a scheme (and default to http), but still fail if the input is a search term.

											
										
										
											2014-07-29 15:17:43 +00:00
+								                elif default_search != 'fixup_error':
-												[generic] Warn before fallback to automatic search

											
										
										
											2014-03-30 13:57:31 +00:00
+								                    if default_search == 'auto_warning':
-												[generic] Abort if user passes in URL "url" (#2942)

											
										
										
											2014-05-19 15:10:11 +00:00
+								                        if re.match(r'^(?:url|URL)$', url):
 								                            raise ExtractorError(
-												Completely change project name to yt-dlp (#85)

* All modules and binary names are changed
* All documentation references changed
* yt-dlp no longer loads youtube-dlc config files
* All URLs changed to point to organization account

Co-authored-by: Pccode66
Co-authored-by: pukkandan
											
										
										
											2021-02-24 18:45:56 +00:00
+								                                'Invalid URL:  %r . Call yt-dlp like this:  yt-dlp -v "https://www.youtube.com/watch?v=BaW_jenozKc"  ' % url,
-												[generic] Abort if user passes in URL "url" (#2942)

											
										
										
											2014-05-19 15:10:11 +00:00
+								                                expected=True)
 								                        else:
-												Fix inconsistent use of `report_warning`

											
										
										
											2021-04-16 10:01:10 +00:00
+								                            self.report_warning(
-												[generic] Set default-search to error

This prevents users from submitting bug reports where they mistyped a URL, and prevents me from getting a weird video when holding shift and thus searching for :Tds

											
										
										
											2014-07-06 09:22:44 +00:00
+								                                'Falling back to youtube search for  %s . Set --default-search "auto" to suppress this warning.' % url)
-												Add new --default-search option (#2193)

											
										
										
											2014-01-22 13:16:43 +00:00
+								                    return self.url_result('ytsearch:' + url)
-												[generic] Add --default-search fixup_error

This restores the ability to enter URLs without a scheme (and default to http), but still fail if the input is a search term.

											
										
										
											2014-07-29 15:17:43 +00:00
 								            if default_search in ('error', 'fixup_error'):
-												[generic] Set default-search to error

This prevents users from submitting bug reports where they mistyped a URL, and prevents me from getting a weird video when holding shift and thus searching for :Tds

											
										
										
											2014-07-06 09:22:44 +00:00
+								                raise ExtractorError(
-												Fix all PEP8 issues except E501

											
										
										
											2014-11-23 21:21:46 +00:00
+								                    '%r is not a valid URL. '
-												Completely change project name to yt-dlp (#85)

* All modules and binary names are changed
* All documentation references changed
* yt-dlp no longer loads youtube-dlc config files
* All URLs changed to point to organization account

Co-authored-by: Pccode66
Co-authored-by: pukkandan
											
										
										
											2021-02-24 18:45:56 +00:00
+								                    'Set --default-search "ytsearch" (or run  yt-dlp "ytsearch:%s" ) to search YouTube'
-												Fix all PEP8 issues except E501

											
										
										
											2014-11-23 21:21:46 +00:00
+								                    % (url, url), expected=True)
-												Add new --default-search option (#2193)

											
										
										
											2014-01-22 13:16:43 +00:00
+								            else:
-												[generic] Allow --default-search without colon

											
										
										
											2014-10-23 19:13:45 +00:00
+								                if ':' not in default_search:
 								                    default_search += ':'
-												Add new --default-search option (#2193)

											
										
										
											2014-01-22 13:16:43 +00:00
+								                return self.url_result(default_search + url)
-												[ministrygrid] Add extractor (Fixes #2900)

											
										
										
											2014-08-24 02:47:18 +00:00
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2022-10-09 10:39:36 +00:00
+								        original_url = url
-												[extractor/generic] Pass through referer from json-ld

Closes #4941

											
										
										
											2022-09-16 17:35:49 +00:00
+								        url, smuggled_data = unsmuggle_url(url, {})
-												[ministrygrid] Add extractor (Fixes #2900)

											
										
										
											2014-08-24 02:47:18 +00:00
+								        force_videoid = None
-												[docs] Misc improvements

Closes #4987, Closes #4906, Closes #4919, Closes #4977, Closes #4979

											
										
										
											2022-09-21 20:07:44 +00:00
+								        is_intentional = smuggled_data.get('to_generic')
 								        if 'force_videoid' in smuggled_data:
-												[ministrygrid] Add extractor (Fixes #2900)

											
										
										
											2014-08-24 02:47:18 +00:00
+								            force_videoid = smuggled_data['force_videoid']
 								            video_id = force_videoid
 								        else:
-												[generic,commonprotocols] Move mms support from GenericIE

And use _generic_* helpers in those extractors

											
										
										
											2016-10-07 11:22:30 +00:00
+								            video_id = self._generic_id(url)
-												[generic] Support direct MMS links (closes #10838)

											
										
										
											2016-10-07 09:50:45 +00:00
-												[extractor/generic] Remove HEAD request

											
										
										
											2022-07-07 06:30:23 +00:00
+								        # Some webservers may serve compressed content of rather big size (e.g. gzipped flac)
 								        # making it impossible to download only chunk of the file (yet we need only 512kB to
 								        # test whether it's HTML or not). According to yt-dlp default Accept-Encoding
 								        # that will always result in downloading the whole file that is not desirable.
 								        # Therefore for extraction pass we have to override Accept-Encoding to any in order
 								        # to accept raw bytes and being able to download only a chunk.
 								        # It may probably better to solve this by checking Content-Type for application/octet-stream
 								        # after a HEAD request, but not sure if we can rely on this.
-												[ie] Do not smuggle `http_headers`

See: https://github.com/yt-dlp/yt-dlp/security/advisories/GHSA-3ch3-jhc6-5r8x

Authored by: coletdjnz

											
										
										
											2023-08-16 23:42:48 +00:00
+								        full_response = self._request_webpage(url, video_id, headers=filter_dict({
-												[extractor/generic] Use `Accept-Encoding: identity` for initial request

The existing comment seems to imply this was the desired behavior from the beginning.

Partial fix for https://github.com/yt-dlp/yt-dlp/issues/5855, https://github.com/yt-dlp/yt-dlp/issues/5851, https://github.com/yt-dlp/yt-dlp/issues/4748

											
										
										
											2023-01-01 05:40:26 +00:00
+								            'Accept-Encoding': 'identity',
-												[ie] Do not smuggle `http_headers`

See: https://github.com/yt-dlp/yt-dlp/security/advisories/GHSA-3ch3-jhc6-5r8x

Authored by: coletdjnz

											
										
										
											2023-08-16 23:42:48 +00:00
+								            'Referer': smuggled_data.get('referer'),
 								        }))
-												[compat, networking] Deprecate old functions (#2861)

Authored by: coletdjnz, pukkandan

											
										
										
											2023-07-09 07:53:02 +00:00
+								        new_url = full_response.url
-												[extractor/generic] Handle basic-auth when checking redirects

Closes #6352

											
										
										
											2023-02-26 04:57:04 +00:00
+								        if new_url != extract_basic_auth(url)[0]:
-												[extractor/generic] Remove HEAD request

											
										
										
											2022-07-07 06:30:23 +00:00
+								            self.report_following_redirect(new_url)
 								            if force_videoid:
 								                new_url = smuggle_url(new_url, {'force_videoid': force_videoid})
 								            return self.url_result(new_url)
-												[generic] Handle audio streams that do not implement HEAD (Fixes #4032)

											
										
										
											2014-10-26 16:05:44 +00:00
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											2016-03-12 21:17:25 +00:00
+								        info_dict = {
 								            'id': video_id,
-												[generic,commonprotocols] Move mms support from GenericIE

And use _generic_* helpers in those extractors

											
										
										
											2016-10-07 11:22:30 +00:00
+								            'title': self._generic_title(url),
-												[extractor/generic] Remove HEAD request

											
										
										
											2022-07-07 06:30:23 +00:00
+								            'timestamp': unified_timestamp(full_response.headers.get('Last-Modified'))
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											2016-03-12 21:17:25 +00:00
+								        }
-												[generic] Handle audio streams that do not implement HEAD (Fixes #4032)

											
										
										
											2014-10-26 16:05:44 +00:00
+								        # Check for direct link to a video
-												[extractor/generic] Remove HEAD request

											
										
										
											2022-07-07 06:30:23 +00:00
+								        content_type = full_response.headers.get('Content-Type', '').lower()
-												[extractor/generic] Properly extract format id from Content-Type

Fixes extraction for cases like: audio/x-mpegURL; charset=utf-8

											
										
										
											2016-03-18 15:50:10 +00:00
+								        m = re.match(r'^(?P<type>audio|video|application(?=/(?:ogg$|(?:vnd\.apple\.|x-)?mpegurl)))/(?P<format_id>[^;\s]+)', content_type)
-												[generic] Handle audio streams that do not implement HEAD (Fixes #4032)

											
										
										
											2014-10-26 16:05:44 +00:00
+								        if m:
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											2021-11-09 22:49:33 +00:00
+								            self.report_detected('direct video link')
-												[ie] Do not smuggle `http_headers`

See: https://github.com/yt-dlp/yt-dlp/security/advisories/GHSA-3ch3-jhc6-5r8x

Authored by: coletdjnz

											
										
										
											2023-08-16 23:42:48 +00:00
+								            headers = filter_dict({'Referer': smuggled_data.get('referer')})
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 10:54:43 +00:00
+								            format_id = str(m.group('format_id'))
-												[ie/generic] Improve direct video link ext detection (#8340)

Closes #8265
Authored by: bashonly
											
										
										
											2023-10-28 00:35:37 +00:00
+								            ext = determine_ext(url, default_ext=None) or urlhandle_detect_ext(full_response)
-												[generic] Extract subtitles from direct HLS manifest links

											
										
										
											2021-04-15 08:15:43 +00:00
+								            subtitles = {}
-												[extractor/generic] Detect manifest links via extension

Authored by: bashonly

											
										
										
											2023-03-01 12:38:02 +00:00
+								            if format_id.endswith('mpegurl') or ext == 'm3u8':
-												[extractor/generic] Pass through referer from json-ld

Closes #4941

											
										
										
											2022-09-16 17:35:49 +00:00
+								                formats, subtitles = self._extract_m3u8_formats_and_subtitles(url, video_id, 'mp4', headers=headers)
-												[extractor/generic] Detect manifest links via extension

Authored by: bashonly

											
										
										
											2023-03-01 12:38:02 +00:00
+								            elif format_id.endswith('mpd') or format_id.endswith('dash+xml') or ext == 'mpd':
-												[extractor/generic] Pass through referer from json-ld

Closes #4941

											
										
										
											2022-09-16 17:35:49 +00:00
+								                formats, subtitles = self._extract_mpd_formats_and_subtitles(url, video_id, headers=headers)
-												[extractor/generic] Detect manifest links via extension

Authored by: bashonly

											
										
										
											2023-03-01 12:38:02 +00:00
+								            elif format_id == 'f4m' or ext == 'f4m':
-												[extractor/generic] Pass through referer from json-ld

Closes #4941

											
										
										
											2022-09-16 17:35:49 +00:00
+								                formats = self._extract_f4m_formats(url, video_id, headers=headers)
-												[generic] extract m3u8 formats when mpegurl content type detected

											
										
										
											2016-02-04 00:25:36 +00:00
+								            else:
 								                formats = [{
-												[extractor/generic] Ensure format id is unicode string

											
										
										
											2017-06-10 16:55:05 +00:00
+								                    'format_id': format_id,
-												[generic] extract m3u8 formats when mpegurl content type detected

											
										
										
											2016-02-04 00:25:36 +00:00
+								                    'url': url,
-												[ie/generic] Improve direct video link ext detection (#8340)

Closes #8265
Authored by: bashonly
											
										
										
											2023-10-28 00:35:37 +00:00
+								                    'ext': ext,
-												[generic] extract m3u8 formats when mpegurl content type detected

											
										
										
											2016-02-04 00:25:36 +00:00
+								                    'vcodec': 'none' if m.group('type') == 'audio' else None
 								                }]
-												[extractor/generic] Fix direct link semantics

											
										
										
											2016-03-18 16:43:07 +00:00
+								                info_dict['direct'] = True
-												[extractor/generic] Pass through referer from json-ld

Closes #4941

											
										
										
											2022-09-16 17:35:49 +00:00
+								            info_dict.update({
 								                'formats': formats,
 								                'subtitles': subtitles,
-												[downloader/ffmpeg] Fix headers for video+audio formats (#5659)

Authored by: bashonly, Grub4K
											
										
										
											2022-12-09 23:36:38 +00:00
+								                'http_headers': headers or None,
-												[extractor/generic] Pass through referer from json-ld

Closes #4941

											
										
										
											2022-09-16 17:35:49 +00:00
+								            })
-												[extractor/generic] Add extractor-args `hls_key`, `variant_query` (#6567)

Authored by: bashonly
											
										
										
											2023-03-21 23:12:17 +00:00
+								            self._extra_manifest_info(info_dict, url)
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											2016-03-12 21:17:25 +00:00
+								            return info_dict
-												Add support for direct links to a video (#1973)

											
										
										
											2013-12-17 11:33:55 +00:00
-												[extractor] Add `write_debug` and `get_param`

											
										
										
											2021-05-17 12:23:08 +00:00
+								        if not self.get_param('test', False) and not is_intentional:
 								            force = self.get_param('force_generic_extractor', False)
-												[extractor] Framework for embed detection (#4307)

											
										
										
											2022-08-01 01:22:03 +00:00
+								            self.report_warning('%s generic information extractor' % ('Forcing' if force else 'Falling back on'))
-												[vimeo:likes] Add new extractor (Fixes #3835)

											
										
										
											2014-09-28 10:14:16 +00:00
-												[extractor/generic] Detect m3u playlists served without proper Content-Type

											
										
										
											2016-03-18 16:45:28 +00:00
+								        first_bytes = full_response.read(512)
 								        # Is it an M3U playlist?
-												[extractor/generic] Fix missing byte literal prefix

											
										
										
											2016-03-18 23:43:43 +00:00
+								        if first_bytes.startswith(b'#EXTM3U'):
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											2021-11-09 22:49:33 +00:00
+								            self.report_detected('M3U playlist')
-												[generic] Extract previously missed subtitles (#515)

* [generic] Extract subtitles in cases missed previously
* [common] Detect discarded subtitles in SMIL manifests
* [generic] Extract everything in the SMIL manifest

Authored by: fstirlitz 
											
										
										
											2021-07-16 14:22:56 +00:00
+								            info_dict['formats'], info_dict['subtitles'] = self._extract_m3u8_formats_and_subtitles(url, video_id, 'mp4')
-												[extractor/generic] Add extractor-args `hls_key`, `variant_query` (#6567)

Authored by: bashonly
											
										
										
											2023-03-21 23:12:17 +00:00
+								            self._extra_manifest_info(info_dict, url)
-												[extractor/generic] Detect m3u playlists served without proper Content-Type

											
										
										
											2016-03-18 16:45:28 +00:00
+								            return info_dict
-												[generic] Detect direct video links (Fixes #4149, #4313)

											
										
										
											2014-11-26 09:44:39 +00:00
+								        # Maybe it's a direct link to a video?
 								        # Be careful not to download the whole thing!
-												[generic] Add support for BOMs (Fixes #4753)

											
										
										
											2015-01-23 00:21:30 +00:00
+								        if not is_html(first_bytes):
-												Fix inconsistent use of `report_warning`

											
										
										
											2021-04-16 10:01:10 +00:00
+								            self.report_warning(
-												[generic] Detect direct video links (Fixes #4149, #4313)

											
										
										
											2014-11-26 09:44:39 +00:00
+								                'URL could be a direct video link, returning it as such.')
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											2016-03-12 21:17:25 +00:00
+								            info_dict.update({
-												[generic] Detect direct video links (Fixes #4149, #4313)

											
										
										
											2014-11-26 09:44:39 +00:00
+								                'direct': True,
 								                'url': url,
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											2016-03-12 21:17:25 +00:00
+								            })
 								            return info_dict
-												[generic] Detect direct video links (Fixes #4149, #4313)

											
										
										
											2014-11-26 09:44:39 +00:00
 								        webpage = self._webpage_read_content(
 								            full_response, url, video_id, prefix=first_bytes)
-												Update to ytdl-2021.02.04.1 except youtube

											
										
										
											2021-02-04 07:56:01 +00:00
+								        if '<title>DPG Media Privacy Gate</title>' in webpage:
 								            webpage = self._download_webpage(url, video_id)
-												Move GenericIE into its own file

											
										
										
											2013-06-23 18:31:45 +00:00
+								        self.report_extraction(video_id)
-												Support multiple embedded YouTube URLs (Fixes #1787)

											
										
										
											2013-11-18 12:28:26 +00:00
-												[extractor/generic] Detect DASH manifests and extract mpd formats

											
										
										
											2016-02-06 13:35:32 +00:00
+								        # Is it an RSS feed, a SMIL file, an XSPF playlist or a MPD manifest?
-												[generic] Add support for RSS feeds (Fixes #667)

											
										
										
											2014-02-20 12:14:05 +00:00
+								        try:
-												[generic] Respect the encoding in manifest

											
										
										
											2021-05-11 07:29:45 +00:00
+								            try:
 								                doc = compat_etree_fromstring(webpage)
-												[cleanup] Mark some compat variables for removal (#2173)

Authored by fstirlitz, pukkandan

											
										
										
											2022-04-11 20:09:26 +00:00
+								            except xml.etree.ElementTree.ParseError:
-												[generic] Respect the encoding in manifest

											
										
										
											2021-05-11 07:29:45 +00:00
+								                doc = compat_etree_fromstring(webpage.encode('utf-8'))
-												[generic] Add support for RSS feeds (Fixes #667)

											
										
										
											2014-02-20 12:14:05 +00:00
+								            if doc.tag == 'rss':
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											2021-11-09 22:49:33 +00:00
+								                self.report_detected('RSS feed')
-												[generic] Add support for RSS feeds (Fixes #667)

											
										
										
											2014-02-20 12:14:05 +00:00
+								                return self._extract_rss(url, video_id, doc)
-												[extractor/generic] Add support for ISM manifests

											
										
										
											2016-11-01 20:01:13 +00:00
+								            elif doc.tag == 'SmoothStreamingMedia':
-												[generic] Extract subtitles from direct SSTR manifest links

											
										
										
											2021-04-18 12:26:32 +00:00
+								                info_dict['formats'], info_dict['subtitles'] = self._parse_ism_formats_and_subtitles(doc, url)
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											2021-11-09 22:49:33 +00:00
+								                self.report_detected('ISM manifest')
-												[extractor/generic] Add support for ISM manifests

											
										
										
											2016-11-01 20:01:13 +00:00
+								                return info_dict
-												[extractor/generic] Improve generic SMIL detection

											
										
										
											2015-08-01 19:13:59 +00:00
+								            elif re.match(r'^(?:{[^}]+})?smil$', doc.tag):
-												Remove _sort_formats from _extract_*_formats methods

Now _sort_formats should be called explicitly.
_sort_formats has been added to all the necessary places in code.

Closes #8051

											
										
										
											2016-03-27 01:03:08 +00:00
+								                smil = self._parse_smil(doc, url, video_id)
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											2021-11-09 22:49:33 +00:00
+								                self.report_detected('SMIL file')
-												Remove _sort_formats from _extract_*_formats methods

Now _sort_formats should be called explicitly.
_sort_formats has been added to all the necessary places in code.

Closes #8051

											
										
										
											2016-03-27 01:03:08 +00:00
+								                return smil
-												[extractor/generic] Add support for xspf playlists

											
										
										
											2015-08-09 13:43:42 +00:00
+								            elif doc.tag == '{http://xspf.org/ns/0/}playlist':
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											2021-11-09 22:49:33 +00:00
+								                self.report_detected('XSPF playlist')
-												[extractor/generic] Support relative URIs in _parse_xspf

<location> can have relative URIs, not just absolute.

											
										
										
											2018-03-07 21:31:53 +00:00
+								                return self.playlist_result(
-												Generalize XML manifest processing code and improve XSPF parsing (closes #15794)

											
										
										
											2018-03-17 19:46:50 +00:00
+								                    self._parse_xspf(
 								                        doc, video_id, xspf_url=url,
-												[compat, networking] Deprecate old functions (#2861)

Authored by: coletdjnz, pukkandan

											
										
										
											2023-07-09 07:53:02 +00:00
+								                        xspf_base_url=full_response.url),
-												[extractor/generic] Support relative URIs in _parse_xspf

<location> can have relative URIs, not just absolute.

											
										
										
											2018-03-07 21:31:53 +00:00
+								                    video_id)
-												[extractor/generic] Detect DASH manifests and extract mpd formats

											
										
										
											2016-02-06 13:35:32 +00:00
+								            elif re.match(r'(?i)^(?:{[^}]+})?MPD$', doc.tag):
-												[generic] Extract subtitles from direct DASH manifest links

											
										
										
											2021-04-18 06:41:28 +00:00
+								                info_dict['formats'], info_dict['subtitles'] = self._parse_mpd_formats_and_subtitles(
-												[extractor/generic] Fix typo (closes #14902)
Don't pass video_id as mpd_id

											
										
										
											2017-12-05 16:11:15 +00:00
+								                    doc,
-												[compat, networking] Deprecate old functions (#2861)

Authored by: coletdjnz, pukkandan

											
										
										
											2023-07-09 07:53:02 +00:00
+								                    mpd_base_url=full_response.url.rpartition('/')[0],
-												Refactor fragments interface and dash segments downloader
- Eliminate segment_urls and initialization_url
+ Introduce manifest_url (manifest may contain unfragmented data in this case url will be used for direct media URL and manifest_url for manifest itself correspondingly)
* Rewrite dashsegments downloader to use fragments data
* Improve generic mpd extraction

											
										
										
											2016-09-17 13:35:22 +00:00
+								                    mpd_url=url)
-												[extractor/generic] Add extractor-args `hls_key`, `variant_query` (#6567)

Authored by: bashonly
											
										
										
											2023-03-21 23:12:17 +00:00
+								                self._extra_manifest_info(info_dict, url)
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											2021-11-09 22:49:33 +00:00
+								                self.report_detected('DASH manifest')
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											2016-03-12 21:17:25 +00:00
+								                return info_dict
 								            elif re.match(r'^{http://ns\.adobe\.com/f4m/[12]\.0}manifest$', doc.tag):
 								                info_dict['formats'] = self._parse_f4m_formats(doc, url, video_id)
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											2021-11-09 22:49:33 +00:00
+								                self.report_detected('F4M manifest')
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											2016-03-12 21:17:25 +00:00
+								                return info_dict
-												[cleanup] Mark some compat variables for removal (#2173)

Authored by fstirlitz, pukkandan

											
										
										
											2022-04-11 20:09:26 +00:00
+								        except xml.etree.ElementTree.ParseError:
-												[generic] Add support for RSS feeds (Fixes #667)

											
										
										
											2014-02-20 12:14:05 +00:00
+								            pass
-												[extractor] Framework for embed detection (#4307)

											
										
										
											2022-08-01 01:22:03 +00:00
+								        info_dict.update({
 								            # it's tempting to parse this further, but you would
 								            # have to take into account all the variations like
 								            #   Video Title - Site Name
 								            #   Site Name | Video Title
 								            #   Video Title - Tagline | Site Name
 								            # and so on and so forth; it's just not practical
-												[extractor] Improve `_generic_title`

											
										
										
											2022-10-31 12:05:20 +00:00
+								            'title': self._generic_title('', webpage, default='video'),
-												[extractor] Framework for embed detection (#4307)

											
										
										
											2022-08-01 01:22:03 +00:00
+								            'description': self._og_search_description(webpage, default=None),
 								            'thumbnail': self._og_search_thumbnail(webpage, default=None),
 								            'age_limit': self._rta_search(webpage),
 								        })
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2022-10-09 10:39:36 +00:00
+								        self._downloader.write_debug('Looking for embeds')
 								        embeds = list(self._extract_embeds(original_url, webpage, urlh=full_response, info_dict=info_dict))
 								        if len(embeds) == 1:
-												[ie/generic] Fix generic title for embeds

Closes #7067

											
										
										
											2023-07-22 02:24:25 +00:00
+								            return merge_dicts(embeds[0], info_dict)
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2022-10-09 10:39:36 +00:00
+								        elif embeds:
 								            return self.playlist_result(embeds, **info_dict)
 								        raise UnsupportedError(url)
 								    def _extract_embeds(self, url, webpage, *, urlh=None, info_dict={}):
 								        """Returns an iterator of video entries"""
 								        info_dict = types.MappingProxyType(info_dict)  # Prevents accidental mutation
 								        video_id = traverse_obj(info_dict, 'display_id', 'id') or self._generic_id(url)
 								        url, smuggled_data = unsmuggle_url(url, {})
-												[compat, networking] Deprecate old functions (#2861)

Authored by: coletdjnz, pukkandan

											
										
										
											2023-07-09 07:53:02 +00:00
+								        actual_url = urlh.url if urlh else url
-												[extractor] Framework for embed detection (#4307)

											
										
										
											2022-08-01 01:22:03 +00:00
-												[generic] Add comment for unescaping webpage contents

											
										
										
											2014-03-14 21:38:49 +00:00
+								        # Sometimes embedded video player is hidden behind percent encoding
-												Start moving to ytdl-org

											
										
										
											2019-03-09 12:14:41 +00:00
+								        # (e.g. https://github.com/ytdl-org/youtube-dl/issues/2448)
-												[generic] Add comment for unescaping webpage contents

											
										
										
											2014-03-14 21:38:49 +00:00
+								        # Unescaping the whole page allows to handle those cases in a generic way
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 12:26:37 +00:00
+								        # FIXME: unescaping the whole page may break URLs, commenting out for now.
 								        # There probably should be a second run of generic extractor on unescaped webpage.
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 10:54:43 +00:00
+								        # webpage = urllib.parse.unquote(webpage)
-												[generic] Unescape webpage contents
											
										
										
											2014-02-24 16:44:31 +00:00
-												[extractor] Framework for embed detection (#4307)

											
										
										
											2022-08-01 01:22:03 +00:00
+								        embeds = []
-												Fix bug in fe7866d0ed6bfa3904ce12b049a3424fdc0ea1fa

											
										
										
											2022-08-24 02:50:52 +00:00
+								        for ie in self._downloader._ies.values():
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2022-10-09 10:39:36 +00:00
+								            if ie.ie_key() in smuggled_data.get('block_ies', []):
 								                continue
-												[extractor] Framework for embed detection (#4307)

											
										
										
											2022-08-01 01:22:03 +00:00
+								            gen = ie.extract_from_webpage(self._downloader, url, webpage)
 								            current_embeds = []
 								            try:
 								                while True:
 								                    current_embeds.append(next(gen))
 								            except self.StopExtraction:
 								                self.report_detected(f'{ie.IE_NAME} exclusive embed', len(current_embeds),
 								                                     embeds and 'discarding other embeds')
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2022-10-09 10:39:36 +00:00
+								                return current_embeds
-												[extractor] Framework for embed detection (#4307)

											
										
										
											2022-08-01 01:22:03 +00:00
+								            except StopIteration:
 								                self.report_detected(f'{ie.IE_NAME} embed', len(current_embeds))
 								                embeds.extend(current_embeds)
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2022-10-09 10:39:36 +00:00
+								        if embeds:
 								            return embeds
-												[tiktok] Detect embeds

Closes #3799

											
										
										
											2022-05-20 00:31:08 +00:00
-												_find_jwplayer_data() returns dict or None

This simplifies code for callers of `_find_jwplayer_data()` which no longer have
to run `_parse_json()` on the return value.

It also makes sure that `_find_jwplayer_data()` returns either a `dict` or
`None` and nothing else.

											
										
										
											2017-03-25 18:38:30 +00:00
+								        jwplayer_data = self._find_jwplayer_data(
 								            webpage, video_id, transform_source=js_to_json)
 								        if jwplayer_data:
-												[generic] parse jwplayer with only the json URL
Closes #1476

											
										
										
											2021-10-29 20:23:28 +00:00
+								            if isinstance(jwplayer_data.get('playlist'), str):
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											2021-11-09 22:49:33 +00:00
+								                self.report_detected('JW Player playlist')
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2022-10-09 10:39:36 +00:00
+								                return [self.url_result(jwplayer_data['playlist'], 'JWPlatform')]
-												[generic] Skip unsuccessful jwplayer extraction (closes #16735)

											
										
										
											2018-06-14 15:12:33 +00:00
+								            try:
 								                info = self._parse_jwplayer_data(
 								                    jwplayer_data, video_id, require_title=False, base_url=url)
-												[extractor/generic] Don't return JW player without formats

Closes #4765

											
										
										
											2022-08-27 00:50:48 +00:00
+								                if traverse_obj(info, 'formats', ('entries', ..., 'formats')):
 								                    self.report_detected('JW Player data')
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2022-10-09 10:39:36 +00:00
+								                    return [info]
-												[generic] Skip unsuccessful jwplayer extraction (closes #16735)

											
										
										
											2018-06-14 15:12:33 +00:00
+								            except ExtractorError:
-												Start moving to ytdl-org

											
										
										
											2019-03-09 12:14:41 +00:00
+								                # See https://github.com/ytdl-org/youtube-dl/pull/16735
-												[generic] Skip unsuccessful jwplayer extraction (closes #16735)

											
										
										
											2018-06-14 15:12:33 +00:00
+								                pass
-												[generic] Try parsing JWPlayer embedded videos (closes #12030)

											
										
										
											2017-02-16 15:42:36 +00:00
-												[generic] Add support for Video.js embeds

											
										
										
											2017-09-27 17:29:42 +00:00
+								        # Video.js embed
 								        mobj = re.search(
-												[generic] Extract subtitles from video.js (#3156)

Authored by: Lesmiscore 
											
										
										
											2022-03-23 06:28:53 +00:00
+								            r'(?s)\bvideojs\s*\(.+?([a-zA-Z0-9_$]+)\.src\s*\(\s*((?:\[.+?\]|{.+?}))\s*\)\s*;',
-												[generic] Add support for Video.js embeds

											
										
										
											2017-09-27 17:29:42 +00:00
+								            webpage)
 								        if mobj is not None:
-												[generic] Extract subtitles from video.js (#3156)

Authored by: Lesmiscore 
											
										
										
											2022-03-23 06:28:53 +00:00
+								            varname = mobj.group(1)
-												[cleanup] Misc

Closes #5162

											
										
										
											2022-10-18 17:58:57 +00:00
+								            sources = variadic(self._parse_json(
 								                mobj.group(2), video_id, transform_source=js_to_json, fatal=False) or [])
-												[extractor/generic] Attempt to detect live HLS (#6775)

* Extract duration for non-live generic HLS videos
* Add extractor-arg `is_live` to bypass live HLS check

Closes #6705
Authored by: bashonly
											
										
										
											2023-04-13 19:36:06 +00:00
+								            formats, subtitles, src = [], {}, None
-												[generic] Add support for Video.js embeds

											
										
										
											2017-09-27 17:29:42 +00:00
+								            for source in sources:
-												[generic] Allow relative src for videojs embeds (closes #17324)

											
										
										
											2018-08-24 16:12:53 +00:00
+								                src = source.get('src')
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 10:54:43 +00:00
+								                if not src or not isinstance(src, str):
-												[generic] Add support for Video.js embeds

											
										
										
											2017-09-27 17:29:42 +00:00
+								                    continue
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 10:54:43 +00:00
+								                src = urllib.parse.urljoin(url, src)
-												[generic] Add support for Video.js embeds

											
										
										
											2017-09-27 17:29:42 +00:00
+								                src_type = source.get('type')
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 10:54:43 +00:00
+								                if isinstance(src_type, str):
-												[generic] Add support for Video.js embeds

											
										
										
											2017-09-27 17:29:42 +00:00
+								                    src_type = src_type.lower()
 								                ext = determine_ext(src).lower()
 								                if src_type == 'video/youtube':
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2022-10-09 10:39:36 +00:00
+								                    return [self.url_result(src, YoutubeIE.ie_key())]
-												[generic] Add support for Video.js embeds

											
										
										
											2017-09-27 17:29:42 +00:00
+								                if src_type == 'application/dash+xml' or ext == 'mpd':
-												[generic] Extract previously missed subtitles (#515)

* [generic] Extract subtitles in cases missed previously
* [common] Detect discarded subtitles in SMIL manifests
* [generic] Extract everything in the SMIL manifest

Authored by: fstirlitz 
											
										
										
											2021-07-16 14:22:56 +00:00
+								                    fmts, subs = self._extract_mpd_formats_and_subtitles(
 								                        src, video_id, mpd_id='dash', fatal=False)
 								                    formats.extend(fmts)
 								                    self._merge_subtitles(subs, target=subtitles)
-												[generic] Add support for Video.js embeds

											
										
										
											2017-09-27 17:29:42 +00:00
+								                elif src_type == 'application/x-mpegurl' or ext == 'm3u8':
-												[generic] Extract previously missed subtitles (#515)

* [generic] Extract subtitles in cases missed previously
* [common] Detect discarded subtitles in SMIL manifests
* [generic] Extract everything in the SMIL manifest

Authored by: fstirlitz 
											
										
										
											2021-07-16 14:22:56 +00:00
+								                    fmts, subs = self._extract_m3u8_formats_and_subtitles(
-												[generic] Add support for Video.js embeds

											
										
										
											2017-09-27 17:29:42 +00:00
+								                        src, video_id, 'mp4', entry_protocol='m3u8_native',
-												[generic] Extract previously missed subtitles (#515)

* [generic] Extract subtitles in cases missed previously
* [common] Detect discarded subtitles in SMIL manifests
* [generic] Extract everything in the SMIL manifest

Authored by: fstirlitz 
											
										
										
											2021-07-16 14:22:56 +00:00
+								                        m3u8_id='hls', fatal=False)
 								                    formats.extend(fmts)
 								                    self._merge_subtitles(subs, target=subtitles)
-												[extractor/generic] Add `fragment_query` extractor arg for DASH and HLS (#5528)

* `fragment_query`: passthrough any query in generic mpd/m3u8 manifest URLs to their fragments
* Add support for `extra_param_to_segment_url` to DASH downloader
Authored by: bashonly, pukkandan
											
										
										
											2022-11-21 00:51:45 +00:00
 								                if not formats:
-												[generic] Add support for Video.js embeds

											
										
										
											2017-09-27 17:29:42 +00:00
+								                    formats.append({
 								                        'url': src,
-												Fix W504 and disable W503 (closes #20863)

											
										
										
											2019-05-10 20:56:22 +00:00
+								                        'ext': (mimetype2ext(src_type)
 								                                or ext if ext in KNOWN_EXTENSIONS else 'mp4'),
-												Update to ytdl-commit-dfbbe29

[redbulltv] fix embed data extraction
https://github.com/ytdl-org/youtube-dl/commit/dfbbe2902fc67f0f93ee47a8077c148055c67a9b

											
										
										
											2021-05-20 15:38:49 +00:00
+								                        'http_headers': {
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2022-10-09 10:39:36 +00:00
+								                            'Referer': actual_url,
-												Update to ytdl-commit-dfbbe29

[redbulltv] fix embed data extraction
https://github.com/ytdl-org/youtube-dl/commit/dfbbe2902fc67f0f93ee47a8077c148055c67a9b

											
										
										
											2021-05-20 15:38:49 +00:00
+								                        },
-												[generic] Add support for Video.js embeds

											
										
										
											2017-09-27 17:29:42 +00:00
+								                    })
-												[generic] Extract subtitles from video.js (#3156)

Authored by: Lesmiscore 
											
										
										
											2022-03-23 06:28:53 +00:00
+								            # https://docs.videojs.com/player#addRemoteTextTrack
 								            # https://html.spec.whatwg.org/multipage/media.html#htmltrackelement
 								            for sub_match in re.finditer(rf'(?s){re.escape(varname)}' r'\.addRemoteTextTrack\(({.+?})\s*,\s*(?:true|false)\)', webpage):
 								                sub = self._parse_json(
 								                    sub_match.group(1), video_id, transform_source=js_to_json, fatal=False) or {}
-												[extractor/generic] Attempt to detect live HLS (#6775)

* Extract duration for non-live generic HLS videos
* Add extractor-arg `is_live` to bypass live HLS check

Closes #6705
Authored by: bashonly
											
										
										
											2023-04-13 19:36:06 +00:00
+								                sub_src = str_or_none(sub.get('src'))
 								                if not sub_src:
-												[generic] Extract subtitles from video.js (#3156)

Authored by: Lesmiscore 
											
										
										
											2022-03-23 06:28:53 +00:00
+								                    continue
 								                subtitles.setdefault(dict_get(sub, ('language', 'srclang')) or 'und', []).append({
-												[extractor/generic] Attempt to detect live HLS (#6775)

* Extract duration for non-live generic HLS videos
* Add extractor-arg `is_live` to bypass live HLS check

Closes #6705
Authored by: bashonly
											
										
										
											2023-04-13 19:36:06 +00:00
+								                    'url': urllib.parse.urljoin(url, sub_src),
-												[generic] Extract subtitles from video.js (#3156)

Authored by: Lesmiscore 
											
										
										
											2022-03-23 06:28:53 +00:00
+								                    'name': sub.get('label'),
 								                    'http_headers': {
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2022-10-09 10:39:36 +00:00
+								                        'Referer': actual_url,
-												[generic] Extract subtitles from video.js (#3156)

Authored by: Lesmiscore 
											
										
										
											2022-03-23 06:28:53 +00:00
+								                    },
 								                })
-												[generic] Extract previously missed subtitles (#515)

* [generic] Extract subtitles in cases missed previously
* [common] Detect discarded subtitles in SMIL manifests
* [generic] Extract everything in the SMIL manifest

Authored by: fstirlitz 
											
										
										
											2021-07-16 14:22:56 +00:00
+								            if formats or subtitles:
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											2021-11-09 22:49:33 +00:00
+								                self.report_detected('video.js embed')
-												[extractor/generic] Attempt to detect live HLS (#6775)

* Extract duration for non-live generic HLS videos
* Add extractor-arg `is_live` to bypass live HLS check

Closes #6705
Authored by: bashonly
											
										
										
											2023-04-13 19:36:06 +00:00
+								                info_dict = {'formats': formats, 'subtitles': subtitles}
 								                if formats:
 								                    self._extra_manifest_info(info_dict, src)
 								                return [info_dict]
-												[generic] Add support for Video.js embeds

											
										
										
											2017-09-27 17:29:42 +00:00
-												Update to ytdl-commit-195f22f6

[generic] Improve KVS (etc) extraction
https://github.com/ytdl-org/youtube-dl/commit/195f22f679330549882a8234e7234942893a4902

Closes #3716
Authored by: Grub4k, pukkandan
											
										
										
											2023-01-02 13:45:36 +00:00
+								        # Look for generic KVS player (before json-ld bc of some urls that break otherwise)
 								        found = self._search_regex((
-												[extractor/generic] Avoid catastrophic backtracking in KVS regex

Authored by: bashonly

											
										
										
											2023-01-29 06:59:37 +00:00
+								            r'<script\b[^>]+?\bsrc\s*=\s*(["\'])https?://(?:(?!\1)[^?#])+/kt_player\.js\?v=(?P<ver>\d+(?:\.\d+)+)\1[^>]*>',
 								            r'kt_player\s*\(\s*(["\'])(?:(?!\1)[\w\W])+\1\s*,\s*(["\'])https?://(?:(?!\2)[^?#])+/kt_player\.swf\?v=(?P<ver>\d+(?:\.\d+)+)\2\s*,',
-												Update to ytdl-commit-195f22f6

[generic] Improve KVS (etc) extraction
https://github.com/ytdl-org/youtube-dl/commit/195f22f679330549882a8234e7234942893a4902

Closes #3716
Authored by: Grub4k, pukkandan
											
										
										
											2023-01-02 13:45:36 +00:00
+								        ), webpage, 'KVS player', group='ver', default=False)
 								        if found:
-												[extractor/generic] Avoid catastrophic backtracking in KVS regex

Authored by: bashonly

											
										
										
											2023-01-29 06:59:37 +00:00
+								            self.report_detected('KVS Player')
-												Update to ytdl-commit-195f22f6

[generic] Improve KVS (etc) extraction
https://github.com/ytdl-org/youtube-dl/commit/195f22f679330549882a8234e7234942893a4902

Closes #3716
Authored by: Grub4k, pukkandan
											
										
										
											2023-01-02 13:45:36 +00:00
+								            if found.split('.')[0] not in ('4', '5', '6'):
 								                self.report_warning(f'Untested major version ({found}) in player engine - download may fail.')
 								            return [self._extract_kvs(url, webpage, video_id)]
-												[extractor/generic] Extract from LD-JSON last of all
Previous sources may contain several formats, e.g. http://tamasha.com/v/PgGZ

											
										
										
											2017-08-26 20:27:20 +00:00
+								        # Looking for http://schema.org/VideoObject
-												[generic] Detect more json_ld
Closes #1475

											
										
										
											2021-10-29 20:33:53 +00:00
+								        json_ld = self._search_json_ld(webpage, video_id, default={})
-												[generic] Allow further processing of json_ld URL
Closes #2578

											
										
										
											2022-02-02 01:58:01 +00:00
+								        if json_ld.get('url') not in (url, None):
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											2021-11-09 22:49:33 +00:00
+								            self.report_detected('JSON LD')
-												[extractor/generic] Fix JSON LD manifest extraction (#5577)

Closes #5572
Authored by: bashonly, pukkandan
											
										
										
											2022-11-18 02:04:03 +00:00
+								            is_direct = json_ld.get('ext') not in (None, *MEDIA_EXTENSIONS.manifests)
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2022-10-09 10:39:36 +00:00
+								            return [merge_dicts({
-												[extractor/generic] Fix JSON LD manifest extraction (#5577)

Closes #5572
Authored by: bashonly, pukkandan
											
										
										
											2022-11-18 02:04:03 +00:00
+								                '_type': 'video' if is_direct else 'url_transparent',
-												[extractor/generic] Pass through referer from json-ld

Closes #4941

											
										
										
											2022-09-16 17:35:49 +00:00
+								                'url': smuggle_url(json_ld['url'], {
 								                    'force_videoid': video_id,
 								                    'to_generic': True,
-												[ie] Do not smuggle `http_headers`

See: https://github.com/yt-dlp/yt-dlp/security/advisories/GHSA-3ch3-jhc6-5r8x

Authored by: coletdjnz

											
										
										
											2023-08-16 23:42:48 +00:00
+								                    'referer': url,
-												[extractor/generic] Pass through referer from json-ld

Closes #4941

											
										
										
											2022-09-16 17:35:49 +00:00
+								                }),
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2022-10-09 10:39:36 +00:00
+								            }, json_ld)]
-												[extractor/generic] Extract from LD-JSON last of all
Previous sources may contain several formats, e.g. http://tamasha.com/v/PgGZ

											
										
										
											2017-08-26 20:27:20 +00:00
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											2014-10-09 12:26:23 +00:00
+								        def check_video(vurl):
-												[generic] Add support for jwPlayer YouTube videos

This makes nationalarchives.gov.uk work (Fixes #4907, fixes #4876)

											
										
										
											2015-02-09 09:42:25 +00:00
+								            if YoutubeIE.suitable(vurl):
 								                return True
-												[extractor/generic] Improve rtmp support (closes #11993)

											
										
										
											2017-02-06 16:23:40 +00:00
+								            if RtmpIE.suitable(vurl):
 								                return True
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 10:54:43 +00:00
+								            vpath = urllib.parse.urlparse(vurl).path
-												[cleanup] Misc fixes

Closes https://github.com/yt-dlp/yt-dlp/pull/3213, Closes https://github.com/yt-dlp/yt-dlp/pull/3117

Related: https://github.com/yt-dlp/yt-dlp/issues/3146#issuecomment-1077323114, https://github.com/yt-dlp/yt-dlp/pull/3277#discussion_r841019671, https://github.com/yt-dlp/yt-dlp/commit/a825ffbffa0bea322e3ccb44c6f8e01d8d9572fb#commitcomment-68538986, https://github.com/yt-dlp/yt-dlp/issues/2360, https://github.com/yt-dlp/yt-dlp/commit/5fa3c9a88f597625296981a4a26be723e65d4842#r70393519, https://github.com/yt-dlp/yt-dlp/commit/5fa3c9a88f597625296981a4a26be723e65d4842#r70393254

											
										
										
											2022-03-27 02:20:43 +00:00
+								            vext = determine_ext(vpath, None)
 								            return vext not in (None, 'swf', 'png', 'jpg', 'srt', 'sbv', 'sub', 'vtt', 'ttml', 'js', 'xml')
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											2014-10-09 12:26:23 +00:00
 								        def filter_video(urls):
 								            """Return a list of the entries of `urls` that check_video accepts, in order."""
 								            return [candidate for candidate in urls if check_video(candidate)]
-												Move GenericIE into its own file

											
										
										
											2013-06-23 18:31:45 +00:00
+								        # Start with something easy: JW Player in SWFObject
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											2014-10-09 12:26:23 +00:00
+								        found = filter_video(re.findall(r'flashvars: [\'"](?:.*&)?file=(http[^\'"&]*)', webpage))
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											2021-11-09 22:49:33 +00:00
+								        if found:
 								            self.report_detected('JW Player in SFWObject')
 								        else:
-												[generic] Support gorillavid.in

Previously, we were a little bit over-eager and got a random swf file.
Fixes #2084.

											
										
										
											2014-01-05 04:34:06 +00:00
+								            # Look for gorilla-vid style embedding
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											2014-10-09 12:26:23 +00:00
+								            found = filter_video(re.findall(r'''(?sx)
-												[generic] Improve jwplayer detection (Fixes #2731)

											
										
										
											2014-04-21 14:16:53 +00:00
+								                (?:
 								                    jw_plugins|
 								                    JWPlayerOptions|
 								                    jwplayer\s*\(\s*["'][^'"]+["']\s*\)\s*\.setup
 								                )
-												[generic] Add support for jwPlayer YouTube videos

This makes nationalarchives.gov.uk work (Fixes #4907, fixes #4876)

											
										
										
											2015-02-09 09:42:25 +00:00
+								                .*?
 								                ['"]?file['"]?\s*:\s*["\'](.*?)["\']''', webpage))
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											2021-11-09 22:49:33 +00:00
+								            if found:
 								                self.report_detected('JW Player embed')
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											2014-04-30 00:23:51 +00:00
+								        if not found:
-												Move GenericIE into its own file

											
										
										
											2013-06-23 18:31:45 +00:00
+								            # Broaden the search a little bit
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											2014-10-09 12:26:23 +00:00
+								            found = filter_video(re.findall(r'[^A-Za-z0-9]?(?:file|source)=(http[^\'"&]*)', webpage))
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											2021-11-09 22:49:33 +00:00
+								            if found:
 								                self.report_detected('video file')
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											2014-04-30 00:23:51 +00:00
+								        if not found:
 								            # Broaden the findall a little bit: JWPlayer JS loader
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											2014-10-09 12:26:23 +00:00
+								            found = filter_video(re.findall(
-												[generic] Expand jwplayer support

											
										
										
											2015-08-05 15:19:52 +00:00
+								                r'[^A-Za-z0-9]?(?:file|video_url)["\']?:\s*["\'](http(?![^\'"]+\.[0-9]+[\'"])[^\'"]+)["\']', webpage))
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											2021-11-09 22:49:33 +00:00
+								            if found:
 								                self.report_detected('JW Player JS loader')
-												[generic] Automatic detection of flow player and age_limit (Fixes #3576)

											
										
										
											2014-08-24 03:31:32 +00:00
+								        if not found:
 								            # Flow player
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											2014-10-09 12:26:23 +00:00
+								            found = filter_video(re.findall(r'''(?xs)
-												[generic] Automatic detection of flow player and age_limit (Fixes #3576)

											
										
										
											2014-08-24 03:31:32 +00:00
+								                flowplayer\("[^"]+",\s*
 								                    \{[^}]+?\}\s*,
-												The opening curly brace `{` is a regex reserved [control character](http://stackoverflow.com/a/400316/1106367), so it needs to be escaped.

											
										
										
											2015-01-30 07:41:40 +00:00
+								                    \s*\{[^}]+? ["']?clip["']?\s*:\s*\{\s*
-												[generic] Automatic detection of flow player and age_limit (Fixes #3576)

											
										
										
											2014-08-24 03:31:32 +00:00
+								                        ["']?url["']?\s*:\s*["']([^"']+)["']
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											2014-10-09 12:26:23 +00:00
+								            ''', webpage))
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											2021-11-09 22:49:33 +00:00
+								            if found:
 								                self.report_detected('Flow Player')
-												[generic] Add support for Cinerama player (Fixes #4752)

											
										
										
											2015-01-23 11:00:25 +00:00
+								        if not found:
 								            # Cinerama player
 								            found = re.findall(
 								                r"cinerama\.embedPlayer\(\s*\'[^']+\',\s*'([^']+)'", webpage)
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											2021-11-09 22:49:33 +00:00
+								            if found:
 								                self.report_detected('Cinerama player')
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											2014-04-30 00:23:51 +00:00
+								        if not found:
-												Move GenericIE into its own file

											
										
										
											2013-06-23 18:31:45 +00:00
+								            # Try to find twitter cards info
-												[extractor/generic] Change twitter:player embeds priority to lowest (Closes #10090)

											
										
										
											2016-07-16 08:59:43 +00:00
+								            # twitter:player:stream should be checked before twitter:player since
 								            # it is expected to contain a raw stream (see
 								            # https://dev.twitter.com/cards/types/player#On_twitter.com_via_desktop_browser)
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											2014-10-09 12:26:23 +00:00
+								            found = filter_video(re.findall(
 								                r'<meta (?:property|name)="twitter:player:stream" (?:content|value)="(.+?)"', webpage))
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											2021-11-09 22:49:33 +00:00
+								            if found:
 								                self.report_detected('Twitter card')
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											2014-04-30 00:23:51 +00:00
+								        if not found:
-												Move GenericIE into its own file

											
										
										
											2013-06-23 18:31:45 +00:00
+								            # We look for Open Graph info:
-												[docs] Consistent use of `e.g.` (#4643)

Authored by: Lesmiscore
											
										
										
											2022-08-14 12:04:13 +00:00
+								            # We have to match any number of spaces between elements; some sites try to align them, e.g. statigr.am
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											2014-04-30 00:23:51 +00:00
+								            m_video_type = re.findall(r'<meta.*?property="og:video:type".*?content="video/(.*?)"', webpage)
-												Move GenericIE into its own file

											
										
										
											2013-06-23 18:31:45 +00:00
+								            # We only look in og:video if the MIME type is a video, don't try if it's a Flash player:
 								            if m_video_type is not None:
-												Update to ytdl-commit-dfbbe29

[redbulltv] fix embed data extraction
https://github.com/ytdl-org/youtube-dl/commit/dfbbe2902fc67f0f93ee47a8077c148055c67a9b

											
										
										
											2021-05-20 15:38:49 +00:00
+								                found = filter_video(re.findall(r'<meta.*?property="og:(?:video|audio)".*?content="(.*?)"', webpage))
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											2021-11-09 22:49:33 +00:00
+								                if found:
 								                    self.report_detected('Open Graph video info')
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											2014-04-30 00:23:51 +00:00
+								        if not found:
-												[generic] Generalize redirect regex

											
										
										
											2015-03-17 18:05:40 +00:00
+								            REDIRECT_REGEX = r'[0-9]{,2};\s*(?:URL|url)=\'?([^\'"]+)'
-												[generic] Fix redirect

											
										
										
											2014-05-16 13:32:53 +00:00
+								            found = re.search(
-												[generic] Add support for <meta redirect>

Fixes #413

											
										
										
											2014-02-27 06:21:59 +00:00
+								                r'(?i)<meta\s+(?=(?:[a-z-]+="[^"]+"\s+)*http-equiv="refresh")'
-												[generic] Generalize redirect regex

											
										
										
											2015-03-17 18:05:40 +00:00
+								                r'(?:[a-z-]+="[^"]+"\s+)*?content="%s' % REDIRECT_REGEX,
-												[generic] Add support for <meta redirect>

Fixes #413

											
										
										
											2014-02-27 06:21:59 +00:00
+								                webpage)
-												[generic] Follow redirects specified by `Refresh` HTTP header

											
										
										
											2015-03-17 17:51:40 +00:00
+								            if not found:
 								                # Look also in Refresh HTTP header
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2022-10-09 10:39:36 +00:00
+								                refresh_header = urlh and urlh.headers.get('Refresh')
-												[generic] Follow redirects specified by `Refresh` HTTP header

											
										
										
											2015-03-17 17:51:40 +00:00
+								                if refresh_header:
-												[generic] Generalize redirect regex

											
										
										
											2015-03-17 18:05:40 +00:00
+								                    found = re.search(REDIRECT_REGEX, refresh_header)
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											2014-04-30 00:23:51 +00:00
+								            if found:
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 10:54:43 +00:00
+								                new_url = urllib.parse.urljoin(url, unescapeHTML(found.group(1)))
-												[generic] Do not follow redirects to the same URL

											
										
										
											2017-03-23 17:45:24 +00:00
+								                if new_url != url:
 								                    self.report_following_redirect(new_url)
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2022-10-09 10:39:36 +00:00
+								                    return [self.url_result(new_url)]
-												[generic] Do not follow redirects to the same URL

											
										
										
											2017-03-23 17:45:24 +00:00
+								                else:
 								                    found = None
-												[extractor/generic] Change twitter:player embeds priority to lowest (Closes #10090)

											
										
										
											2016-07-16 08:59:43 +00:00
 								        if not found:
 								            # twitter:player is a https URL to iframe player that may or may not
-												Completely change project name to yt-dlp (#85)

* All modules and binary names are changed
* All documentation references changed
* yt-dlp no longer loads youtube-dlc config files
* All URLs changed to point to organization account

Co-authored-by: Pccode66
Co-authored-by: pukkandan
											
										
										
											2021-02-24 18:45:56 +00:00
+								            # be supported by yt-dlp thus this is checked the very last (see
-												[extractor/generic] Change twitter:player embeds priority to lowest (Closes #10090)

											
										
										
											2016-07-16 08:59:43 +00:00
+								            # https://dev.twitter.com/cards/types/player#On_twitter.com_via_desktop_browser)
 								            embed_url = self._html_search_meta('twitter:player', webpage, default=None)
-												[generic] Fix infinite recursion for twitter:player URLs (closes #14339)

											
										
										
											2017-09-26 14:47:18 +00:00
+								            if embed_url and embed_url != url:
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											2021-11-09 22:49:33 +00:00
+								                self.report_detected('twitter:player iframe')
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2022-10-09 10:39:36 +00:00
+								                return [self.url_result(embed_url)]
-												[extractor/generic] Change twitter:player embeds priority to lowest (Closes #10090)

											
										
										
											2016-07-16 08:59:43 +00:00
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											2014-04-30 00:23:51 +00:00
+								        if not found:
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2022-10-09 10:39:36 +00:00
+								            return []
 								        domain_name = self._search_regex(r'^(?:https?://)?([^/]*)/.*', url, 'video uploader', default=None)
-												Move GenericIE into its own file

											
										
										
											2013-06-23 18:31:45 +00:00
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											2014-04-30 00:23:51 +00:00
+								        entries = []
-												[genric] Eliminate duplicated video URLs (closes #6562)

											
										
										
											2016-05-22 14:22:27 +00:00
+								        for video_url in orderedSet(found):
-												[extractor/generic] Decode unicode-escaped embed URLs (#5919)

Authored by: bashonly
Closes #5854
											
										
										
											2023-01-02 14:06:01 +00:00
+								            video_url = video_url.encode().decode('unicode-escape')
-												[generic] Unescape the video URL

Fixes #9279

											
										
										
											2016-04-24 08:23:21 +00:00
+								            video_url = unescapeHTML(video_url)
-												[generic] Unescape URLs from JWPlayer (#7582)

											
										
										
											2015-11-21 06:12:34 +00:00
+								            video_url = video_url.replace('\\/', '/')
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 10:54:43 +00:00
+								            video_url = urllib.parse.urljoin(url, video_url)
 								            video_id = urllib.parse.unquote(os.path.basename(video_url))
-												Move GenericIE into its own file

											
										
										
											2013-06-23 18:31:45 +00:00
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											2014-04-30 00:23:51 +00:00
+								            # Sometimes, jwplayer extraction will result in a YouTube URL
 								            if YoutubeIE.suitable(video_url):
 								                entries.append(self.url_result(video_url, 'Youtube'))
 								                continue
-												Move GenericIE into its own file

											
										
										
											2013-06-23 18:31:45 +00:00
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											2014-04-30 00:23:51 +00:00
+								            video_id = os.path.splitext(video_id)[0]
-												[generic] Pass referer to extracted formats

Closes #2839

											
										
										
											2022-02-20 11:43:13 +00:00
+								            headers = {
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2022-10-09 10:39:36 +00:00
+								                'referer': actual_url
-												[generic] Pass referer to extracted formats

Closes #2839

											
										
										
											2022-02-20 11:43:13 +00:00
+								            }
-												[youtube] Support jwplayer with YouTube URLs (Closes #2075)

											
										
										
											2014-01-06 00:42:58 +00:00
-												[generic] Refactor

											
										
										
											2015-11-21 08:08:54 +00:00
+								            entry_info_dict = {
 								                'id': video_id,
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2022-08-01 01:23:25 +00:00
+								                'uploader': domain_name,
 								                'title': info_dict['title'],
 								                'age_limit': info_dict['age_limit'],
-												[generic] Pass referer to extracted formats

Closes #2839

											
										
										
											2022-02-20 11:43:13 +00:00
+								                'http_headers': headers,
-												[generic] Refactor

											
										
										
											2015-11-21 08:08:54 +00:00
+								            }
-												[extractor/generic] Add test for #11993 and more metadata for rtmp

											
										
										
											2017-02-06 16:31:58 +00:00
+								            if RtmpIE.suitable(video_url):
 								                entry_info_dict.update({
 								                    '_type': 'url_transparent',
 								                    'ie_key': RtmpIE.ie_key(),
 								                    'url': video_url,
 								                })
 								                entries.append(entry_info_dict)
 								                continue
-												[extractor/generic] Add support for xspf playlists

											
										
										
											2015-08-09 13:43:42 +00:00
+								            ext = determine_ext(video_url)
 								            if ext == 'smil':
-												[generic] Extract previously missed subtitles (#515)

* [generic] Extract subtitles in cases missed previously
* [common] Detect discarded subtitles in SMIL manifests
* [generic] Extract everything in the SMIL manifest

Authored by: fstirlitz 
											
										
										
											2021-07-16 14:22:56 +00:00
+								                entry_info_dict = {**self._extract_smil_info(video_url, video_id), **entry_info_dict}
-												[extractor/generic] Add support for xspf playlists

											
										
										
											2015-08-09 13:43:42 +00:00
+								            elif ext == 'xspf':
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2022-10-09 10:39:36 +00:00
+								                return [self._extract_xspf_playlist(video_url, video_id)]
-												[generic] Extract M3U8 formats (closes #7582)

											
										
										
											2015-11-21 08:43:01 +00:00
+								            elif ext == 'm3u8':
-												[generic] Pass referer to extracted formats

Closes #2839

											
										
										
											2022-02-20 11:43:13 +00:00
+								                entry_info_dict['formats'], entry_info_dict['subtitles'] = self._extract_m3u8_formats_and_subtitles(video_url, video_id, ext='mp4', headers=headers)
-												[extractor/generic] Add extractor-args `hls_key`, `variant_query` (#6567)

Authored by: bashonly
											
										
										
											2023-03-21 23:12:17 +00:00
+								                self._extra_manifest_info(entry_info_dict, video_url)
-												[extractor/generic] Detect DASH manifests in found URLs and extract mpd formats

											
										
										
											2016-02-06 13:42:03 +00:00
+								            elif ext == 'mpd':
-												[generic] Pass referer to extracted formats

Closes #2839

											
										
										
											2022-02-20 11:43:13 +00:00
+								                entry_info_dict['formats'], entry_info_dict['subtitles'] = self._extract_mpd_formats_and_subtitles(video_url, video_id, headers=headers)
-												[extractor/generic] Add extractor-args `hls_key`, `variant_query` (#6567)

Authored by: bashonly
											
										
										
											2023-03-21 23:12:17 +00:00
+								                self._extra_manifest_info(entry_info_dict, video_url)
-												[extractor/generic] Extract f4m formats from final URLs

											
										
										
											2016-03-12 21:38:20 +00:00
+								            elif ext == 'f4m':
-												[generic] Pass referer to extracted formats

Closes #2839

											
										
										
											2022-02-20 11:43:13 +00:00
+								                entry_info_dict['formats'] = self._extract_f4m_formats(video_url, video_id, headers=headers)
-												[extractor/generic] Skip URLs we came from when delegating ISM extraction

											
										
										
											2016-11-02 16:43:41 +00:00
+								            elif re.search(r'(?i)\.(?:ism|smil)/manifest', video_url) and video_url != url:
-												[extractor/generic] Improve ISM extraction

											
										
										
											2016-11-02 16:34:37 +00:00
+								                # Just matching .ism/manifest is not enough to be reliably sure
 								                # whether it's actually an ISM manifest or some other streaming
 								                # manifest since there are various streaming URL formats
 								                # possible (see [1]) as well as some other shenanigans like
 								                # .smil/manifest URLs that actually serve an ISM (see [2]) and
 								                # so on.
 								                # Thus the most reasonable way to solve this is to delegate
 								                # to generic extractor in order to look into the contents of
 								                # the manifest itself.
 								                # 1. https://azure.microsoft.com/en-us/documentation/articles/media-services-deliver-content-overview/#streaming-url-formats
 								                # 2. https://svs.itworkscdn.net/lbcivod/smil:itwfcdn/lbci/170976.smil/Manifest
 								                entry_info_dict = self.url_result(
 								                    smuggle_url(video_url, {'to_generic': True}),
 								                    GenericIE.ie_key())
-												[generic] Extract videos from SMIL manifests (closes #5145 and fixes #5135)

											
										
										
											2015-04-16 09:16:11 +00:00
+								            else:
-												[generic] Refactor

											
										
										
											2015-11-21 08:08:54 +00:00
+								                entry_info_dict['url'] = video_url
 								            entries.append(entry_info_dict)
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											2014-04-30 00:23:51 +00:00
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2022-10-09 10:39:36 +00:00
+								        if len(entries) > 1:
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											2014-04-30 00:23:51 +00:00
+								            for num, e in enumerate(entries, start=1):
-												[generic] Don't set the 'title' if it's not defined in the entry (closes #5061)

Some of them may be an 'url' result, which in general don't have the 'title' field.

											
										
										
											2015-02-25 16:56:51 +00:00
+								                # 'url' results don't have a title
 								                if e.get('title') is not None:
 								                    e['title'] = '%s (%d)' % (e['title'], num)
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2022-10-09 10:39:36 +00:00
+								        return entries