# yt-dlc/youtube_dl/extractor/generic.py

# coding: utf-8

from __future__ import unicode_literals

import os
import re
import sys

from .common import InfoExtractor
from .youtube import YoutubeIE
from ..compat import (
    compat_etree_fromstring,
    compat_str,
    compat_urllib_parse_unquote,
    compat_urlparse,
    compat_xml_parse_error,
)
from ..utils import (
    determine_ext,
    ExtractorError,
    float_or_none,
    HEADRequest,
    is_html,
    js_to_json,
    KNOWN_EXTENSIONS,
    merge_dicts,
    mimetype2ext,
    orderedSet,
    sanitized_Request,
    smuggle_url,
    unescapeHTML,
    unified_strdate,
    unsmuggle_url,
    UnsupportedError,
    xpath_text,
)
from .commonprotocols import RtmpIE
from .brightcove import (
    BrightcoveLegacyIE,
    BrightcoveNewIE,
)
from .nexx import (
    NexxIE,
    NexxEmbedIE,
)
from .nbc import NBCSportsVPlayerIE
from .ooyala import OoyalaIE
from .rutv import RUTVIE
from .tvc import TVCIE
from .sportbox import SportBoxEmbedIE
from .smotri import SmotriIE
from .myvi import MyviIE
from .condenast import CondeNastIE
from .udn import UDNEmbedIE
from .senateisvp import SenateISVPIE
from .svt import SVTIE
from .pornhub import PornHubIE
from .xhamster import XHamsterEmbedIE
from .tnaflix import TNAFlixNetworkEmbedIE
from .drtuber import DrTuberIE
from .redtube import RedTubeIE
from .tube8 import Tube8IE
from .vimeo import VimeoIE
from .dailymotion import DailymotionIE
from .dailymail import DailyMailIE
from .onionstudios import OnionStudiosIE
from .viewlift import ViewLiftEmbedIE
from .mtv import MTVServicesEmbeddedIE
from .pladform import PladformIE
from .videomore import VideomoreIE
from .webcaster import WebcasterFeedIE
from .googledrive import GoogleDriveIE
from .jwplatform import JWPlatformIE
from .digiteka import DigitekaIE
from .arkena import ArkenaIE
from .instagram import InstagramIE
from .liveleak import LiveLeakIE
from .threeqsdn import ThreeQSDNIE
from .theplatform import ThePlatformIE
from .vessel import VesselIE
from .kaltura import KalturaIE
from .eagleplatform import EaglePlatformIE
from .facebook import FacebookIE
from .soundcloud import SoundcloudIE
from .tunein import TuneInBaseIE
from .vbox7 import Vbox7IE
from .dbtv import DBTVIE
from .piksel import PikselIE
from .videa import VideaIE
from .twentymin import TwentyMinutenIE
from .ustream import UstreamIE
from .openload import OpenloadIE
from .videopress import VideoPressIE
from .rutube import RutubeIE
from .limelight import LimelightBaseIE
from .anvato import AnvatoIE
from .washingtonpost import WashingtonPostIE
from .wistia import WistiaIE
from .mediaset import MediasetIE
from .joj import JojIE
from .megaphone import MegaphoneIE
from .vzaar import VzaarIE
from .channel9 import Channel9IE
from .vshare import VShareIE
from .mediasite import MediasiteIE
from .springboardplatform import SpringboardPlatformIE
from .yapfiles import YapFilesIE
from .vice import ViceIE
from .xfileshare import XFileShareIE
from .cloudflarestream import CloudflareStreamIE
from .peertube import PeerTubeIE
from .indavideo import IndavideoEmbedIE
from .apa import APAIE
from .foxnews import FoxNewsIE
from .viqeo import ViqeoIE
from .expressen import ExpressenIE


class GenericIE(InfoExtractor):
    IE_DESC = 'Generic downloader that works on some sites'
    _VALID_URL = r'.*'
    IE_NAME = 'generic'
    _TESTS = [
        # Direct link to a video
        {
            'url': 'http://media.w3.org/2010/05/sintel/trailer.mp4',
            'md5': '67d406c2bcb6af27fa886f31aa934bbe',
            'info_dict': {
                'id': 'trailer',
                'ext': 'mp4',
                'title': 'trailer',
                'upload_date': '20100513',
            }
        },
        # Direct link to media delivered compressed (until Accept-Encoding is *)
        {
            'url': 'http://calimero.tk/muzik/FictionJunction-Parallel_Hearts.flac',
            'md5': '128c42e68b13950268b648275386fc74',
            'info_dict': {
                'id': 'FictionJunction-Parallel_Hearts',
                'ext': 'flac',
                'title': 'FictionJunction-Parallel_Hearts',
                'upload_date': '20140522',
            },
            'expected_warnings': [
                'URL could be a direct video link, returning it as such.'
            ],
            'skip': 'URL invalid',
        },
        # Direct download with broken HEAD
        {
            'url': 'http://ai-radio.org:8000/radio.opus',
            'info_dict': {
                'id': 'radio',
                'ext': 'opus',
                'title': 'radio',
            },
            'params': {
                'skip_download': True,  # infinite live stream
            },
            'expected_warnings': [
                r'501.*Not Implemented',
                r'400.*Bad Request',
            ],
        },
        # Direct link with incorrect MIME type
        {
            'url': 'http://ftp.nluug.nl/video/nluug/2014-11-20_nj14/zaal-2/5_Lennart_Poettering_-_Systemd.webm',
            'md5': '4ccbebe5f36706d85221f204d7eb5913',
            'info_dict': {
                'url': 'http://ftp.nluug.nl/video/nluug/2014-11-20_nj14/zaal-2/5_Lennart_Poettering_-_Systemd.webm',
                'id': '5_Lennart_Poettering_-_Systemd',
                'ext': 'webm',
                'title': '5_Lennart_Poettering_-_Systemd',
                'upload_date': '20141120',
            },
            'expected_warnings': [
                'URL could be a direct video link, returning it as such.'
            ]
        },
        # RSS feed
        {
            'url': 'http://phihag.de/2014/youtube-dl/rss2.xml',
            'info_dict': {
                'id': 'http://phihag.de/2014/youtube-dl/rss2.xml',
                'title': 'Zero Punctuation',
                'description': 're:.*groundbreaking video review series.*'
            },
            'playlist_mincount': 11,
        },
        # RSS feed with enclosure
        {
            'url': 'http://podcastfeeds.nbcnews.com/audio/podcast/MSNBC-MADDOW-NETCAST-M4V.xml',
            'info_dict': {
                'id': 'pdv_maddow_netcast_m4v-02-27-2015-201624',
                'ext': 'm4v',
                'upload_date': '20150228',
                'title': 'pdv_maddow_netcast_m4v-02-27-2015-201624',
            }
        },
        # RSS feed with enclosures and unsupported link URLs
        {
            'url': 'http://www.hellointernet.fm/podcast?format=rss',
            'info_dict': {
                'id': 'http://www.hellointernet.fm/podcast?format=rss',
                'description': 'CGP Grey and Brady Haran talk about YouTube, life, work, whatever.',
                'title': 'Hello Internet',
            },
            'playlist_mincount': 100,
        },
        # SMIL from http://videolectures.net/promogram_igor_mekjavic_eng
        {
            'url': 'http://videolectures.net/promogram_igor_mekjavic_eng/video/1/smil.xml',
            'info_dict': {
                'id': 'smil',
                'ext': 'mp4',
                'title': 'Automatics, robotics and biocybernetics',
                'description': 'md5:815fc1deb6b3a2bff99de2d5325be482',
                'upload_date': '20130627',
                'formats': 'mincount:16',
                'subtitles': 'mincount:1',
            },
            'params': {
                'force_generic_extractor': True,
                'skip_download': True,
            },
        },
        # SMIL from http://www1.wdr.de/mediathek/video/livestream/index.html
        {
            'url': 'http://metafilegenerator.de/WDR/WDR_FS/hds/hds.smil',
            'info_dict': {
                'id': 'hds',
                'ext': 'flv',
                'title': 'hds',
                'formats': 'mincount:1',
            },
            'params': {
                'skip_download': True,
            },
        },
        # SMIL from https://www.restudy.dk/video/play/id/1637
        {
            'url': 'https://www.restudy.dk/awsmedia/SmilDirectory/video_1637.xml',
            'info_dict': {
                'id': 'video_1637',
                'ext': 'flv',
                'title': 'video_1637',
                'formats': 'mincount:3',
            },
            'params': {
                'skip_download': True,
            },
        },
        # SMIL from http://adventure.howstuffworks.com/5266-cool-jobs-iditarod-musher-video.htm
        {
            'url': 'http://services.media.howstuffworks.com/videos/450221/smil-service.smil',
            'info_dict': {
                'id': 'smil-service',
                'ext': 'flv',
                'title': 'smil-service',
                'formats': 'mincount:1',
            },
            'params': {
                'skip_download': True,
            },
        },
        # SMIL from http://new.livestream.com/CoheedandCambria/WebsterHall/videos/4719370
        {
            'url': 'http://api.new.livestream.com/accounts/1570303/events/1585861/videos/4719370.smil',
            'info_dict': {
                'id': '4719370',
                'ext': 'mp4',
                'title': '571de1fd-47bc-48db-abf9-238872a58d1f',
                'formats': 'mincount:3',
            },
            'params': {
                'skip_download': True,
            },
        },
        # XSPF playlist from http://www.telegraaf.nl/tv/nieuws/binnenland/24353229/__Tikibad_ontruimd_wegens_brand__.html
        {
            'url': 'http://www.telegraaf.nl/xml/playlist/2015/8/7/mZlp2ctYIUEB.xspf',
            'info_dict': {
                'id': 'mZlp2ctYIUEB',
                'ext': 'mp4',
                'title': 'Tikibad ontruimd wegens brand',
                'description': 'md5:05ca046ff47b931f9b04855015e163a4',
                'thumbnail': r're:^https?://.*\.jpg$',
                'duration': 33,
            },
            'params': {
                'skip_download': True,
            },
        },
        # MPD from http://dash-mse-test.appspot.com/media.html
        {
            'url': 'http://yt-dash-mse-test.commondatastorage.googleapis.com/media/car-20120827-manifest.mpd',
            'md5': '4b57baab2e30d6eb3a6a09f0ba57ef53',
            'info_dict': {
                'id': 'car-20120827-manifest',
                'ext': 'mp4',
                'title': 'car-20120827-manifest',
                'formats': 'mincount:9',
                'upload_date': '20130904',
            },
            'params': {
                'format': 'bestvideo',
            },
        },
        # m3u8 served with Content-Type: audio/x-mpegURL; charset=utf-8
        {
            'url': 'http://once.unicornmedia.com/now/master/playlist/bb0b18ba-64f5-4b1b-a29f-0ac252f06b68/77a785f3-5188-4806-b788-0893a61634ed/93677179-2d99-4ef4-9e17-fe70d49abfbf/content.m3u8',
            'info_dict': {
                'id': 'content',
                'ext': 'mp4',
                'title': 'content',
                'formats': 'mincount:8',
            },
            'params': {
                # m3u8 downloads
                'skip_download': True,
            },
            'skip': 'video gone',
        },
        # m3u8 served with Content-Type: text/plain
        {
            'url': 'http://www.nacentapps.com/m3u8/index.m3u8',
            'info_dict': {
                'id': 'index',
                'ext': 'mp4',
                'title': 'index',
                'upload_date': '20140720',
                'formats': 'mincount:11',
            },
            'params': {
                # m3u8 downloads
                'skip_download': True,
            },
            'skip': 'video gone',
        },
        # google redirect
        {
            'url': 'http://www.google.com/url?sa=t&rct=j&q=&esrc=s&source=web&cd=1&cad=rja&ved=0CCUQtwIwAA&url=http%3A%2F%2Fwww.youtube.com%2Fwatch%3Fv%3DcmQHVoWB5FY&ei=F-sNU-LLCaXk4QT52ICQBQ&usg=AFQjCNEw4hL29zgOohLXvpJ-Bdh2bils1Q&bvm=bv.61965928,d.bGE',
            'info_dict': {
                'id': 'cmQHVoWB5FY',
                'ext': 'mp4',
                'upload_date': '20130224',
                'uploader_id': 'TheVerge',
                'description': r're:^Chris Ziegler takes a look at the\.*',
                'uploader': 'The Verge',
                'title': 'First Firefox OS phones side-by-side',
            },
            'params': {
                'skip_download': False,
            }
        },
        {
            # redirect in Refresh HTTP header
            'url': 'https://www.facebook.com/l.php?u=https%3A%2F%2Fwww.youtube.com%2Fwatch%3Fv%3DpO8h3EaFRdo&h=TAQHsoToz&enc=AZN16h-b6o4Zq9pZkCCdOLNKMN96BbGMNtcFwHSaazus4JHT_MFYkAA-WARTX2kvsCIdlAIyHZjl6d33ILIJU7Jzwk_K3mcenAXoAzBNoZDI_Q7EXGDJnIhrGkLXo_LJ_pAa2Jzbx17UHMd3jAs--6j2zaeto5w9RTn8T_1kKg3fdC5WPX9Dbb18vzH7YFX0eSJmoa6SP114rvlkw6pkS1-T&s=1',
            'info_dict': {
                'id': 'pO8h3EaFRdo',
                'ext': 'mp4',
                'title': 'Tripeo Boiler Room x Dekmantel Festival DJ Set',
                'description': 'md5:6294cc1af09c4049e0652b51a2df10d5',
                'upload_date': '20150917',
                'uploader_id': 'brtvofficial',
                'uploader': 'Boiler Room',
            },
            'params': {
                'skip_download': False,
            },
        },
        {
            'url': 'http://www.hodiho.fr/2013/02/regis-plante-sa-jeep.html',
            'md5': '85b90ccc9d73b4acd9138d3af4c27f89',
            'info_dict': {
                'id': '13601338388002',
                'ext': 'mp4',
                'uploader': 'www.hodiho.fr',
                'title': 'R\u00e9gis plante sa Jeep',
            }
        },
        # bandcamp page with custom domain
        {
            'add_ie': ['Bandcamp'],
            'url': 'http://bronyrock.com/track/the-pony-mash',
            'info_dict': {
                'id': '3235767654',
                'ext': 'mp3',
                'title': 'The Pony Mash',
                'uploader': 'M_Pallante',
            },
            'skip': 'There is a limit of 200 free downloads / month for the test song',
        },
        {
            # embedded brightcove video
            # it also tests brightcove videos that need to set the 'Referer'
            # in the http requests
            'add_ie': ['BrightcoveLegacy'],
            'url': 'http://www.bfmtv.com/video/bfmbusiness/cours-bourse/cours-bourse-l-analyse-technique-154522/',
            'info_dict': {
                'id': '2765128793001',
                'ext': 'mp4',
                'title': 'Le cours de bourse : l’analyse technique',
                'description': 'md5:7e9ad046e968cb2d1114004aba466fd9',
                'uploader': 'BFM BUSINESS',
            },
            'params': {
                'skip_download': True,
            },
        },
        {
            # embedded with itemprop embedURL and video id spelled as `idVideo`
            'add_id': ['BrightcoveLegacy'],
            'url': 'http://bfmbusiness.bfmtv.com/mediaplayer/chroniques/olivier-delamarche/',
            'info_dict': {
                'id': '5255628253001',
                'ext': 'mp4',
                'title': 'md5:37c519b1128915607601e75a87995fc0',
                'description': 'md5:37f7f888b434bb8f8cc8dbd4f7a4cf26',
                'uploader': 'BFM BUSINESS',
                'uploader_id': '876450612001',
                'timestamp': 1482255315,
                'upload_date': '20161220',
            },
            'params': {
                'skip_download': True,
            },
        },
        {
            # https://github.com/rg3/youtube-dl/issues/2253
            'url': 'http://bcove.me/i6nfkrc3',
            'md5': '0ba9446db037002366bab3b3eb30c88c',
            'info_dict': {
                'id': '3101154703001',
                'ext': 'mp4',
                'title': 'Still no power',
                'uploader': 'thestar.com',
                'description': 'Mississauga resident David Farmer is still out of power as a result of the ice storm a month ago. To keep the house warm, Farmer cuts wood from his property for a wood burning stove downstairs.',
            },
            'add_ie': ['BrightcoveLegacy'],
            'skip': 'video gone',
        },
        {
            'url': 'http://www.championat.com/video/football/v/87/87499.html',
            'md5': 'fb973ecf6e4a78a67453647444222983',
            'info_dict': {
                'id': '3414141473001',
                'ext': 'mp4',
                'title': 'Видео. Удаление Дзагоева (ЦСКА)',
                'description': 'Онлайн-трансляция матча ЦСКА - "Волга"',
                'uploader': 'Championat',
            },
        },
        {
            # https://github.com/rg3/youtube-dl/issues/3541
            'add_ie': ['BrightcoveLegacy'],
            'url': 'http://www.kijk.nl/sbs6/leermijvrouwenkennen/videos/jqMiXKAYan2S/aflevering-1',
            'info_dict': {
                'id': '3866516442001',
                'ext': 'mp4',
                'title': 'Leer mij vrouwen kennen: Aflevering 1',
                'description': 'Leer mij vrouwen kennen: Aflevering 1',
                'uploader': 'SBS Broadcasting',
            },
            'skip': 'Restricted to Netherlands',
            'params': {
                'skip_download': True,  # m3u8 download
            },
        },
        {
            # Brightcove video in <iframe>
            'url': 'http://www.un.org/chinese/News/story.asp?NewsID=27724',
            'md5': '36d74ef5e37c8b4a2ce92880d208b968',
            'info_dict': {
                'id': '5360463607001',
                'ext': 'mp4',
                'title': '叙利亚失明儿童在废墟上演唱《心跳》  呼吁获得正常童年生活',
                'description': '联合国儿童基金会中东和北非区域大使、作曲家扎德·迪拉尼（Zade Dirani）在3月15日叙利亚冲突爆发7周年纪念日之际发布了为叙利亚谱写的歌曲《心跳》（HEARTBEAT），为受到六年冲突影响的叙利亚儿童发出强烈呐喊，呼吁世界做出共同努力，使叙利亚儿童重新获得享有正常童年生活的权利。',
                'uploader': 'United Nations',
                'uploader_id': '1362235914001',
                'timestamp': 1489593889,
                'upload_date': '20170315',
            },
            'add_ie': ['BrightcoveLegacy'],
        },
        {
            # Brightcove with alternative playerID key
            'url': 'http://www.nature.com/nmeth/journal/v9/n7/fig_tab/nmeth.2062_SV1.html',
            'info_dict': {
                'id': 'nmeth.2062_SV1',
                'title': 'Simultaneous multiview imaging of the Drosophila syncytial blastoderm : Quantitative high-speed imaging of entire developing embryos with simultaneous multiview light-sheet microscopy : Nature Methods : Nature Research',
            },
            'playlist': [{
                'info_dict': {
                    'id': '2228375078001',
                    'ext': 'mp4',
                    'title': 'nmeth.2062-sv1',
                    'description': 'nmeth.2062-sv1',
                    'timestamp': 1363357591,
                    'upload_date': '20130315',
                    'uploader': 'Nature Publishing Group',
                    'uploader_id': '1964492299001',
                },
            }],
        },
        {
            # Brightcove with UUID in videoPlayer
            'url': 'http://www8.hp.com/cn/zh/home.html',
            'info_dict': {
                'id': '5255815316001',
                'ext': 'mp4',
                'title': 'Sprocket Video - China',
                'description': 'Sprocket Video - China',
                'uploader': 'HP-Video Gallery',
                'timestamp': 1482263210,
                'upload_date': '20161220',
                'uploader_id': '1107601872001',
            },
            'params': {
                'skip_download': True,  # m3u8 download
            },
            'skip': 'video rotates...weekly?',
        },
        {
            # Brightcove:new type [2].
            'url': 'http://www.delawaresportszone.com/video-st-thomas-more-earns-first-trip-to-basketball-semis',
            'md5': '2b35148fcf48da41c9fb4591650784f3',
            'info_dict': {
                'id': '5348741021001',
                'ext': 'mp4',
                'upload_date': '20170306',
                'uploader_id': '4191638492001',
                'timestamp': 1488769918,
                'title': 'VIDEO:  St. Thomas More earns first trip to basketball semis',

            },
        },
        {
            # Alternative brightcove <video> attributes
            'url': 'http://www.programme-tv.net/videos/extraits/81095-guillaume-canet-evoque-les-rumeurs-d-infidelite-de-marion-cotillard-avec-brad-pitt-dans-vivement-dimanche/',
            'info_dict': {
                'id': '81095-guillaume-canet-evoque-les-rumeurs-d-infidelite-de-marion-cotillard-avec-brad-pitt-dans-vivement-dimanche',
                'title': "Guillaume Canet évoque les rumeurs d'infidélité de Marion Cotillard avec Brad Pitt dans Vivement Dimanche, Extraits : toutes les vidéos avec Télé-Loisirs",
            },
            'playlist': [{
                'md5': '732d22ba3d33f2f3fc253c39f8f36523',
                'info_dict': {
                    'id': '5311302538001',
                    'ext': 'mp4',
                    'title': "Guillaume Canet évoque les rumeurs d'infidélité de Marion Cotillard avec Brad Pitt dans Vivement Dimanche",
                    'description': "Guillaume Canet évoque les rumeurs d'infidélité de Marion Cotillard avec Brad Pitt dans Vivement Dimanche (France 2, 5 février 2017)",
                    'timestamp': 1486321708,
                    'upload_date': '20170205',
                    'uploader_id': '800000640001',
                },
                'only_matching': True,
            }],
        },
        {
            # Brightcove with UUID in videoPlayer
            'url': 'http://www8.hp.com/cn/zh/home.html',
            'info_dict': {
                'id': '5255815316001',
                'ext': 'mp4',
                'title': 'Sprocket Video - China',
                'description': 'Sprocket Video - China',
                'uploader': 'HP-Video Gallery',
                'timestamp': 1482263210,
                'upload_date': '20161220',
                'uploader_id': '1107601872001',
            },
            'params': {
                'skip_download': True,  # m3u8 download
            },
        },
        # ooyala video
        {
            'url': 'http://www.rollingstone.com/music/videos/norwegian-dj-cashmere-cat-goes-spartan-on-with-me-premiere-20131219',
            'md5': '166dd577b433b4d4ebfee10b0824d8ff',
            'info_dict': {
                'id': 'BwY2RxaTrTkslxOfcan0UCf0YqyvWysJ',
                'ext': 'mp4',
                'title': '2cc213299525360.mov',  # that's what we get
                'duration': 238.231,
            },
            'add_ie': ['Ooyala'],
        },
        {
            # ooyala video embedded with http://player.ooyala.com/iframe.js
            'url': 'http://www.macrumors.com/2015/07/24/steve-jobs-the-man-in-the-machine-first-trailer/',
            'info_dict': {
                'id': 'p0MGJndjoG5SOKqO_hZJuZFPB-Tr5VgB',
                'ext': 'mp4',
                'title': '"Steve Jobs: Man in the Machine" trailer',
                'description': 'The first trailer for the Alex Gibney documentary "Steve Jobs: Man in the Machine."',
                'duration': 135.427,
            },
            'params': {
                'skip_download': True,
            },
            'skip': 'movie expired',
        },
        # ooyala video embedded with http://player.ooyala.com/static/v4/production/latest/core.min.js
        {
            'url': 'http://wnep.com/2017/07/22/steampunk-fest-comes-to-honesdale/',
            'info_dict': {
                'id': 'lwYWYxYzE6V5uJMjNGyKtwwiw9ZJD7t2',
                'ext': 'mp4',
                'title': 'Steampunk Fest Comes to Honesdale',
                'duration': 43.276,
            },
            'params': {
                'skip_download': True,
            }
        },
        # embed.ly video
        {
            'url': 'http://www.tested.com/science/weird/460206-tested-grinding-coffee-2000-frames-second/',
            'info_dict': {
                'id': '9ODmcdjQcHQ',
                'ext': 'mp4',
                'title': 'Tested: Grinding Coffee at 2000 Frames Per Second',
                'upload_date': '20140225',
                'description': 'md5:06a40fbf30b220468f1e0957c0f558ff',
                'uploader': 'Tested',
                'uploader_id': 'testedcom',
            },
            # No need to test YoutubeIE here
            'params': {
                'skip_download': True,
            },
        },
        # funnyordie embed
        {
            'url': 'http://www.theguardian.com/world/2014/mar/11/obama-zach-galifianakis-between-two-ferns',
            'info_dict': {
                'id': '18e820ec3f',
                'ext': 'mp4',
                'title': 'Between Two Ferns with Zach Galifianakis: President Barack Obama',
                'description': 'Episode 18: President Barack Obama sits down with Zach Galifianakis for his most memorable interview yet.',
            },
            # HEAD requests lead to endless 301, while GET is OK
            'expected_warnings': ['301'],
        },
        # RUTV embed
        {
            'url': 'http://www.rg.ru/2014/03/15/reg-dfo/anklav-anons.html',
            'info_dict': {
                'id': '776940',
                'ext': 'mp4',
                'title': 'Охотское море стало целиком российским',
                'description': 'md5:5ed62483b14663e2a95ebbe115eb8f43',
            },
            'params': {
                # m3u8 download
                'skip_download': True,
            },
        },
        # TVC embed
        {
            'url': 'http://sch1298sz.mskobr.ru/dou_edu/karamel_ki/filial_galleries/video/iframe_src_http_tvc_ru_video_iframe_id_55304_isplay_false_acc_video_id_channel_brand_id_11_show_episodes_episode_id_32307_frameb/',
            'info_dict': {
                'id': '55304',
                'ext': 'mp4',
                'title': 'Дошкольное воспитание',
            },
        },
        # SportBox embed
        {
            'url': 'http://www.vestifinance.ru/articles/25753',
            'info_dict': {
                'id': '25753',
                'title': 'Прямые трансляции с Форума-выставки "Госзаказ-2013"',
            },
            'playlist': [{
                'info_dict': {
                    'id': '370908',
                    'title': 'Госзаказ. День 3',
                    'ext': 'mp4',
                }
            }, {
                'info_dict': {
                    'id': '370905',
                    'title': 'Госзаказ. День 2',
                    'ext': 'mp4',
                }
            }, {
                'info_dict': {
                    'id': '370902',
                    'title': 'Госзаказ. День 1',
                    'ext': 'mp4',
                }
            }],
            'params': {
                # m3u8 download
                'skip_download': True,
            },
        },
        # Myvi.ru embed
        {
            'url': 'http://www.kinomyvi.tv/news/detail/Pervij-dublirovannij-trejler--Uzhastikov-_nOw1',
            'info_dict': {
                'id': 'f4dafcad-ff21-423d-89b5-146cfd89fa1e',
                'ext': 'mp4',
                'title': 'Ужастики, русский трейлер (2015)',
                'thumbnail': r're:^https?://.*\.jpg$',
                'duration': 153,
            }
        },
        # XHamster embed
        {
            'url': 'http://www.numisc.com/forum/showthread.php?11696-FM15-which-pumiscer-was-this-%28-vid-%29-%28-alfa-as-fuck-srx-%29&s=711f5db534502e22260dec8c5e2d66d8',
            'info_dict': {
                'id': 'showthread',
                'title': '[NSFL] [FM15] which pumiscer was this ( vid ) ( alfa as fuck srx )',
            },
            'playlist_mincount': 7,
            # This forum no longer allows <iframe> markup;
            # HTML tags are now displayed as-is
            'skip': 'No videos on this page',
        },
        # Embedded TED video
        {
            'url': 'http://en.support.wordpress.com/videos/ted-talks/',
            'md5': '65fdff94098e4a607385a60c5177c638',
            'info_dict': {
                'id': '1969',
                'ext': 'mp4',
                'title': 'Hidden miracles of the natural world',
                'uploader': 'Louie Schwartzberg',
                'description': 'md5:8145d19d320ff3e52f28401f4c4283b9',
            }
        },
        # nowvideo embed hidden behind percent encoding
        {
            'url': 'http://www.waoanime.tv/the-super-dimension-fortress-macross-episode-1/',
            'md5': '2baf4ddd70f697d94b1c18cf796d5107',
            'info_dict': {
                'id': '06e53103ca9aa',
                'ext': 'flv',
                'title': 'Macross Episode 001  Watch Macross Episode 001 onl',
                'description': 'No description',
            },
        },
        # arte embed
        {
            'url': 'http://www.tv-replay.fr/redirection/20-03-14/x-enius-arte-10753389.html',
            'md5': '7653032cbb25bf6c80d80f217055fa43',
            'info_dict': {
                'id': '048195-004_PLUS7-F',
                'ext': 'flv',
                'title': 'X:enius',
                'description': 'md5:d5fdf32ef6613cdbfd516ae658abf168',
                'upload_date': '20140320',
            },
            'params': {
                'skip_download': 'Requires rtmpdump'
            },
            'skip': 'video gone',
        },
        # francetv embed
        {
            'url': 'http://www.tsprod.com/replay-du-concert-alcaline-de-calogero',
            'info_dict': {
                'id': 'EV_30231',
                'ext': 'mp4',
                'title': 'Alcaline, le concert avec Calogero',
                'description': 'md5:61f08036dcc8f47e9cfc33aed08ffaff',
                'upload_date': '20150226',
                'timestamp': 1424989860,
                'duration': 5400,
            },
            'params': {
                # m3u8 downloads
                'skip_download': True,
            },
            'expected_warnings': [
                'Forbidden'
            ]
        },
        # Condé Nast embed
        {
            'url': 'http://www.wired.com/2014/04/honda-asimo/',
            'md5': 'ba0dfe966fa007657bd1443ee672db0f',
            'info_dict': {
                'id': '53501be369702d3275860000',
                'ext': 'mp4',
                'title': 'Honda’s  New Asimo Robot Is More Human Than Ever',
            }
        },
        # Dailymotion embed
        {
            'url': 'http://www.spi0n.com/zap-spi0n-com-n216/',
            'md5': '441aeeb82eb72c422c7f14ec533999cd',
            'info_dict': {
                'id': 'k2mm4bCdJ6CQ2i7c8o2',
                'ext': 'mp4',
                'title': 'Le Zap de Spi0n n°216 - Zapping du Web',
                'description': 'md5:faf028e48a461b8b7fad38f1e104b119',
                'uploader': 'Spi0n',
                'uploader_id': 'xgditw',
                'upload_date': '20140425',
                'timestamp': 1398441542,
            },
            'add_ie': ['Dailymotion'],
        },
        # DailyMail embed
        {
            'url': 'http://www.bumm.sk/krimi/2017/07/05/biztonsagi-kamera-buktatta-le-az-agg-ferfit-utlegelo-apolot',
            'info_dict': {
                'id': '1495629',
                'ext': 'mp4',
                'title': 'Care worker punches elderly dementia patient in head 11 times',
                'description': 'md5:3a743dee84e57e48ec68bf67113199a5',
            },
            'add_ie': ['DailyMail'],
            'params': {
                'skip_download': True,
            },
        },
        # YouTube embed
        {
            'url': 'http://www.badzine.de/ansicht/datum/2014/06/09/so-funktioniert-die-neue-englische-badminton-liga.html',
            'info_dict': {
                'id': 'FXRb4ykk4S0',
                'ext': 'mp4',
                'title': 'The NBL Auction 2014',
                'uploader': 'BADMINTON England',
                'uploader_id': 'BADMINTONEvents',
                'upload_date': '20140603',
                'description': 'md5:9ef128a69f1e262a700ed83edb163a73',
            },
            'add_ie': ['Youtube'],
            'params': {
                'skip_download': True,
            }
        },
        # MTVServices embed
        {
            'url': 'http://www.vulture.com/2016/06/new-key-peele-sketches-released.html',
            'md5': 'ca1aef97695ef2c1d6973256a57e5252',
            'info_dict': {
                'id': '769f7ec0-0692-4d62-9b45-0d88074bffc1',
                'ext': 'mp4',
                'title': 'Key and Peele|October 10, 2012|2|203|Liam Neesons - Uncensored',
                'description': 'Two valets share their love for movie star Liam Neesons.',
                'timestamp': 1349922600,
                'upload_date': '20121011',
            },
        },
        # YouTube embed via <data-embed-url="">
        {
            'url': 'https://play.google.com/store/apps/details?id=com.gameloft.android.ANMP.GloftA8HM',
            'info_dict': {
                'id': '4vAffPZIT44',
                'ext': 'mp4',
                'title': 'Asphalt 8: Airborne - Update - Welcome to Dubai!',
                'uploader': 'Gameloft',
                'uploader_id': 'gameloft',
                'upload_date': '20140828',
                'description': 'md5:c80da9ed3d83ae6d1876c834de03e1c4',
            },
            'params': {
                'skip_download': True,
            }
        },
        # YouTube <object> embed
        {
            'url': 'http://www.improbable.com/2017/04/03/untrained-modern-youths-and-ancient-masters-in-selfie-portraits/',
            'md5': '516718101ec834f74318df76259fb3cc',
            'info_dict': {
                'id': 'msN87y-iEx0',
                'ext': 'webm',
                'title': 'Feynman: Mirrors FUN TO IMAGINE 6',
                'upload_date': '20080526',
                'description': 'md5:0ffc78ea3f01b2e2c247d5f8d1d3c18d',
                'uploader': 'Christopher Sykes',
                'uploader_id': 'ChristopherJSykes',
            },
            'add_ie': ['Youtube'],
        },
        # Camtasia studio
        {
            'url': 'http://www.ll.mit.edu/workshops/education/videocourses/antennas/lecture1/video/',
            'playlist': [{
                'md5': '0c5e352edabf715d762b0ad4e6d9ee67',
                'info_dict': {
                    'id': 'Fenn-AA_PA_Radar_Course_Lecture_1c_Final',
                    'title': 'Fenn-AA_PA_Radar_Course_Lecture_1c_Final - video1',
                    'ext': 'flv',
                    'duration': 2235.90,
                }
            }, {
                'md5': '10e4bb3aaca9fd630e273ff92d9f3c63',
                'info_dict': {
                    'id': 'Fenn-AA_PA_Radar_Course_Lecture_1c_Final_PIP',
                    'title': 'Fenn-AA_PA_Radar_Course_Lecture_1c_Final - pip',
                    'ext': 'flv',
                    'duration': 2235.93,
                }
            }],
            'info_dict': {
                'title': 'Fenn-AA_PA_Radar_Course_Lecture_1c_Final',
            }
        },
        # Flowplayer
        {
            'url': 'http://www.handjobhub.com/video/busty-blonde-siri-tit-fuck-while-wank-6313.html',
            'md5': '9d65602bf31c6e20014319c7d07fba27',
            'info_dict': {
                'id': '5123ea6d5e5a7',
                'ext': 'mp4',
                'age_limit': 18,
                'uploader': 'www.handjobhub.com',
                'title': 'Busty Blonde Siri Tit Fuck While Wank at HandjobHub.com',
            }
        },
        # Multiple brightcove videos
        # https://github.com/rg3/youtube-dl/issues/2283
        {
            'url': 'http://www.newyorker.com/online/blogs/newsdesk/2014/01/always-never-nuclear-command-and-control.html',
            'info_dict': {
                'id': 'always-never',
                'title': 'Always / Never - The New Yorker',
            },
            'playlist_count': 3,
            'params': {
                'extract_flat': False,
                'skip_download': True,
            }
        },
        # MLB embed
        {
            'url': 'http://umpire-empire.com/index.php/topic/58125-laz-decides-no-thats-low/',
            'md5': '96f09a37e44da40dd083e12d9a683327',
            'info_dict': {
                'id': '33322633',
                'ext': 'mp4',
                'title': 'Ump changes call to ball',
                'description': 'md5:71c11215384298a172a6dcb4c2e20685',
                'duration': 48,
                'timestamp': 1401537900,
                'upload_date': '20140531',
                'thumbnail': r're:^https?://.*\.jpg$',
            },
        },
        # Wistia embed
        {
            'url': 'http://study.com/academy/lesson/north-american-exploration-failed-colonies-of-spain-france-england.html#lesson',
            'md5': '1953f3a698ab51cfc948ed3992a0b7ff',
            'info_dict': {
                'id': '6e2wtrbdaf',
                'ext': 'mov',
                'title': 'paywall_north-american-exploration-failed-colonies-of-spain-france-england',
                'description': 'a Paywall Videos video from Remilon',
                'duration': 644.072,
                'uploader': 'study.com',
                'timestamp': 1459678540,
                'upload_date': '20160403',
                'filesize': 24687186,
            },
        },
        {
            'url': 'http://thoughtworks.wistia.com/medias/uxjb0lwrcz',
            'md5': 'baf49c2baa8a7de5f3fc145a8506dcd4',
            'info_dict': {
                'id': 'uxjb0lwrcz',
                'ext': 'mp4',
                'title': 'Conversation about Hexagonal Rails Part 1',
                'description': 'a Martin Fowler video from ThoughtWorks',
                'duration': 1715.0,
                'uploader': 'thoughtworks.wistia.com',
                'timestamp': 1401832161,
                'upload_date': '20140603',
            },
        },
        # Wistia standard embed (async)
        {
            'url': 'https://www.getdrip.com/university/brennan-dunn-drip-workshop/',
            'info_dict': {
                'id': '807fafadvk',
                'ext': 'mp4',
                'title': 'Drip Brennan Dunn Workshop',
                'description': 'a JV Webinars video from getdrip-1',
                'duration': 4986.95,
                'timestamp': 1463607249,
                'upload_date': '20160518',
            },
            'params': {
                'skip_download': True,
            }
        },
        # Soundcloud embed
        {
            'url': 'http://nakedsecurity.sophos.com/2014/10/29/sscc-171-are-you-sure-that-1234-is-a-bad-password-podcast/',
            'info_dict': {
                'id': '174391317',
                'ext': 'mp3',
                'description': 'md5:ff867d6b555488ad3c52572bb33d432c',
                'uploader': 'Sophos Security',
                'title': 'Chet Chat 171 - Oct 29, 2014',
                'upload_date': '20141029',
            }
        },
        # Soundcloud multiple embeds
        {
            'url': 'http://www.guitarplayer.com/lessons/1014/legato-workout-one-hour-to-more-fluid-performance---tab/52809',
            'info_dict': {
                'id': '52809',
                'title': 'Guitar Essentials: Legato Workout—One-Hour to Fluid Performance  | TAB + AUDIO',
            },
            'playlist_mincount': 7,
        },
        # TuneIn station embed
        {
            'url': 'http://radiocnrv.com/promouvoir-radio-cnrv/',
            'info_dict': {
                'id': '204146',
                'ext': 'mp3',
                'title': 'CNRV',
                'location': 'Paris, France',
                'is_live': True,
            },
            'params': {
                # Live stream
                'skip_download': True,
            },
        },
        # Livestream embed
        {
            'url': 'http://www.esa.int/Our_Activities/Space_Science/Rosetta/Philae_comet_touch-down_webcast',
            'info_dict': {
                'id': '67864563',
                'ext': 'flv',
                'upload_date': '20141112',
                'title': 'Rosetta #CometLanding webcast HL 10',
            }
        },
        # Another Livestream embed, without 'new.' in URL
        {
            'url': 'https://www.freespeech.org/',
            'info_dict': {
                'id': '123537347',
                'ext': 'mp4',
                'title': 're:^FSTV [0-9]{4}-[0-9]{2}-[0-9]{2} [0-9]{2}:[0-9]{2}$',
            },
            'params': {
                # Live stream
                'skip_download': True,
            },
        },
        # LazyYT
        {
            'url': 'https://skiplagged.com/',
            'info_dict': {
                'id': 'skiplagged',
                'title': 'Skiplagged: The smart way to find cheap flights',
            },
            'playlist_mincount': 1,
            'add_ie': ['Youtube'],
        },
        # Cinchcast embed
        {
            'url': 'http://undergroundwellness.com/podcasts/306-5-steps-to-permanent-gut-healing/',
            'info_dict': {
                'id': '7141703',
                'ext': 'mp3',
                'upload_date': '20141126',
                'title': 'Jack Tips: 5 Steps to Permanent Gut Healing',
            }
        },
        # Cinerama player
        {
            'url': 'http://www.abc.net.au/7.30/content/2015/s4164797.htm',
            'info_dict': {
                'id': '730m_DandD_1901_512k',
                'ext': 'mp4',
                'uploader': 'www.abc.net.au',
                'title': 'Game of Thrones with dice - Dungeons and Dragons fantasy role-playing game gets new life - 19/01/2015',
            }
        },
        # embedded viddler video
        {
            'url': 'http://deadspin.com/i-cant-stop-watching-john-wall-chop-the-nuggets-with-th-1681801597',
            'info_dict': {
                'id': '4d03aad9',
                'ext': 'mp4',
                'uploader': 'deadspin',
                'title': 'WALL-TO-GORTAT',
                'timestamp': 1422285291,
                'upload_date': '20150126',
            },
            'add_ie': ['Viddler'],
        },
        # Libsyn embed
        {
            'url': 'http://thedailyshow.cc.com/podcast/episodetwelve',
            'info_dict': {
                'id': '3377616',
                'ext': 'mp3',
                'title': "The Daily Show Podcast without Jon Stewart - Episode 12: Bassem Youssef: Egypt's Jon Stewart",
                'description': 'md5:601cb790edd05908957dae8aaa866465',
                'upload_date': '20150220',
            },
            'skip': 'All The Daily Show URLs now redirect to http://www.cc.com/shows/',
        },
        # jwplayer YouTube
        {
            'url': 'http://media.nationalarchives.gov.uk/index.php/webinar-using-discovery-national-archives-online-catalogue/',
            'info_dict': {
                'id': 'Mrj4DVp2zeA',
                'ext': 'mp4',
                'upload_date': '20150212',
                'uploader': 'The National Archives UK',
                'description': 'md5:8078af856dca76edc42910b61273dbbf',
                'uploader_id': 'NationalArchives08',
                'title': 'Webinar: Using Discovery, The National Archives’ online catalogue',
            },
        },
        # jwplayer rtmp
        {
            'url': 'http://www.suffolk.edu/sjc/live.php',
            'info_dict': {
                'id': 'live',
                'ext': 'flv',
                'title': 'Massachusetts Supreme Judicial Court Oral Arguments',
                'uploader': 'www.suffolk.edu',
            },
            'params': {
                'skip_download': True,
            },
            'skip': 'Only has video a few mornings per month, see http://www.suffolk.edu/sjc/',
        },
        # Complex jwplayer
        {
            'url': 'http://www.indiedb.com/games/king-machine/videos',
            'info_dict': {
                'id': 'videos',
                'ext': 'mp4',
                'title': 'king machine trailer 1',
                'description': 'Browse King Machine videos & audio for sweet media. Your eyes will thank you.',
                'thumbnail': r're:^https?://.*\.jpg$',
            },
        },
        {
            # JWPlayer config passed as variable
            'url': 'http://www.txxx.com/videos/3326530/ariele/',
            'info_dict': {
                'id': '3326530_hq',
                'ext': 'mp4',
                'title': 'ARIELE | Tube Cup',
                'uploader': 'www.txxx.com',
                'age_limit': 18,
            },
            'params': {
                'skip_download': True,
            }
        },
        {
            # JWPlatform iframe
            'url': 'https://www.mediaite.com/tv/dem-senator-claims-gary-cohn-faked-a-bad-connection-during-trump-call-to-get-him-off-the-phone/',
            'md5': 'ca00a040364b5b439230e7ebfd02c4e9',
            'info_dict': {
                'id': 'O0c5JcKT',
                'ext': 'mp4',
                'upload_date': '20171122',
                'timestamp': 1511366290,
                'title': 'Dem Senator Claims Gary Cohn Faked a Bad Connection During Trump Call to Get Him Off the Phone',
            },
            'add_ie': [JWPlatformIE.ie_key()],
        },
        {
            # Video.js embed, multiple formats
            'url': 'http://ortcam.com/solidworks-урок-6-настройка-чертежа_33f9b7351.html',
            'info_dict': {
                'id': 'yygqldloqIk',
                'ext': 'mp4',
                'title': 'SolidWorks. Урок 6 Настройка чертежа',
                'description': 'md5:baf95267792646afdbf030e4d06b2ab3',
                'upload_date': '20130314',
                'uploader': 'PROстое3D',
                'uploader_id': 'PROstoe3D',
            },
            'params': {
                'skip_download': True,
            },
        },
        {
            # Video.js embed, single format
            'url': 'https://www.vooplayer.com/v3/watch/watch.php?v=NzgwNTg=',
            'info_dict': {
                'id': 'watch',
                'ext': 'mp4',
                'title': 'Step 1 -  Good Foundation',
                'description': 'md5:d1e7ff33a29fc3eb1673d6c270d344f4',
            },
            'params': {
                'skip_download': True,
            },
        },
        # rtl.nl embed
        {
            'url': 'http://www.rtlnieuws.nl/nieuws/buitenland/aanslagen-kopenhagen',
            'playlist_mincount': 5,
            'info_dict': {
                'id': 'aanslagen-kopenhagen',
                'title': 'Aanslagen Kopenhagen',
            }
        },
        # Zapiks embed
        {
            'url': 'http://www.skipass.com/news/116090-bon-appetit-s5ep3-baqueira-mi-cor.html',
            'info_dict': {
                'id': '118046',
                'ext': 'mp4',
                'title': 'EP3S5 - Bon Appétit - Baqueira Mi Corazon !',
            }
        },
        # Kaltura embed (different embed code)
        {
            'url': 'http://www.premierchristianradio.com/Shows/Saturday/Unbelievable/Conference-Videos/Os-Guinness-Is-It-Fools-Talk-Unbelievable-Conference-2014',
            'info_dict': {
                'id': '1_a52wc67y',
                'ext': 'flv',
                'upload_date': '20150127',
                'uploader_id': 'PremierMedia',
                'timestamp': int,
                'title': 'Os Guinness // Is It Fools Talk? // Unbelievable? Conference 2014',
            },
        },
        # Kaltura embed with single quotes
        {
            'url': 'http://fod.infobase.com/p_ViewPlaylist.aspx?AssignmentID=NUN8ZY',
            'info_dict': {
                'id': '0_izeg5utt',
                'ext': 'mp4',
                'title': '35871',
                'timestamp': 1355743100,
                'upload_date': '20121217',
                'uploader_id': 'cplapp@learn360.com',
            },
            'add_ie': ['Kaltura'],
        },
        {
            # Kaltura embedded via quoted entry_id
            'url': 'https://www.oreilly.com/ideas/my-cloud-makes-pretty-pictures',
            'info_dict': {
                'id': '0_utuok90b',
                'ext': 'mp4',
                'title': '06_matthew_brender_raj_dutt',
                'timestamp': 1466638791,
                'upload_date': '20160622',
            },
            'add_ie': ['Kaltura'],
            'expected_warnings': [
                'Could not send HEAD request'
            ],
            'params': {
                'skip_download': True,
            }
        },
        {
            # Kaltura embedded, some fileExt broken (#11480)
            'url': 'http://www.cornell.edu/video/nima-arkani-hamed-standard-models-of-particle-physics',
            'info_dict': {
                'id': '1_sgtvehim',
                'ext': 'mp4',
                'title': 'Our "Standard Models" of particle physics and cosmology',
                'description': 'md5:67ea74807b8c4fea92a6f38d6d323861',
                'timestamp': 1321158993,
                'upload_date': '20111113',
                'uploader_id': 'kps1',
            },
            'add_ie': ['Kaltura'],
        },
        {
            # Kaltura iframe embed
            'url': 'http://www.gsd.harvard.edu/event/i-m-pei-a-centennial-celebration/',
            'md5': 'ae5ace8eb09dc1a35d03b579a9c2cc44',
            'info_dict': {
                'id': '0_f2cfbpwy',
                'ext': 'mp4',
                'title': 'I. M. Pei: A Centennial Celebration',
                'description': 'md5:1db8f40c69edc46ca180ba30c567f37c',
                'upload_date': '20170403',
                'uploader_id': 'batchUser',
                'timestamp': 1491232186,
            },
            'add_ie': ['Kaltura'],
        },
        {
            # Kaltura iframe embed, more sophisticated
            'url': 'http://www.cns.nyu.edu/~eero/math-tools/Videos/lecture-05sep2017.html',
            'info_dict': {
                'id': '1_9gzouybz',
                'ext': 'mp4',
                'title': 'lecture-05sep2017',
                'description': 'md5:40f347d91fd4ba047e511c5321064b49',
                'upload_date': '20170913',
                'uploader_id': 'eps2',
                'timestamp': 1505340777,
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': ['Kaltura'],
        },
        {
            # meta twitter:player
            'url': 'http://thechive.com/2017/12/08/all-i-want-for-christmas-is-more-twerk/',
            'info_dict': {
                'id': '0_01b42zps',
                'ext': 'mp4',
                'title': 'Main Twerk (Video)',
                'upload_date': '20171208',
                'uploader_id': 'sebastian.salinas@thechive.com',
                'timestamp': 1512713057,
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': ['Kaltura'],
        },
        # referrer protected EaglePlatform embed
        {
            'url': 'https://tvrain.ru/lite/teleshow/kak_vse_nachinalos/namin-418921/',
            'info_dict': {
                'id': '582306',
                'ext': 'mp4',
                'title': 'Стас Намин: «Мы нарушили девственность Кремля»',
                'thumbnail': r're:^https?://.*\.jpg$',
                'duration': 3382,
                'view_count': int,
            },
            'params': {
                'skip_download': True,
            },
        },
        # ClipYou (EaglePlatform) embed (custom URL)
        {
            'url': 'http://muz-tv.ru/play/7129/',
            # Not checking MD5 as sometimes the direct HTTP link results in 404 and HLS is used
            'info_dict': {
                'id': '12820',
                'ext': 'mp4',
                'title': "'O Sole Mio",
                'thumbnail': r're:^https?://.*\.jpg$',
                'duration': 216,
                'view_count': int,
            },
            'params': {
                'skip_download': True,
            },
            'skip': 'This video is unavailable.',
        },
        # Pladform embed
        {
            'url': 'http://muz-tv.ru/kinozal/view/7400/',
            'info_dict': {
                'id': '100183293',
                'ext': 'mp4',
                'title': 'Тайны перевала Дятлова • 1 серия 2 часть',
                'description': 'Документальный сериал-расследование одной из самых жутких тайн ХХ века',
                'thumbnail': r're:^https?://.*\.jpg$',
                'duration': 694,
                'age_limit': 0,
            },
            'skip': 'HTTP Error 404: Not Found',
        },
        # Playwire embed
        {
            'url': 'http://www.cinemablend.com/new/First-Joe-Dirt-2-Trailer-Teaser-Stupid-Greatness-70874.html',
            'info_dict': {
                'id': '3519514',
                'ext': 'mp4',
                'title': 'Joe Dirt 2 Beautiful Loser Teaser Trailer',
                'thumbnail': r're:^https?://.*\.png$',
                'duration': 45.115,
            },
        },
        # 5min embed
        {
            'url': 'http://techcrunch.com/video/facebook-creates-on-this-day-crunch-report/518726732/',
            'md5': '4c6f127a30736b59b3e2c19234ee2bf7',
            'info_dict': {
                'id': '518726732',
                'ext': 'mp4',
                'title': 'Facebook Creates "On This Day" | Crunch Report',
                'description': 'Amazon updates Fire TV line, Tesla\'s Model X spotted in the wild',
                'timestamp': 1427237531,
                'uploader': 'Crunch Report',
                'upload_date': '20150324',
            },
            'params': {
                # m3u8 download
                'skip_download': True,
            },
        },
        # Crooks and Liars embed
        {
            'url': 'http://crooksandliars.com/2015/04/fox-friends-says-protecting-atheists',
            'info_dict': {
                'id': '8RUoRhRi',
                'ext': 'mp4',
                'title': "Fox & Friends Says Protecting Atheists From Discrimination Is Anti-Christian!",
                'description': 'md5:e1a46ad1650e3a5ec7196d432799127f',
                'timestamp': 1428207000,
                'upload_date': '20150405',
                'uploader': 'Heather',
            },
        },
        # Crooks and Liars external embed
        {
            'url': 'http://theothermccain.com/2010/02/02/video-proves-that-bill-kristol-has-been-watching-glenn-beck/comment-page-1/',
            'info_dict': {
                'id': 'MTE3MjUtMzQ2MzA',
                'ext': 'mp4',
                'title': 'md5:5e3662a81a4014d24c250d76d41a08d5',
                'description': 'md5:9b8e9542d6c3c5de42d6451b7d780cec',
                'timestamp': 1265032391,
                'upload_date': '20100201',
                'uploader': 'Heather',
            },
        },
        # NBC Sports vplayer embed
        {
            'url': 'http://www.riderfans.com/forum/showthread.php?121827-Freeman&s=e98fa1ea6dc08e886b1678d35212494a',
            'info_dict': {
                'id': 'ln7x1qSThw4k',
                'ext': 'flv',
                'title': "PFT Live: New leader in the 'new-look' defense",
                'description': 'md5:65a19b4bbfb3b0c0c5768bed1dfad74e',
                'uploader': 'NBCU-SPORTS',
                'upload_date': '20140107',
                'timestamp': 1389118457,
            },
            'skip': 'Invalid Page URL',
        },
        # NBC News embed
        {
            'url': 'http://www.vulture.com/2016/06/letterman-couldnt-care-less-about-late-night.html',
            'md5': '1aa589c675898ae6d37a17913cf68d66',
            'info_dict': {
                'id': 'x_dtl_oa_LettermanliftPR_160608',
                'ext': 'mp4',
                'title': 'David Letterman: A Preview',
                'description': 'A preview of Tom Brokaw\'s interview with David Letterman as part of the On Assignment series powered by Dateline. Airs Sunday June 12 at 7/6c.',
                'upload_date': '20160609',
                'timestamp': 1465431544,
                'uploader': 'NBCU-NEWS',
            },
        },
        # UDN embed
        {
            'url': 'https://video.udn.com/news/300346',
            'md5': 'fd2060e988c326991037b9aff9df21a6',
            'info_dict': {
                'id': '300346',
                'ext': 'mp4',
                'title': '中一中男師變性 全校師生力挺',
                'thumbnail': r're:^https?://.*\.jpg$',
            },
            'params': {
                # m3u8 download
                'skip_download': True,
            },
            'expected_warnings': ['Failed to parse JSON Expecting value'],
        },
        # Brightcove URL in single quotes
        {
            'url': 'http://www.sportsnet.ca/baseball/mlb/sn-presents-russell-martin-world-citizen/',
            'md5': '4ae374f1f8b91c889c4b9203c8c752af',
            'info_dict': {
                'id': '4255764656001',
                'ext': 'mp4',
                'title': 'SN Presents: Russell Martin, World Citizen',
                'description': 'To understand why he was the Toronto Blue Jays’ top off-season priority is to appreciate his background and upbringing in Montreal, where he first developed his baseball skills. Written and narrated by Stephen Brunt.',
                'uploader': 'Rogers Sportsnet',
                'uploader_id': '1704050871',
                'upload_date': '20150525',
                'timestamp': 1432570283,
            },
        },
        # OnionStudios embed
        {
            'url': 'http://www.clickhole.com/video/dont-understand-bitcoin-man-will-mumble-explanatio-2537',
            'info_dict': {
                'id': '2855',
                'ext': 'mp4',
                'title': 'Don’t Understand Bitcoin? This Man Will Mumble An Explanation At You',
                'thumbnail': r're:^https?://.*\.jpe?g$',
                'uploader': 'ClickHole',
                'uploader_id': 'clickhole',
            }
        },
        # SnagFilms embed
        {
            'url': 'http://whilewewatch.blogspot.ru/2012/06/whilewewatch-whilewewatch-gripping.html',
            'info_dict': {
                'id': '74849a00-85a9-11e1-9660-123139220831',
                'ext': 'mp4',
                'title': '#whilewewatch',
            }
        },
        # AdobeTVVideo embed
        {
            'url': 'https://helpx.adobe.com/acrobat/how-to/new-experience-acrobat-dc.html?set=acrobat--get-started--essential-beginners',
            'md5': '43662b577c018ad707a63766462b1e87',
            'info_dict': {
                'id': '2456',
                'ext': 'mp4',
                'title': 'New experience with Acrobat DC',
                'description': 'New experience with Acrobat DC',
                'duration': 248.667,
            },
        },
        # BrightcoveInPageEmbed embed
        {
            'url': 'http://www.geekandsundry.com/tabletop-bonus-wils-final-thoughts-on-dread/',
            'info_dict': {
                'id': '4238694884001',
                'ext': 'flv',
                'title': 'Tabletop: Dread, Last Thoughts',
                'description': 'Tabletop: Dread, Last Thoughts',
                'duration': 51690,
            },
        },
        # Brightcove embed, with no valid 'renditions' but valid 'IOSRenditions'
        # This video can't be played in browsers if Flash is disabled and the UA is set to iPhone, which is actually a false alarm
        {
            'url': 'https://dl.dropboxusercontent.com/u/29092637/interview.html',
            'info_dict': {
                'id': '4785848093001',
                'ext': 'mp4',
                'title': 'The Cardinal Pell Interview',
                'description': 'Sky News Contributor Andrew Bolt interviews George Pell in Rome, following the Cardinal\'s evidence before the Royal Commission into Child Abuse. ',
                'uploader': 'GlobeCast Australia - GlobeStream',
                'uploader_id': '2733773828001',
                'upload_date': '20160304',
                'timestamp': 1457083087,
            },
            'params': {
                # m3u8 downloads
                'skip_download': True,
            },
        },
        {
            # Brightcove embed with whitespace around attribute names
            'url': 'http://www.stack.com/video/3167554373001/learn-to-hit-open-three-pointers-with-damian-lillard-s-baseline-drift-drill',
            'info_dict': {
                'id': '3167554373001',
                'ext': 'mp4',
                'title': "Learn to Hit Open Three-Pointers With Damian Lillard's Baseline Drift Drill",
                'description': 'md5:57bacb0e0f29349de4972bfda3191713',
                'uploader_id': '1079349493',
                'upload_date': '20140207',
                'timestamp': 1391810548,
            },
            'params': {
                'skip_download': True,
            },
        },
        # Another form of arte.tv embed
        {
            'url': 'http://www.tv-replay.fr/redirection/09-04-16/arte-reportage-arte-11508975.html',
            'md5': '850bfe45417ddf221288c88a0cffe2e2',
            'info_dict': {
                'id': '030273-562_PLUS7-F',
                'ext': 'mp4',
                'title': 'ARTE Reportage - Nulle part, en France',
                'description': 'md5:e3a0e8868ed7303ed509b9e3af2b870d',
                'upload_date': '20160409',
            },
        },
        # LiveLeak embed
        {
            'url': 'http://www.wykop.pl/link/3088787/',
            'md5': '7619da8c820e835bef21a1efa2a0fc71',
            'info_dict': {
                'id': '874_1459135191',
                'ext': 'mp4',
                'title': 'Man shows poor quality of new apartment building',
                'description': 'The wall is like a sand pile.',
                'uploader': 'Lake8737',
            },
            'add_ie': [LiveLeakIE.ie_key()],
        },
        # Another LiveLeak embed pattern (#13336)
        {
            'url': 'https://milo.yiannopoulos.net/2017/06/concealed-carry-robbery/',
            'info_dict': {
                'id': '2eb_1496309988',
                'ext': 'mp4',
                'title': 'Thief robs place where everyone was armed',
                'description': 'md5:694d73ee79e535953cf2488562288eee',
                'uploader': 'brazilwtf',
            },
            'add_ie': [LiveLeakIE.ie_key()],
        },
        # Duplicated embedded video URLs
        {
            'url': 'http://www.hudl.com/athlete/2538180/highlights/149298443',
            'info_dict': {
                'id': '149298443_480_16c25b74_2',
                'ext': 'mp4',
                'title': 'vs. Blue Orange Spring Game',
                'uploader': 'www.hudl.com',
            },
        },
        # twitter:player:stream embed
        {
            'url': 'http://www.rtl.be/info/video/589263.aspx?CategoryID=288',
            'info_dict': {
                'id': 'master',
                'ext': 'mp4',
                'title': 'Une nouvelle espèce de dinosaure découverte en Argentine',
                'uploader': 'www.rtl.be',
            },
            'params': {
                # m3u8 downloads
                'skip_download': True,
            },
        },
        # twitter:player embed
        {
            'url': 'http://www.theatlantic.com/video/index/484130/what-do-black-holes-sound-like/',
            'md5': 'a3e0df96369831de324f0778e126653c',
            'info_dict': {
                'id': '4909620399001',
                'ext': 'mp4',
                'title': 'What Do Black Holes Sound Like?',
                'description': 'what do black holes sound like',
                'upload_date': '20160524',
                'uploader_id': '29913724001',
                'timestamp': 1464107587,
                'uploader': 'TheAtlantic',
            },
            'add_ie': ['BrightcoveLegacy'],
        },
        # Facebook <iframe> embed
        {
            'url': 'https://www.hostblogger.de/blog/archives/6181-Auto-jagt-Betonmischer.html',
            'md5': 'fbcde74f534176ecb015849146dd3aee',
            'info_dict': {
                'id': '599637780109885',
                'ext': 'mp4',
                'title': 'Facebook video #599637780109885',
            },
        },
        # Facebook <iframe> embed, plugin video
        {
            'url': 'http://5pillarsuk.com/2017/06/07/tariq-ramadan-disagrees-with-pr-exercise-by-imams-refusing-funeral-prayers-for-london-attackers/',
            'info_dict': {
                'id': '1754168231264132',
                'ext': 'mp4',
                'title': 'About the Imams and Religious leaders refusing to perform funeral prayers for...',
                'uploader': 'Tariq Ramadan (official)',
                'timestamp': 1496758379,
                'upload_date': '20170606',
            },
            'params': {
                'skip_download': True,
            },
        },
        # Facebook API embed
        {
            'url': 'http://www.lothype.com/blue-stars-2016-preview-standstill-full-show/',
            'md5': 'a47372ee61b39a7b90287094d447d94e',
            'info_dict': {
                'id': '10153467542406923',
                'ext': 'mp4',
                'title': 'Facebook video #10153467542406923',
            },
        },
        # Wordpress "YouTube Video Importer" plugin
        {
            'url': 'http://www.lothype.com/blue-devils-drumline-stanford-lot-2016/',
            'md5': 'd16797741b560b485194eddda8121b48',
            'info_dict': {
                'id': 'HNTXWDXV9Is',
                'ext': 'mp4',
                'title': 'Blue Devils Drumline Stanford lot 2016',
                'upload_date': '20160627',
                'uploader_id': 'GENOCIDE8GENERAL10',
                'uploader': 'cylus cyrus',
            },
        },
        {
            # video stored on custom kaltura server
            'url': 'http://www.expansion.com/multimedia/videos.html?media=EQcM30NHIPv',
            'md5': '537617d06e64dfed891fa1593c4b30cc',
            'info_dict': {
                'id': '0_1iotm5bh',
                'ext': 'mp4',
                'title': 'Elecciones británicas: 5 lecciones para Rajoy',
                'description': 'md5:435a89d68b9760b92ce67ed227055f16',
                'uploader_id': 'videos.expansion@el-mundo.net',
                'upload_date': '20150429',
                'timestamp': 1430303472,
            },
            'add_ie': ['Kaltura'],
        },
        {
            # Non-standard Vimeo embed
            'url': 'https://openclassrooms.com/courses/understanding-the-web',
            'md5': '64d86f1c7d369afd9a78b38cbb88d80a',
            'info_dict': {
                'id': '148867247',
                'ext': 'mp4',
                'title': 'Understanding the web - Teaser',
                'description': 'This is "Understanding the web - Teaser" by openclassrooms on Vimeo, the home for high quality videos and the people who love them.',
                'upload_date': '20151214',
                'uploader': 'OpenClassrooms',
                'uploader_id': 'openclassrooms',
            },
            'add_ie': ['Vimeo'],
        },
        {
            # generic vimeo embed that requires original URL passed as Referer
            'url': 'http://racing4everyone.eu/2016/07/30/formula-1-2016-round12-germany/',
            'only_matching': True,
        },
        {
            'url': 'https://support.arkena.com/display/PLAY/Ways+to+embed+your+video',
            'md5': 'b96f2f71b359a8ecd05ce4e1daa72365',
            'info_dict': {
                'id': 'b41dda37-d8e7-4d3f-b1b5-9a9db578bdfe',
                'ext': 'mp4',
                'title': 'Big Buck Bunny',
                'description': 'Royalty free test video',
                'timestamp': 1432816365,
                'upload_date': '20150528',
                'is_live': False,
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': [ArkenaIE.ie_key()],
        },
        {
            'url': 'http://nova.bg/news/view/2016/08/16/156543/%D0%BD%D0%B0-%D0%BA%D0%BE%D1%81%D1%8A%D0%BC-%D0%BE%D1%82-%D0%B2%D0%B7%D1%80%D0%B8%D0%B2-%D0%BE%D1%82%D1%86%D0%B5%D0%BF%D0%B8%D1%85%D0%B0-%D1%86%D1%8F%D0%BB-%D0%BA%D0%B2%D0%B0%D1%80%D1%82%D0%B0%D0%BB-%D0%B7%D0%B0%D1%80%D0%B0%D0%B4%D0%B8-%D0%B8%D0%B7%D1%82%D0%B8%D1%87%D0%B0%D0%BD%D0%B5-%D0%BD%D0%B0-%D0%B3%D0%B0%D0%B7-%D0%B2-%D0%BF%D0%BB%D0%BE%D0%B2%D0%B4%D0%B8%D0%B2/',
            'info_dict': {
                'id': '1c7141f46c',
                'ext': 'mp4',
                'title': 'НА КОСЪМ ОТ ВЗРИВ: Изтичане на газ на бензиностанция в Пловдив',
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': [Vbox7IE.ie_key()],
        },
        {
            # DBTV embeds
            'url': 'http://www.dagbladet.no/2016/02/23/nyheter/nordlys/ski/troms/ver/43254897/',
            'info_dict': {
                'id': '43254897',
                'title': 'Etter ett års planlegging, klaffet endelig alt: - Jeg måtte ta en liten dans',
            },
            'playlist_mincount': 3,
        },
        {
            # Videa embeds
            'url': 'http://forum.dvdtalk.com/movie-talk/623756-deleted-magic-star-wars-ot-deleted-alt-scenes-docu-style.html',
            'info_dict': {
                'id': '623756-deleted-magic-star-wars-ot-deleted-alt-scenes-docu-style',
                'title': 'Deleted Magic - Star Wars: OT Deleted / Alt. Scenes Docu. Style - DVD Talk Forum',
            },
            'playlist_mincount': 2,
        },
        {
            # 20 minuten embed
            'url': 'http://www.20min.ch/schweiz/news/story/So-kommen-Sie-bei-Eis-und-Schnee-sicher-an-27032552',
            'info_dict': {
                'id': '523629',
                'ext': 'mp4',
                'title': 'So kommen Sie bei Eis und Schnee sicher an',
                'description': 'md5:117c212f64b25e3d95747e5276863f7d',
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': [TwentyMinutenIE.ie_key()],
        },
        {
            # VideoPress embed
            'url': 'https://en.support.wordpress.com/videopress/',
            'info_dict': {
                'id': 'OcobLTqC',
                'ext': 'm4v',
                'title': 'IMG_5786',
                'timestamp': 1435711927,
                'upload_date': '20150701',
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': [VideoPressIE.ie_key()],
        },
        {
            # Rutube embed
            'url': 'http://magazzino.friday.ru/videos/vipuski/kazan-2',
            'info_dict': {
                'id': '9b3d5bee0a8740bf70dfd29d3ea43541',
                'ext': 'flv',
                'title': 'Магаззино: Казань 2',
                'description': 'md5:99bccdfac2269f0e8fdbc4bbc9db184a',
                'uploader': 'Магаззино',
                'upload_date': '20170228',
                'uploader_id': '996642',
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': [RutubeIE.ie_key()],
        },
        {
            # ThePlatform embedded with whitespaces in URLs
            'url': 'http://www.golfchannel.com/topics/shows/golftalkcentral.htm',
            'only_matching': True,
        },
        {
            # Senate ISVP iframe https
            'url': 'https://www.hsgac.senate.gov/hearings/canadas-fast-track-refugee-plan-unanswered-questions-and-implications-for-us-national-security',
            'md5': 'fb8c70b0b515e5037981a2492099aab8',
            'info_dict': {
                'id': 'govtaff020316',
                'ext': 'mp4',
                'title': 'Integrated Senate Video Player',
            },
            'add_ie': [SenateISVPIE.ie_key()],
        },
        {
            # Limelight embeds (1 channel embed + 4 media embeds)
            'url': 'http://www.sedona.com/FacilitatorTraining2017',
            'info_dict': {
                'id': 'FacilitatorTraining2017',
                'title': 'Facilitator Training 2017',
            },
            'playlist_mincount': 5,
        },
        {
            # Limelight embed (LimelightPlayerUtil.embed)
            'url': 'https://tv5.ca/videos?v=xuu8qowr291ri',
            'info_dict': {
                'id': '95d035dc5c8a401588e9c0e6bd1e9c92',
                'ext': 'mp4',
                'title': '07448641',
                'timestamp': 1499890639,
                'upload_date': '20170712',
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': ['LimelightMedia'],
        },
        {
            'url': 'http://kron4.com/2017/04/28/standoff-with-walnut-creek-murder-suspect-ends-with-arrest/',
            'info_dict': {
                'id': 'standoff-with-walnut-creek-murder-suspect-ends-with-arrest',
                'title': 'Standoff with Walnut Creek murder suspect ends',
                'description': 'md5:3ccc48a60fc9441eeccfc9c469ebf788',
            },
            'playlist_mincount': 4,
        },
        {
            # WashingtonPost embed
            'url': 'http://www.vanityfair.com/hollywood/2017/04/donald-trump-tv-pitches',
            'info_dict': {
                'id': '8caf6e88-d0ec-11e5-90d3-34c2c42653ac',
                'ext': 'mp4',
                'title': "No one has seen the drama series based on Trump's life \u2014 until now",
                'description': 'Donald Trump wanted a weekly TV drama based on his life. It never aired. But The Washington Post recently obtained a scene from the pilot script — and enlisted actors.',
                'timestamp': 1455216756,
                'uploader': 'The Washington Post',
                'upload_date': '20160211',
            },
            'add_ie': [WashingtonPostIE.ie_key()],
        },
        {
            # Mediaset embed
            'url': 'http://www.tgcom24.mediaset.it/politica/serracchiani-voglio-vivere-in-una-societa-aperta-reazioni-sproporzionate-_3071354-201702a.shtml',
            'info_dict': {
                'id': '720642',
                'ext': 'mp4',
                'title': 'Serracchiani: "Voglio vivere in una società aperta, con tutela del patto di fiducia"',
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': [MediasetIE.ie_key()],
        },
        {
            # JOJ.sk embeds
            'url': 'https://www.noviny.sk/slovensko/238543-slovenskom-sa-prehnala-vlna-silnych-burok',
            'info_dict': {
                'id': '238543-slovenskom-sa-prehnala-vlna-silnych-burok',
                'title': 'Slovenskom sa prehnala vlna silných búrok',
            },
            'playlist_mincount': 5,
            'add_ie': [JojIE.ie_key()],
        },
        {
            # AMP embed (see https://www.ampproject.org/docs/reference/components/amp-video)
            'url': 'https://tvrain.ru/amp/418921/',
            'md5': 'cc00413936695987e8de148b67d14f1d',
            'info_dict': {
                'id': '418921',
                'ext': 'mp4',
                'title': 'Стас Намин: «Мы нарушили девственность Кремля»',
            },
        },
        {
            # vzaar embed
            'url': 'http://help.vzaar.com/article/165-embedding-video',
            'md5': '7e3919d9d2620b89e3e00bec7fe8c9d4',
            'info_dict': {
                'id': '8707641',
                'ext': 'mp4',
                'title': 'Building A Business Online: Principal Chairs Q & A',
            },
        },
        {
            # multiple HTML5 videos on one page
            'url': 'https://www.paragon-software.com/home/rk-free/keyscenarios.html',
            'info_dict': {
                'id': 'keyscenarios',
                'title': 'Rescue Kit 14 Free Edition - Getting started',
            },
            'playlist_count': 4,
        },
        {
            # vshare embed
            'url': 'https://youtube-dl-demo.neocities.org/vshare.html',
            'md5': '17b39f55b5497ae8b59f5fbce8e35886',
            'info_dict': {
                'id': '0f64ce6',
                'title': 'vl14062007715967',
                'ext': 'mp4',
            }
        },
        {
            'url': 'http://www.heidelberg-laureate-forum.org/blog/video/lecture-friday-september-23-2016-sir-c-antony-r-hoare/',
            'md5': 'aecd089f55b1cb5a59032cb049d3a356',
            'info_dict': {
                'id': '90227f51a80c4d8f86c345a7fa62bd9a1d',
                'ext': 'mp4',
                'title': 'Lecture: Friday, September 23, 2016 - Sir Tony Hoare',
                'description': 'md5:5a51db84a62def7b7054df2ade403c6c',
                'timestamp': 1474354800,
                'upload_date': '20160920',
            }
        },
        {
            'url': 'http://www.kidzworld.com/article/30935-trolls-the-beat-goes-on-interview-skylar-astin-and-amanda-leighton',
            'info_dict': {
                'id': '1731611',
                'ext': 'mp4',
                'title': 'Official Trailer | TROLLS: THE BEAT GOES ON!',
                'description': 'md5:eb5f23826a027ba95277d105f248b825',
                'timestamp': 1516100691,
                'upload_date': '20180116',
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': [SpringboardPlatformIE.ie_key()],
        },
        {
            'url': 'https://www.youtube.com/shared?ci=1nEzmT-M4fU',
            'info_dict': {
                'id': 'uPDB5I9wfp8',
                'ext': 'webm',
                'title': 'Pocoyo: 90 minutos de episódios completos Português para crianças - PARTE 3',
                'description': 'md5:d9e4d9346a2dfff4c7dc4c8cec0f546d',
                'upload_date': '20160219',
                'uploader': 'Pocoyo - Português (BR)',
                'uploader_id': 'PocoyoBrazil',
            },
            'add_ie': [YoutubeIE.ie_key()],
            'params': {
                'skip_download': True,
            },
        },
        {
            'url': 'https://www.yapfiles.ru/show/1872528/690b05d3054d2dbe1e69523aa21bb3b1.mp4.html',
            'info_dict': {
                'id': 'vMDE4NzI1Mjgt690b',
                'ext': 'mp4',
                'title': 'Котята',
            },
            'add_ie': [YapFilesIE.ie_key()],
            'params': {
                'skip_download': True,
            },
        },
        {
            # CloudflareStream embed
            'url': 'https://www.cloudflare.com/products/cloudflare-stream/',
            'info_dict': {
                'id': '31c9291ab41fac05471db4e73aa11717',
                'ext': 'mp4',
                'title': '31c9291ab41fac05471db4e73aa11717',
            },
            'add_ie': [CloudflareStreamIE.ie_key()],
            'params': {
                'skip_download': True,
            },
        },
        {
            # PeerTube embed
            'url': 'https://joinpeertube.org/fr/home/',
            'info_dict': {
                'id': 'home',
                'title': 'Reprenez le contrôle de vos vidéos ! #JoinPeertube',
            },
            'playlist_count': 2,
        },
        {
            # Indavideo embed
            'url': 'https://streetkitchen.hu/receptek/igy_kell_otthon_hamburgert_sutni/',
            'info_dict': {
                'id': '1693903',
                'ext': 'mp4',
                'title': 'Így kell otthon hamburgert sütni',
                'description': 'md5:f5a730ecf900a5c852e1e00540bbb0f7',
                'timestamp': 1426330212,
                'upload_date': '20150314',
                'uploader': 'StreetKitchen',
                'uploader_id': '546363',
            },
            'add_ie': [IndavideoEmbedIE.ie_key()],
            'params': {
                'skip_download': True,
            },
        },
        {
            # APA embed via JWPlatform embed
            'url': 'http://www.vol.at/blue-man-group/5593454',
            'info_dict': {
                'id': 'jjv85FdZ',
                'ext': 'mp4',
                'title': '"Blau ist mysteriös": Die Blue Man Group im Interview',
                'description': 'md5:d41d8cd98f00b204e9800998ecf8427e',
                'thumbnail': r're:^https?://.*\.jpg$',
                'duration': 254,
                'timestamp': 1519211149,
                'upload_date': '20180221',
            },
            'params': {
                'skip_download': True,
            },
        },
        {
            'url': 'http://share-videos.se/auto/video/83645793?uid=13',
            'md5': 'b68d276de422ab07ee1d49388103f457',
            'info_dict': {
                'id': '83645793',
                'title': 'Lock up and get excited',
                'ext': 'mp4'
            },
            'skip': 'TODO: fix nested playlists processing in tests',
        },
        {
            # Viqeo embeds
            'url': 'https://viqeo.tv/',
            'info_dict': {
                'id': 'viqeo',
                'title': 'All-new video platform',
            },
            'playlist_count': 6,
        },
        {
            # videojs embed
            'url': 'https://video.sibnet.ru/shell.php?videoid=3422904',
            'info_dict': {
                'id': 'shell',
                'ext': 'mp4',
                'title': 'Доставщик пиццы спросил разрешения сыграть на фортепиано',
                'description': 'md5:89209cdc587dab1e4a090453dbaa2cb1',
                'thumbnail': r're:^https?://.*\.jpg$',
            },
            'params': {
                'skip_download': True,
            },
            'expected_warnings': ['Failed to download MPD manifest'],
        },
        # {
        #     # TODO: find another test
        #     # http://schema.org/VideoObject
        #     'url': 'https://flipagram.com/f/nyvTSJMKId',
        #     'md5': '888dcf08b7ea671381f00fab74692755',
        #     'info_dict': {
        #         'id': 'nyvTSJMKId',
        #         'ext': 'mp4',
        #         'title': 'Flipagram by sjuria101 featuring Midnight Memories by One Direction',
        #         'description': '#love for cats.',
        #         'timestamp': 1461244995,
        #         'upload_date': '20160421',
        #     },
        #     'params': {
        #         'force_generic_extractor': True,
        #     },
        # }
    ]

    def report_following_redirect(self, new_url):
        """Print a '[redirect]' notice naming the URL extraction continues at."""
        notice = '[redirect] Following redirect to %s' % new_url
        self._downloader.to_screen(notice)

    def _extract_rss(self, url, video_id, doc):
        playlist_title = doc.find('./channel/title').text
        playlist_desc_el = doc.find('./channel/description')
        playlist_desc = None if playlist_desc_el is None else playlist_desc_el.text

        entries = []
        for it in doc.findall('./channel/item'):
            next_url = None
            enclosure_nodes = it.findall('./enclosure')
            for e in enclosure_nodes:
                next_url = e.attrib.get('url')
                if next_url:
                    break

            if not next_url:
                next_url = xpath_text(it, 'link', fatal=False)

            if not next_url:
                continue

            entries.append({
                '_type': 'url_transparent',
                'url': next_url,
                'title': it.find('title').text,
            })

        return {
            '_type': 'playlist',
            'id': url,
            'title': playlist_title,
            'description': playlist_desc,
            'entries': entries,
        }

    def _extract_camtasia(self, url, video_id, webpage):
        """ Returns None if no camtasia video can be found. """

        camtasia_cfg = self._search_regex(
            r'fo\.addVariable\(\s*"csConfigFile",\s*"([^"]+)"\s*\);',
            webpage, 'camtasia configuration file', default=None)
        if camtasia_cfg is None:
            return None

        title = self._html_search_meta('DC.title', webpage, fatal=True)

        camtasia_url = compat_urlparse.urljoin(url, camtasia_cfg)
        camtasia_cfg = self._download_xml(
            camtasia_url, video_id,
            note='Downloading camtasia configuration',
            errnote='Failed to download camtasia configuration')
        fileset_node = camtasia_cfg.find('./playlist/array/fileset')

        entries = []
        for n in fileset_node.getchildren():
            url_n = n.find('./uri')
            if url_n is None:
                continue

            entries.append({
                'id': os.path.splitext(url_n.text.rpartition('/')[2])[0],
                'title': '%s - %s' % (title, n.tag),
                'url': compat_urlparse.urljoin(url, url_n.text),
                'duration': float_or_none(n.find('./duration').text),
            })

        return {
            '_type': 'playlist',
            'entries': entries,
            'title': title,
        }

    def _real_extract(self, url):
        if url.startswith('//'):
            return {
                '_type': 'url',
                'url': self.http_scheme() + url,
            }

        parsed_url = compat_urlparse.urlparse(url)
        if not parsed_url.scheme:
            default_search = self._downloader.params.get('default_search')
            if default_search is None:
                default_search = 'fixup_error'

            if default_search in ('auto', 'auto_warning', 'fixup_error'):
                if '/' in url:
                    self._downloader.report_warning('The url doesn\'t specify the protocol, trying with http')
                    return self.url_result('http://' + url)
                elif default_search != 'fixup_error':
                    if default_search == 'auto_warning':
                        if re.match(r'^(?:url|URL)$', url):
                            raise ExtractorError(
                                'Invalid URL:  %r . Call youtube-dl like this:  youtube-dl -v "https://www.youtube.com/watch?v=BaW_jenozKc"  ' % url,
                                expected=True)
                        else:
                            self._downloader.report_warning(
                                'Falling back to youtube search for  %s . Set --default-search "auto" to suppress this warning.' % url)
                    return self.url_result('ytsearch:' + url)

            if default_search in ('error', 'fixup_error'):
                raise ExtractorError(
                    '%r is not a valid URL. '
                    'Set --default-search "ytsearch" (or run  youtube-dl "ytsearch:%s" ) to search YouTube'
                    % (url, url), expected=True)
            else:
                if ':' not in default_search:
                    default_search += ':'
                return self.url_result(default_search + url)

        url, smuggled_data = unsmuggle_url(url)
        force_videoid = None
        is_intentional = smuggled_data and smuggled_data.get('to_generic')
        if smuggled_data and 'force_videoid' in smuggled_data:
            force_videoid = smuggled_data['force_videoid']
            video_id = force_videoid
        else:
            video_id = self._generic_id(url)

        self.to_screen('%s: Requesting header' % video_id)

        head_req = HEADRequest(url)
        head_response = self._request_webpage(
            head_req, video_id,
            note=False, errnote='Could not send HEAD request to %s' % url,
            fatal=False)

        if head_response is not False:
            # Check for redirect
            new_url = compat_str(head_response.geturl())
            if url != new_url:
                self.report_following_redirect(new_url)
                if force_videoid:
                    new_url = smuggle_url(
                        new_url, {'force_videoid': force_videoid})
                return self.url_result(new_url)

        full_response = None
        if head_response is False:
            request = sanitized_Request(url)
            request.add_header('Accept-Encoding', '*')
            full_response = self._request_webpage(request, video_id)
            head_response = full_response

        info_dict = {
            'id': video_id,
            'title': self._generic_title(url),
            'upload_date': unified_strdate(head_response.headers.get('Last-Modified'))
        }

        # Check for direct link to a video
        content_type = head_response.headers.get('Content-Type', '').lower()
        m = re.match(r'^(?P<type>audio|video|application(?=/(?:ogg$|(?:vnd\.apple\.|x-)?mpegurl)))/(?P<format_id>[^;\s]+)', content_type)
        if m:
            format_id = compat_str(m.group('format_id'))
            if format_id.endswith('mpegurl'):
                formats = self._extract_m3u8_formats(url, video_id, 'mp4')
            elif format_id == 'f4m':
                formats = self._extract_f4m_formats(url, video_id)
            else:
                formats = [{
                    'format_id': format_id,
                    'url': url,
                    'vcodec': 'none' if m.group('type') == 'audio' else None
                }]
                info_dict['direct'] = True
            self._sort_formats(formats)
            info_dict['formats'] = formats
            return info_dict

        if not self._downloader.params.get('test', False) and not is_intentional:
            force = self._downloader.params.get('force_generic_extractor', False)
            self._downloader.report_warning(
                '%s on generic information extractor.' % ('Forcing' if force else 'Falling back'))

        if not full_response:
            request = sanitized_Request(url)
            # Some webservers may serve compressed content of rather big size (e.g. gzipped flac)
            # making it impossible to download only a chunk of the file (yet we need only the first
            # 512 bytes to test whether it's HTML or not). With youtube-dl's default Accept-Encoding
            # this would always result in downloading the whole file, which is not desirable.
            # Therefore for the extraction pass we have to override Accept-Encoding to any in order
            # to accept raw bytes and be able to download only a chunk.
            # It would probably be better to solve this by checking Content-Type for application/octet-stream
            # after the HEAD request finishes, but we are not sure whether we can rely on this.
            request.add_header('Accept-Encoding', '*')
            full_response = self._request_webpage(request, video_id)

        first_bytes = full_response.read(512)

        # Is it an M3U playlist?
        if first_bytes.startswith(b'#EXTM3U'):
            info_dict['formats'] = self._extract_m3u8_formats(url, video_id, 'mp4')
            self._sort_formats(info_dict['formats'])
            return info_dict

        # Maybe it's a direct link to a video?
        # Be careful not to download the whole thing!
        if not is_html(first_bytes):
            self._downloader.report_warning(
                'URL could be a direct video link, returning it as such.')
            info_dict.update({
                'direct': True,
                'url': url,
            })
            return info_dict

        webpage = self._webpage_read_content(
            full_response, url, video_id, prefix=first_bytes)

        self.report_extraction(video_id)

        # Is it an RSS feed, a SMIL file, an XSPF playlist or a MPD manifest?
        try:
            doc = compat_etree_fromstring(webpage.encode('utf-8'))
            if doc.tag == 'rss':
                return self._extract_rss(url, video_id, doc)
            elif doc.tag == 'SmoothStreamingMedia':
                info_dict['formats'] = self._parse_ism_formats(doc, url)
                self._sort_formats(info_dict['formats'])
                return info_dict
            elif re.match(r'^(?:{[^}]+})?smil$', doc.tag):
                smil = self._parse_smil(doc, url, video_id)
                self._sort_formats(smil['formats'])
                return smil
            elif doc.tag == '{http://xspf.org/ns/0/}playlist':
                return self.playlist_result(
                    self._parse_xspf(
                        doc, video_id, xspf_url=url,
                        xspf_base_url=compat_str(full_response.geturl())),
                    video_id)
            elif re.match(r'(?i)^(?:{[^}]+})?MPD$', doc.tag):
                info_dict['formats'] = self._parse_mpd_formats(
                    doc,
                    mpd_base_url=compat_str(full_response.geturl()).rpartition('/')[0],
                    mpd_url=url)
                self._sort_formats(info_dict['formats'])
                return info_dict
            elif re.match(r'^{http://ns\.adobe\.com/f4m/[12]\.0}manifest$', doc.tag):
                info_dict['formats'] = self._parse_f4m_formats(doc, url, video_id)
                self._sort_formats(info_dict['formats'])
                return info_dict
        except compat_xml_parse_error:
            pass

        # Is it a Camtasia project?
        camtasia_res = self._extract_camtasia(url, video_id, webpage)
        if camtasia_res is not None:
            return camtasia_res

        # Sometimes embedded video player is hidden behind percent encoding
        # (e.g. https://github.com/rg3/youtube-dl/issues/2448)
        # Unescaping the whole page allows to handle those cases in a generic way
        webpage = compat_urllib_parse_unquote(webpage)

        # it's tempting to parse this further, but you would
        # have to take into account all the variations like
        #   Video Title - Site Name
        #   Site Name | Video Title
        #   Video Title - Tagline | Site Name
        # and so on and so forth; it's just not practical
        video_title = self._og_search_title(
            webpage, default=None) or self._html_search_regex(
            r'(?s)<title>(.*?)</title>', webpage, 'video title',
            default='video')

        # Try to detect age limit automatically
        age_limit = self._rta_search(webpage)
        # And then there are the jokers who advertise that they use RTA,
        # but actually don't.
        AGE_LIMIT_MARKERS = [
            r'Proudly Labeled <a href="http://www\.rtalabel\.org/" title="Restricted to Adults">RTA</a>',
        ]
        if any(re.search(marker, webpage) for marker in AGE_LIMIT_MARKERS):
            age_limit = 18

        # video uploader is domain name
        video_uploader = self._search_regex(
            r'^(?:https?://)?([^/]*)/.*', url, 'video uploader')

        video_description = self._og_search_description(webpage, default=None)
        video_thumbnail = self._og_search_thumbnail(webpage, default=None)

        info_dict.update({
            'title': video_title,
            'description': video_description,
            'thumbnail': video_thumbnail,
            'age_limit': age_limit,
        })

        # Look for Brightcove Legacy Studio embeds
        bc_urls = BrightcoveLegacyIE._extract_brightcove_urls(webpage)
        if bc_urls:
            entries = [{
                '_type': 'url',
                'url': smuggle_url(bc_url, {'Referer': url}),
                'ie_key': 'BrightcoveLegacy'
            } for bc_url in bc_urls]

            return {
                '_type': 'playlist',
                'title': video_title,
                'id': video_id,
                'entries': entries,
            }

        # Look for Brightcove New Studio embeds
        bc_urls = BrightcoveNewIE._extract_urls(self, webpage)
        if bc_urls:
            return self.playlist_from_matches(
                bc_urls, video_id, video_title,
                getter=lambda x: smuggle_url(x, {'referrer': url}),
                ie='BrightcoveNew')

        # Look for Nexx embeds
        nexx_urls = NexxIE._extract_urls(webpage)
        if nexx_urls:
            return self.playlist_from_matches(nexx_urls, video_id, video_title, ie=NexxIE.ie_key())

        # Look for Nexx iFrame embeds
        nexx_embed_urls = NexxEmbedIE._extract_urls(webpage)
        if nexx_embed_urls:
            return self.playlist_from_matches(nexx_embed_urls, video_id, video_title, ie=NexxEmbedIE.ie_key())

        # Look for ThePlatform embeds
        tp_urls = ThePlatformIE._extract_urls(webpage)
        if tp_urls:
            return self.playlist_from_matches(tp_urls, video_id, video_title, ie='ThePlatform')

        # Look for Vessel embeds
        vessel_urls = VesselIE._extract_urls(webpage)
        if vessel_urls:
            return self.playlist_from_matches(vessel_urls, video_id, video_title, ie=VesselIE.ie_key())

        # Look for embedded rtl.nl player
        matches = re.findall(
            r'<iframe[^>]+?src="((?:https?:)?//(?:(?:www|static)\.)?rtl\.nl/(?:system/videoplayer/[^"]+(?:video_)?)?embed[^"]+)"',
            webpage)
        if matches:
            return self.playlist_from_matches(matches, video_id, video_title, ie='RtlNl')

        vimeo_urls = VimeoIE._extract_urls(url, webpage)
        if vimeo_urls:
            return self.playlist_from_matches(vimeo_urls, video_id, video_title, ie=VimeoIE.ie_key())

        vid_me_embed_url = self._search_regex(
            r'src=[\'"](https?://vid\.me/[^\'"]+)[\'"]',
            webpage, 'vid.me embed', default=None)
        if vid_me_embed_url is not None:
            return self.url_result(vid_me_embed_url, 'Vidme')

        # Look for YouTube embeds
        youtube_urls = YoutubeIE._extract_urls(webpage)
        if youtube_urls:
            return self.playlist_from_matches(
                youtube_urls, video_id, video_title, ie=YoutubeIE.ie_key())

        matches = DailymotionIE._extract_urls(webpage)
        if matches:
            return self.playlist_from_matches(matches, video_id, video_title)

        # Look for embedded Dailymotion playlist player (#3822)
        m = re.search(
            r'<iframe[^>]+?src=(["\'])(?P<url>(?:https?:)?//(?:www\.)?dailymotion\.[a-z]{2,3}/widget/jukebox\?.+?)\1', webpage)
        if m:
            playlists = re.findall(
                r'list\[\]=/playlist/([^/]+)/', unescapeHTML(m.group('url')))
            if playlists:
                return self.playlist_from_matches(
                    playlists, video_id, video_title, lambda p: '//dailymotion.com/playlist/%s' % p)

        # Look for DailyMail embeds
        dailymail_urls = DailyMailIE._extract_urls(webpage)
        if dailymail_urls:
            return self.playlist_from_matches(
                dailymail_urls, video_id, video_title, ie=DailyMailIE.ie_key())

        # Look for embedded Wistia player
        wistia_url = WistiaIE._extract_url(webpage)
        if wistia_url:
            return {
                '_type': 'url_transparent',
                'url': self._proto_relative_url(wistia_url),
                'ie_key': WistiaIE.ie_key(),
                'uploader': video_uploader,
            }

        # Look for SVT player
        svt_url = SVTIE._extract_url(webpage)
        if svt_url:
            return self.url_result(svt_url, 'SVT')

        # Look for Bandcamp pages with custom domain
        mobj = re.search(r'<meta property="og:url"[^>]*?content="(.*?bandcamp\.com.*?)"', webpage)
        if mobj is not None:
            burl = unescapeHTML(mobj.group(1))
            # Don't set the extractor because it can be a track url or an album
            return self.url_result(burl)

        # Look for embedded Vevo player
        mobj = re.search(
            r'<iframe[^>]+?src=(["\'])(?P<url>(?:https?:)?//(?:cache\.)?vevo\.com/.+?)\1', webpage)
        if mobj is not None:
            return self.url_result(mobj.group('url'))

        # Look for embedded Viddler player
        mobj = re.search(
            r'<(?:iframe[^>]+?src|param[^>]+?value)=(["\'])(?P<url>(?:https?:)?//(?:www\.)?viddler\.com/(?:embed|player)/.+?)\1',
            webpage)
        if mobj is not None:
            return self.url_result(mobj.group('url'))

        # Look for NYTimes player
        mobj = re.search(
            r'<iframe[^>]+src=(["\'])(?P<url>(?:https?:)?//graphics8\.nytimes\.com/bcvideo/[^/]+/iframe/embed\.html.+?)\1>',
            webpage)
        if mobj is not None:
            return self.url_result(mobj.group('url'))

        # Look for Libsyn player
        mobj = re.search(
            r'<iframe[^>]+src=(["\'])(?P<url>(?:https?:)?//html5-player\.libsyn\.com/embed/.+?)\1', webpage)
        if mobj is not None:
            return self.url_result(mobj.group('url'))

        # Look for Ooyala videos
        mobj = (re.search(r'player\.ooyala\.com/[^"?]+[?#][^"]*?(?:embedCode|ec)=(?P<ec>[^"&]+)', webpage) or
                re.search(r'OO\.Player\.create\([\'"].*?[\'"],\s*[\'"](?P<ec>.{32})[\'"]', webpage) or
                re.search(r'OO\.Player\.create\.apply\(\s*OO\.Player\s*,\s*op\(\s*\[\s*[\'"][^\'"]*[\'"]\s*,\s*[\'"](?P<ec>.{32})[\'"]', webpage) or
                re.search(r'SBN\.VideoLinkset\.ooyala\([\'"](?P<ec>.{32})[\'"]\)', webpage) or
                re.search(r'data-ooyala-video-id\s*=\s*[\'"](?P<ec>.{32})[\'"]', webpage))
        if mobj is not None:
            embed_token = self._search_regex(
                r'embedToken[\'"]?\s*:\s*[\'"]([^\'"]+)',
                webpage, 'ooyala embed token', default=None)
            return OoyalaIE._build_url_result(smuggle_url(
                mobj.group('ec'), {
                    'domain': url,
                    'embed_token': embed_token,
                }))

        # Look for multiple Ooyala embeds on SBN network websites
        mobj = re.search(r'SBN\.VideoLinkset\.entryGroup\((\[.*?\])', webpage)
        if mobj is not None:
            embeds = self._parse_json(mobj.group(1), video_id, fatal=False)
            if embeds:
                return self.playlist_from_matches(
                    embeds, video_id, video_title,
                    getter=lambda v: OoyalaIE._url_for_embed_code(smuggle_url(v['provider_video_id'], {'domain': url})), ie='Ooyala')

        # Look for Aparat videos
        mobj = re.search(r'<iframe .*?src="(http://www\.aparat\.com/video/[^"]+)"', webpage)
        if mobj is not None:
            return self.url_result(mobj.group(1), 'Aparat')

        # Look for MPORA videos
        mobj = re.search(r'<iframe .*?src="(http://mpora\.(?:com|de)/videos/[^"]+)"', webpage)
        if mobj is not None:
            return self.url_result(mobj.group(1), 'Mpora')

        # Look for embedded NovaMov-based player
        mobj = re.search(
            r'''(?x)<(?:pagespeed_)?iframe[^>]+?src=(["\'])
                    (?P<url>http://(?:(?:embed|www)\.)?
                        (?:novamov\.com|
                           nowvideo\.(?:ch|sx|eu|at|ag|co)|
                           videoweed\.(?:es|com)|
                           movshare\.(?:net|sx|ag)|
                           divxstage\.(?:eu|net|ch|co|at|ag))
                        /embed\.php.+?)\1''', webpage)
        if mobj is not None:
            return self.url_result(mobj.group('url'))

        # Look for embedded Facebook player
        facebook_urls = FacebookIE._extract_urls(webpage)
        if facebook_urls:
            return self.playlist_from_matches(facebook_urls, video_id, video_title)

        # Look for embedded VK player
        mobj = re.search(r'<iframe[^>]+?src=(["\'])(?P<url>https?://vk\.com/video_ext\.php.+?)\1', webpage)
        if mobj is not None:
            return self.url_result(mobj.group('url'), 'VK')

        # Look for embedded Odnoklassniki player
        mobj = re.search(r'<iframe[^>]+?src=(["\'])(?P<url>https?://(?:odnoklassniki|ok)\.ru/videoembed/.+?)\1', webpage)
        if mobj is not None:
            return self.url_result(mobj.group('url'), 'Odnoklassniki')

        # Look for embedded ivi player
        mobj = re.search(r'<embed[^>]+?src=(["\'])(?P<url>https?://(?:www\.)?ivi\.ru/video/player.+?)\1', webpage)
        if mobj is not None:
            return self.url_result(mobj.group('url'), 'Ivi')

        # Look for embedded Huffington Post player
        mobj = re.search(
            r'<iframe[^>]+?src=(["\'])(?P<url>https?://embed\.live\.huffingtonpost\.com/.+?)\1', webpage)
        if mobj is not None:
            return self.url_result(mobj.group('url'), 'HuffPost')

        # Look for embed.ly
        mobj = re.search(r'class=["\']embedly-card["\'][^>]href=["\'](?P<url>[^"\']+)', webpage)
        if mobj is not None:
            return self.url_result(mobj.group('url'))
        mobj = re.search(r'class=["\']embedly-embed["\'][^>]src=["\'][^"\']*url=(?P<url>[^&]+)', webpage)
        if mobj is not None:
            return self.url_result(compat_urllib_parse_unquote(mobj.group('url')))

        # Look for funnyordie embed
        matches = re.findall(r'<iframe[^>]+?src="(https?://(?:www\.)?funnyordie\.com/embed/[^"]+)"', webpage)
        if matches:
            return self.playlist_from_matches(
                matches, video_id, video_title, getter=unescapeHTML, ie='FunnyOrDie')

        # Look for BBC iPlayer embed
        matches = re.findall(r'setPlaylist\("(https?://www\.bbc\.co\.uk/iplayer/[^/]+/[\da-z]{8})"\)', webpage)
        if matches:
            return self.playlist_from_matches(matches, video_id, video_title, ie='BBCCoUk')

        # Look for embedded RUTV player
        rutv_url = RUTVIE._extract_url(webpage)
        if rutv_url:
            return self.url_result(rutv_url, 'RUTV')

        # Look for embedded TVC player
        tvc_url = TVCIE._extract_url(webpage)
        if tvc_url:
            return self.url_result(tvc_url, 'TVC')

        # Look for embedded SportBox player
        sportbox_urls = SportBoxEmbedIE._extract_urls(webpage)
        if sportbox_urls:
            return self.playlist_from_matches(sportbox_urls, video_id, video_title, ie='SportBoxEmbed')

        # Look for embedded XHamster player
        xhamster_urls = XHamsterEmbedIE._extract_urls(webpage)
        if xhamster_urls:
            return self.playlist_from_matches(xhamster_urls, video_id, video_title, ie='XHamsterEmbed')

        # Look for embedded TNAFlixNetwork player
        tnaflix_urls = TNAFlixNetworkEmbedIE._extract_urls(webpage)
        if tnaflix_urls:
            return self.playlist_from_matches(tnaflix_urls, video_id, video_title, ie=TNAFlixNetworkEmbedIE.ie_key())

        # Look for embedded PornHub player
        pornhub_urls = PornHubIE._extract_urls(webpage)
        if pornhub_urls:
            return self.playlist_from_matches(pornhub_urls, video_id, video_title, ie=PornHubIE.ie_key())

        # Look for embedded DrTuber player
        drtuber_urls = DrTuberIE._extract_urls(webpage)
        if drtuber_urls:
            return self.playlist_from_matches(drtuber_urls, video_id, video_title, ie=DrTuberIE.ie_key())

        # Look for embedded RedTube player
        redtube_urls = RedTubeIE._extract_urls(webpage)
        if redtube_urls:
            return self.playlist_from_matches(redtube_urls, video_id, video_title, ie=RedTubeIE.ie_key())

        # Look for embedded Tube8 player
        tube8_urls = Tube8IE._extract_urls(webpage)
        if tube8_urls:
            return self.playlist_from_matches(tube8_urls, video_id, video_title, ie=Tube8IE.ie_key())

        # Look for embedded Tvigle player
        mobj = re.search(
            r'<iframe[^>]+?src=(["\'])(?P<url>(?:https?:)?//cloud\.tvigle\.ru/video/.+?)\1', webpage)
        if mobj is not None:
            return self.url_result(mobj.group('url'), 'Tvigle')

        # Look for embedded TED player
        mobj = re.search(
            r'<iframe[^>]+?src=(["\'])(?P<url>https?://embed(?:-ssl)?\.ted\.com/.+?)\1', webpage)
        if mobj is not None:
            return self.url_result(mobj.group('url'), 'TED')

        # Look for embedded Ustream videos
        ustream_url = UstreamIE._extract_url(webpage)
        if ustream_url:
            return self.url_result(ustream_url, UstreamIE.ie_key())

        # Look for embedded arte.tv player
        mobj = re.search(
            r'<(?:script|iframe) [^>]*?src="(?P<url>http://www\.arte\.tv/(?:playerv2/embed|arte_vp/index)[^"]+)"',
            webpage)
        if mobj is not None:
            return self.url_result(mobj.group('url'), 'ArteTVEmbed')

        # Look for embedded francetv player
        mobj = re.search(
            r'<iframe[^>]+?src=(["\'])(?P<url>(?:https?://)?embed\.francetv\.fr/\?ue=.+?)\1',
            webpage)
        if mobj is not None:
            return self.url_result(mobj.group('url'))

        # Look for embedded smotri.com player
        smotri_url = SmotriIE._extract_url(webpage)
        if smotri_url:
            return self.url_result(smotri_url, 'Smotri')

        # Look for embedded Myvi.ru player
        myvi_url = MyviIE._extract_url(webpage)
        if myvi_url:
            return self.url_result(myvi_url)

        # Look for embedded soundcloud player
        soundcloud_urls = SoundcloudIE._extract_urls(webpage)
        if soundcloud_urls:
            return self.playlist_from_matches(soundcloud_urls, video_id, video_title, getter=unescapeHTML, ie=SoundcloudIE.ie_key())

        # Look for tunein player
        tunein_urls = TuneInBaseIE._extract_urls(webpage)
        if tunein_urls:
            return self.playlist_from_matches(tunein_urls, video_id, video_title)

        # Look for embedded mtvservices player
        mtvservices_url = MTVServicesEmbeddedIE._extract_url(webpage)
        if mtvservices_url:
            return self.url_result(mtvservices_url, ie='MTVServicesEmbedded')

        # Look for embedded yahoo player
        mobj = re.search(
            r'<iframe[^>]+?src=(["\'])(?P<url>https?://(?:screen|movies)\.yahoo\.com/.+?\.html\?format=embed)\1',
            webpage)
        if mobj is not None:
            return self.url_result(mobj.group('url'), 'Yahoo')

        # Look for embedded sbs.com.au player
        mobj = re.search(
            r'''(?x)
            (?:
                <meta\s+property="og:video"\s+content=|
                <iframe[^>]+?src=
            )
            (["\'])(?P<url>https?://(?:www\.)?sbs\.com\.au/ondemand/video/.+?)\1''',
            webpage)
        if mobj is not None:
            return self.url_result(mobj.group('url'), 'SBS')

        # Look for embedded Cinchcast player
        mobj = re.search(
            r'<iframe[^>]+?src=(["\'])(?P<url>https?://player\.cinchcast\.com/.+?)\1',
            webpage)
        if mobj is not None:
            return self.url_result(mobj.group('url'), 'Cinchcast')

        mobj = re.search(
            r'<iframe[^>]+?src=(["\'])(?P<url>https?://m(?:lb)?\.mlb\.com/shared/video/embed/embed\.html\?.+?)\1',
            webpage)
        if not mobj:
            mobj = re.search(
                r'data-video-link=["\'](?P<url>http://m.mlb.com/video/[^"\']+)',
                webpage)
        if mobj is not None:
            return self.url_result(mobj.group('url'), 'MLB')

        mobj = re.search(
            r'<(?:iframe|script)[^>]+?src=(["\'])(?P<url>%s)\1' % CondeNastIE.EMBED_URL,
            webpage)
        if mobj is not None:
            return self.url_result(self._proto_relative_url(mobj.group('url'), scheme='http:'), 'CondeNast')

        mobj = re.search(
            r'<iframe[^>]+src="(?P<url>https?://(?:new\.)?livestream\.com/[^"]+/player[^"]+)"',
            webpage)
        if mobj is not None:
            return self.url_result(mobj.group('url'), 'Livestream')

        # Look for Zapiks embed
        mobj = re.search(
            r'<iframe[^>]+src="(?P<url>https?://(?:www\.)?zapiks\.fr/index\.php\?.+?)"', webpage)
        if mobj is not None:
            return self.url_result(mobj.group('url'), 'Zapiks')

        # Look for Kaltura embeds
        kaltura_url = KalturaIE._extract_url(webpage)
        if kaltura_url:
            return self.url_result(smuggle_url(kaltura_url, {'source_url': url}), KalturaIE.ie_key())

        # Look for EaglePlatform embeds
        eagleplatform_url = EaglePlatformIE._extract_url(webpage)
        if eagleplatform_url:
            return self.url_result(smuggle_url(eagleplatform_url, {'referrer': url}), EaglePlatformIE.ie_key())

        # Look for ClipYou (uses EaglePlatform) embeds
        mobj = re.search(
            r'<iframe[^>]+src="https?://(?P<host>media\.clipyou\.ru)/index/player\?.*\brecord_id=(?P<id>\d+).*"', webpage)
        if mobj is not None:
            return self.url_result('eagleplatform:%(host)s:%(id)s' % mobj.groupdict(), 'EaglePlatform')

        # Look for Pladform embeds
        pladform_url = PladformIE._extract_url(webpage)
        if pladform_url:
            return self.url_result(pladform_url)

        # Look for Videomore embeds
        videomore_url = VideomoreIE._extract_url(webpage)
        if videomore_url:
            return self.url_result(videomore_url)

        # Look for Webcaster embeds
        webcaster_url = WebcasterFeedIE._extract_url(self, webpage)
        if webcaster_url:
            return self.url_result(webcaster_url, ie=WebcasterFeedIE.ie_key())

        # Look for Playwire embeds
        mobj = re.search(
            r'<script[^>]+data-config=(["\'])(?P<url>(?:https?:)?//config\.playwire\.com/.+?)\1', webpage)
        if mobj is not None:
            return self.url_result(mobj.group('url'))

        # Look for 5min embeds
        mobj = re.search(
            r'<meta[^>]+property="og:video"[^>]+content="https?://embed\.5min\.com/(?P<id>[0-9]+)/?', webpage)
        if mobj is not None:
            return self.url_result('5min:%s' % mobj.group('id'), 'FiveMin')

        # Look for Crooks and Liars embeds
        mobj = re.search(
            r'<(?:iframe[^>]+src|param[^>]+value)=(["\'])(?P<url>(?:https?:)?//embed\.crooksandliars\.com/(?:embed|v)/.+?)\1', webpage)
        if mobj is not None:
            return self.url_result(mobj.group('url'))

        # Look for NBC Sports VPlayer embeds
        nbc_sports_url = NBCSportsVPlayerIE._extract_url(webpage)
        if nbc_sports_url:
            return self.url_result(nbc_sports_url, 'NBCSportsVPlayer')

        # Look for NBC News embeds
        nbc_news_embed_url = re.search(
            r'<iframe[^>]+src=(["\'])(?P<url>(?:https?:)?//www\.nbcnews\.com/widget/video-embed/[^"\']+)\1', webpage)
        if nbc_news_embed_url:
            return self.url_result(nbc_news_embed_url.group('url'), 'NBCNews')

        # Look for Google Drive embeds
        google_drive_url = GoogleDriveIE._extract_url(webpage)
        if google_drive_url:
            return self.url_result(google_drive_url, 'GoogleDrive')

        # Look for UDN embeds
        mobj = re.search(
            r'<iframe[^>]+src="(?:https?:)?(?P<url>%s)"' % UDNEmbedIE._PROTOCOL_RELATIVE_VALID_URL, webpage)
        if mobj is not None:
            return self.url_result(
                compat_urlparse.urljoin(url, mobj.group('url')), 'UDNEmbed')

        # Look for Senate ISVP iframe
        senate_isvp_url = SenateISVPIE._search_iframe_url(webpage)
        if senate_isvp_url:
            return self.url_result(senate_isvp_url, 'SenateISVP')

        # Look for OnionStudios embeds
        onionstudios_url = OnionStudiosIE._extract_url(webpage)
        if onionstudios_url:
            return self.url_result(onionstudios_url)

        # Look for ViewLift embeds
        viewlift_url = ViewLiftEmbedIE._extract_url(webpage)
        if viewlift_url:
            return self.url_result(viewlift_url)

        # Look for JWPlatform embeds
        jwplatform_urls = JWPlatformIE._extract_urls(webpage)
        if jwplatform_urls:
            return self.playlist_from_matches(jwplatform_urls, video_id, video_title, ie=JWPlatformIE.ie_key())

        # Look for Digiteka embeds
        digiteka_url = DigitekaIE._extract_url(webpage)
        if digiteka_url:
            return self.url_result(self._proto_relative_url(digiteka_url), DigitekaIE.ie_key())

        # Look for Arkena embeds
        arkena_url = ArkenaIE._extract_url(webpage)
        if arkena_url:
            return self.url_result(arkena_url, ArkenaIE.ie_key())

        # Look for Piksel embeds
        piksel_url = PikselIE._extract_url(webpage)
        if piksel_url:
            return self.url_result(piksel_url, PikselIE.ie_key())

        # Look for Limelight embeds
        limelight_urls = LimelightBaseIE._extract_urls(webpage, url)
        if limelight_urls:
            return self.playlist_result(
                limelight_urls, video_id, video_title, video_description)

        # Look for Anvato embeds
        anvato_urls = AnvatoIE._extract_urls(self, webpage, video_id)
        if anvato_urls:
            return self.playlist_result(
                anvato_urls, video_id, video_title, video_description)

        # Look for AdobeTVVideo embeds
        mobj = re.search(
            r'<iframe[^>]+src=[\'"]((?:https?:)?//video\.tv\.adobe\.com/v/\d+[^"]+)[\'"]',
            webpage)
        if mobj is not None:
            return self.url_result(
                self._proto_relative_url(unescapeHTML(mobj.group(1))),
                'AdobeTVVideo')

        # Look for Vine embeds
        mobj = re.search(
            r'<iframe[^>]+src=[\'"]((?:https?:)?//(?:www\.)?vine\.co/v/[^/]+/embed/(?:simple|postcard))',
            webpage)
        if mobj is not None:
            return self.url_result(
                self._proto_relative_url(unescapeHTML(mobj.group(1))), 'Vine')

        # Look for VODPlatform embeds
        mobj = re.search(
            r'<iframe[^>]+src=(["\'])(?P<url>(?:https?:)?//(?:www\.)?vod-platform\.net/[eE]mbed/.+?)\1',
            webpage)
        if mobj is not None:
            return self.url_result(
                self._proto_relative_url(unescapeHTML(mobj.group('url'))), 'VODPlatform')

        # Look for Mangomolo embeds
        mobj = re.search(
            r'''(?x)<iframe[^>]+src=(["\'])(?P<url>(?:https?:)?//(?:www\.)?admin\.mangomolo\.com/analytics/index\.php/customers/embed/
                (?:
                    video\?.*?\bid=(?P<video_id>\d+)|
                    index\?.*?\bchannelid=(?P<channel_id>(?:[A-Za-z0-9+/=]|%2B|%2F|%3D)+)
                ).+?)\1''', webpage)
        if mobj is not None:
            info = {
                '_type': 'url_transparent',
                'url': self._proto_relative_url(unescapeHTML(mobj.group('url'))),
                'title': video_title,
                'description': video_description,
                'thumbnail': video_thumbnail,
                'uploader': video_uploader,
            }
            video_id = mobj.group('video_id')
            if video_id:
                info.update({
                    'ie_key': 'MangomoloVideo',
                    'id': video_id,
                })
            else:
                info.update({
                    'ie_key': 'MangomoloLive',
                    'id': mobj.group('channel_id'),
                })
            return info

        # Look for Instagram embeds
        instagram_embed_url = InstagramIE._extract_embed_url(webpage)
        if instagram_embed_url is not None:
            return self.url_result(
                self._proto_relative_url(instagram_embed_url), InstagramIE.ie_key())

        # Look for LiveLeak embeds
        liveleak_urls = LiveLeakIE._extract_urls(webpage)
        if liveleak_urls:
            return self.playlist_from_matches(liveleak_urls, video_id, video_title)

        # Look for 3Q SDN embeds
        threeqsdn_url = ThreeQSDNIE._extract_url(webpage)
        if threeqsdn_url:
            return {
                '_type': 'url_transparent',
                'ie_key': ThreeQSDNIE.ie_key(),
                'url': self._proto_relative_url(threeqsdn_url),
                'title': video_title,
                'description': video_description,
                'thumbnail': video_thumbnail,
                'uploader': video_uploader,
            }

        # Look for VBOX7 embeds
        vbox7_url = Vbox7IE._extract_url(webpage)
        if vbox7_url:
            return self.url_result(vbox7_url, Vbox7IE.ie_key())

        # Look for DBTV embeds
        dbtv_urls = DBTVIE._extract_urls(webpage)
        if dbtv_urls:
            return self.playlist_from_matches(dbtv_urls, video_id, video_title, ie=DBTVIE.ie_key())

        # Look for Videa embeds
        videa_urls = VideaIE._extract_urls(webpage)
        if videa_urls:
            return self.playlist_from_matches(videa_urls, video_id, video_title, ie=VideaIE.ie_key())

        # Look for 20 minuten embeds
        twentymin_urls = TwentyMinutenIE._extract_urls(webpage)
        if twentymin_urls:
            return self.playlist_from_matches(
                twentymin_urls, video_id, video_title, ie=TwentyMinutenIE.ie_key())

        # Look for Openload embeds
        openload_urls = OpenloadIE._extract_urls(webpage)
        if openload_urls:
            return self.playlist_from_matches(
                openload_urls, video_id, video_title, ie=OpenloadIE.ie_key())

        # Look for VideoPress embeds
        videopress_urls = VideoPressIE._extract_urls(webpage)
        if videopress_urls:
            return self.playlist_from_matches(
                videopress_urls, video_id, video_title, ie=VideoPressIE.ie_key())

        # Look for Rutube embeds
        rutube_urls = RutubeIE._extract_urls(webpage)
        if rutube_urls:
            return self.playlist_from_matches(
                rutube_urls, video_id, video_title, ie=RutubeIE.ie_key())

        # Look for WashingtonPost embeds
        wapo_urls = WashingtonPostIE._extract_urls(webpage)
        if wapo_urls:
            return self.playlist_from_matches(
                wapo_urls, video_id, video_title, ie=WashingtonPostIE.ie_key())

        # Look for Mediaset embeds
        mediaset_urls = MediasetIE._extract_urls(self, webpage)
        if mediaset_urls:
            return self.playlist_from_matches(
                mediaset_urls, video_id, video_title, ie=MediasetIE.ie_key())

        # Look for JOJ.sk embeds
        joj_urls = JojIE._extract_urls(webpage)
        if joj_urls:
            return self.playlist_from_matches(
                joj_urls, video_id, video_title, ie=JojIE.ie_key())

        # Look for megaphone.fm embeds
        mpfn_urls = MegaphoneIE._extract_urls(webpage)
        if mpfn_urls:
            return self.playlist_from_matches(
                mpfn_urls, video_id, video_title, ie=MegaphoneIE.ie_key())

        # Look for vzaar embeds
        vzaar_urls = VzaarIE._extract_urls(webpage)
        if vzaar_urls:
            return self.playlist_from_matches(
                vzaar_urls, video_id, video_title, ie=VzaarIE.ie_key())

        channel9_urls = Channel9IE._extract_urls(webpage)
        if channel9_urls:
            return self.playlist_from_matches(
                channel9_urls, video_id, video_title, ie=Channel9IE.ie_key())

        vshare_urls = VShareIE._extract_urls(webpage)
        if vshare_urls:
            return self.playlist_from_matches(
                vshare_urls, video_id, video_title, ie=VShareIE.ie_key())

        # Look for Mediasite embeds
        mediasite_urls = MediasiteIE._extract_urls(webpage)
        if mediasite_urls:
            entries = [
                self.url_result(smuggle_url(
                    compat_urlparse.urljoin(url, mediasite_url),
                    {'UrlReferrer': url}), ie=MediasiteIE.ie_key())
                for mediasite_url in mediasite_urls]
            return self.playlist_result(entries, video_id, video_title)

        springboardplatform_urls = SpringboardPlatformIE._extract_urls(webpage)
        if springboardplatform_urls:
            return self.playlist_from_matches(
                springboardplatform_urls, video_id, video_title,
                ie=SpringboardPlatformIE.ie_key())

        yapfiles_urls = YapFilesIE._extract_urls(webpage)
        if yapfiles_urls:
            return self.playlist_from_matches(
                yapfiles_urls, video_id, video_title, ie=YapFilesIE.ie_key())

        vice_urls = ViceIE._extract_urls(webpage)
        if vice_urls:
            return self.playlist_from_matches(
                vice_urls, video_id, video_title, ie=ViceIE.ie_key())

        xfileshare_urls = XFileShareIE._extract_urls(webpage)
        if xfileshare_urls:
            return self.playlist_from_matches(
                xfileshare_urls, video_id, video_title, ie=XFileShareIE.ie_key())

        cloudflarestream_urls = CloudflareStreamIE._extract_urls(webpage)
        if cloudflarestream_urls:
            return self.playlist_from_matches(
                cloudflarestream_urls, video_id, video_title, ie=CloudflareStreamIE.ie_key())

        peertube_urls = PeerTubeIE._extract_urls(webpage, url)
        if peertube_urls:
            return self.playlist_from_matches(
                peertube_urls, video_id, video_title, ie=PeerTubeIE.ie_key())

        indavideo_urls = IndavideoEmbedIE._extract_urls(webpage)
        if indavideo_urls:
            return self.playlist_from_matches(
                indavideo_urls, video_id, video_title, ie=IndavideoEmbedIE.ie_key())

        apa_urls = APAIE._extract_urls(webpage)
        if apa_urls:
            return self.playlist_from_matches(
                apa_urls, video_id, video_title, ie=APAIE.ie_key())

        foxnews_urls = FoxNewsIE._extract_urls(webpage)
        if foxnews_urls:
            return self.playlist_from_matches(
                foxnews_urls, video_id, video_title, ie=FoxNewsIE.ie_key())

        sharevideos_urls = [sharevideos_mobj.group('url') for sharevideos_mobj in re.finditer(
            r'<iframe[^>]+?\bsrc\s*=\s*(["\'])(?P<url>(?:https?:)?//embed\.share-videos\.se/auto/embed/\d+\?.*?\buid=\d+.*?)\1',
            webpage)]
        if sharevideos_urls:
            return self.playlist_from_matches(
                sharevideos_urls, video_id, video_title)

        viqeo_urls = ViqeoIE._extract_urls(webpage)
        if viqeo_urls:
            return self.playlist_from_matches(
                viqeo_urls, video_id, video_title, ie=ViqeoIE.ie_key())

        expressen_urls = ExpressenIE._extract_urls(webpage)
        if expressen_urls:
            return self.playlist_from_matches(
                expressen_urls, video_id, video_title, ie=ExpressenIE.ie_key())

        # Look for HTML5 media
        entries = self._parse_html5_media_entries(url, webpage, video_id, m3u8_id='hls')
        if entries:
            if len(entries) == 1:
                entries[0].update({
                    'id': video_id,
                    'title': video_title,
                })
            else:
                for num, entry in enumerate(entries, start=1):
                    entry.update({
                        'id': '%s-%s' % (video_id, num),
                        'title': '%s (%d)' % (video_title, num),
                    })
            for entry in entries:
                self._sort_formats(entry['formats'])
            return self.playlist_result(entries, video_id, video_title)

        jwplayer_data = self._find_jwplayer_data(
            webpage, video_id, transform_source=js_to_json)
        if jwplayer_data:
            try:
                info = self._parse_jwplayer_data(
                    jwplayer_data, video_id, require_title=False, base_url=url)
                return merge_dicts(info, info_dict)
            except ExtractorError:
                # See https://github.com/rg3/youtube-dl/pull/16735
                pass

        # Video.js embed
        mobj = re.search(
            r'(?s)\bvideojs\s*\(.+?\.src\s*\(\s*((?:\[.+?\]|{.+?}))\s*\)\s*;',
            webpage)
        if mobj is not None:
            sources = self._parse_json(
                mobj.group(1), video_id, transform_source=js_to_json,
                fatal=False) or []
            if not isinstance(sources, list):
                sources = [sources]
            formats = []
            for source in sources:
                src = source.get('src')
                if not src or not isinstance(src, compat_str):
                    continue
                src = compat_urlparse.urljoin(url, src)
                src_type = source.get('type')
                if isinstance(src_type, compat_str):
                    src_type = src_type.lower()
                ext = determine_ext(src).lower()
                if src_type == 'video/youtube':
                    return self.url_result(src, YoutubeIE.ie_key())
                if src_type == 'application/dash+xml' or ext == 'mpd':
                    formats.extend(self._extract_mpd_formats(
                        src, video_id, mpd_id='dash', fatal=False))
                elif src_type == 'application/x-mpegurl' or ext == 'm3u8':
                    formats.extend(self._extract_m3u8_formats(
                        src, video_id, 'mp4', entry_protocol='m3u8_native',
                        m3u8_id='hls', fatal=False))
                else:
                    formats.append({
                        'url': src,
                        'ext': (mimetype2ext(src_type) or
                                ext if ext in KNOWN_EXTENSIONS else 'mp4'),
                    })
            if formats:
                self._sort_formats(formats)
                info_dict['formats'] = formats
                return info_dict

        # Looking for http://schema.org/VideoObject
        json_ld = self._search_json_ld(
            webpage, video_id, default={}, expected_type='VideoObject')
        if json_ld.get('url'):
            return merge_dicts(json_ld, info_dict)

        def check_video(vurl):
            """Tell whether vurl should be kept as a candidate video URL.

            A URL is accepted outright when YoutubeIE or RtmpIE reports it as
            suitable. Otherwise its path component must contain a dot and the
            extension determined from that path must not be one of the
            excluded (flash, image, subtitle, script, xml) extensions.
            """
            if YoutubeIE.suitable(vurl) or RtmpIE.suitable(vurl):
                return True
            url_path = compat_urlparse.urlparse(vurl).path
            if '.' not in url_path:
                # No extension at all in the path: not treated as a video
                return False
            excluded_exts = ('swf', 'png', 'jpg', 'srt', 'sbv', 'sub', 'vtt', 'ttml', 'js', 'xml')
            return determine_ext(url_path) not in excluded_exts

        def filter_video(urls):
            """Return a list of the entries of urls accepted by check_video, in their original order."""
            return [candidate for candidate in urls if check_video(candidate)]

        # Start with something easy: JW Player in SWFObject
        found = filter_video(re.findall(r'flashvars: [\'"](?:.*&)?file=(http[^\'"&]*)', webpage))
        if not found:
            # Look for gorilla-vid style embedding
            found = filter_video(re.findall(r'''(?sx)
                (?:
                    jw_plugins|
                    JWPlayerOptions|
                    jwplayer\s*\(\s*["'][^'"]+["']\s*\)\s*\.setup
                )
                .*?
                ['"]?file['"]?\s*:\s*["\'](.*?)["\']''', webpage))
        if not found:
            # Broaden the search a little bit
            found = filter_video(re.findall(r'[^A-Za-z0-9]?(?:file|source)=(http[^\'"&]*)', webpage))
        if not found:
            # Broaden the findall a little bit: JWPlayer JS loader
            found = filter_video(re.findall(
                r'[^A-Za-z0-9]?(?:file|video_url)["\']?:\s*["\'](http(?![^\'"]+\.[0-9]+[\'"])[^\'"]+)["\']', webpage))
        if not found:
            # Flow player
            found = filter_video(re.findall(r'''(?xs)
                flowplayer\("[^"]+",\s*
                    \{[^}]+?\}\s*,
                    \s*\{[^}]+? ["']?clip["']?\s*:\s*\{\s*
                        ["']?url["']?\s*:\s*["']([^"']+)["']
            ''', webpage))
        if not found:
            # Cinerama player
            found = re.findall(
                r"cinerama\.embedPlayer\(\s*\'[^']+\',\s*'([^']+)'", webpage)
        if not found:
            # Try to find twitter cards info
            # twitter:player:stream should be checked before twitter:player since
            # it is expected to contain a raw stream (see
            # https://dev.twitter.com/cards/types/player#On_twitter.com_via_desktop_browser)
            found = filter_video(re.findall(
                r'<meta (?:property|name)="twitter:player:stream" (?:content|value)="(.+?)"', webpage))
        if not found:
            # We look for Open Graph info:
            # We have to match any number spaces between elements, some sites try to align them (eg.: statigr.am)
            m_video_type = re.findall(r'<meta.*?property="og:video:type".*?content="video/(.*?)"', webpage)
            # We only look in og:video if the MIME type is a video, don't try if it's a Flash player:
            if m_video_type is not None:
                found = filter_video(re.findall(r'<meta.*?property="og:video".*?content="(.*?)"', webpage))
        if not found:
            REDIRECT_REGEX = r'[0-9]{,2};\s*(?:URL|url)=\'?([^\'"]+)'
            found = re.search(
                r'(?i)<meta\s+(?=(?:[a-z-]+="[^"]+"\s+)*http-equiv="refresh")'
                r'(?:[a-z-]+="[^"]+"\s+)*?content="%s' % REDIRECT_REGEX,
                webpage)
            if not found:
                # Look also in Refresh HTTP header
                refresh_header = head_response.headers.get('Refresh')
                if refresh_header:
                    # In python 2 response HTTP headers are bytestrings
                    if sys.version_info < (3, 0) and isinstance(refresh_header, str):
                        refresh_header = refresh_header.decode('iso-8859-1')
                    found = re.search(REDIRECT_REGEX, refresh_header)
            if found:
                new_url = compat_urlparse.urljoin(url, unescapeHTML(found.group(1)))
                if new_url != url:
                    self.report_following_redirect(new_url)
                    return {
                        '_type': 'url',
                        'url': new_url,
                    }
                else:
                    found = None

        if not found:
            # twitter:player is a https URL to iframe player that may or may not
            # be supported by youtube-dl thus this is checked the very last (see
            # https://dev.twitter.com/cards/types/player#On_twitter.com_via_desktop_browser)
            embed_url = self._html_search_meta('twitter:player', webpage, default=None)
            if embed_url and embed_url != url:
                return self.url_result(embed_url)

        if not found:
            raise UnsupportedError(url)

        entries = []
        for video_url in orderedSet(found):
            video_url = unescapeHTML(video_url)
            video_url = video_url.replace('\\/', '/')
            video_url = compat_urlparse.urljoin(url, video_url)
            video_id = compat_urllib_parse_unquote(os.path.basename(video_url))

            # Sometimes, jwplayer extraction will result in a YouTube URL
            if YoutubeIE.suitable(video_url):
                entries.append(self.url_result(video_url, 'Youtube'))
                continue

            # here's a fun little line of code for you:
            video_id = os.path.splitext(video_id)[0]

            entry_info_dict = {
                'id': video_id,
                'uploader': video_uploader,
                'title': video_title,
                'age_limit': age_limit,
            }

            if RtmpIE.suitable(video_url):
                entry_info_dict.update({
                    '_type': 'url_transparent',
                    'ie_key': RtmpIE.ie_key(),
                    'url': video_url,
                })
                entries.append(entry_info_dict)
                continue

            ext = determine_ext(video_url)
            if ext == 'smil':
                entry_info_dict['formats'] = self._extract_smil_formats(video_url, video_id)
            elif ext == 'xspf':
                return self.playlist_result(self._extract_xspf_playlist(video_url, video_id), video_id)
            elif ext == 'm3u8':
                entry_info_dict['formats'] = self._extract_m3u8_formats(video_url, video_id, ext='mp4')
            elif ext == 'mpd':
                entry_info_dict['formats'] = self._extract_mpd_formats(video_url, video_id)
            elif ext == 'f4m':
                entry_info_dict['formats'] = self._extract_f4m_formats(video_url, video_id)
            elif re.search(r'(?i)\.(?:ism|smil)/manifest', video_url) and video_url != url:
                # Just matching .ism/manifest is not enough to be reliably sure
                # whether it's actually an ISM manifest or some other streaming
                # manifest since there are various streaming URL formats
                # possible (see [1]) as well as some other shenanigans like
                # .smil/manifest URLs that actually serve an ISM (see [2]) and
                # so on.
                # Thus the most reasonable way to solve this is to delegate
                # to generic extractor in order to look into the contents of
                # the manifest itself.
                # 1. https://azure.microsoft.com/en-us/documentation/articles/media-services-deliver-content-overview/#streaming-url-formats
                # 2. https://svs.itworkscdn.net/lbcivod/smil:itwfcdn/lbci/170976.smil/Manifest
                entry_info_dict = self.url_result(
                    smuggle_url(video_url, {'to_generic': True}),
                    GenericIE.ie_key())
            else:
                entry_info_dict['url'] = video_url

            if entry_info_dict.get('formats'):
                self._sort_formats(entry_info_dict['formats'])

            entries.append(entry_info_dict)

        if len(entries) == 1:
            return entries[0]
        else:
            for num, e in enumerate(entries, start=1):
                # 'url' results don't have a title
                if e.get('title') is not None:
                    e['title'] = '%s (%d)' % (e['title'], num)
            return {
                '_type': 'playlist',
                'entries': entries,
            }
-												Unify coding cookie

											
										
										
											8 years ago
+								# coding: utf-8
-												GenericIE: Detect videos from Brightcove

Brightcove videos info is usually found in an <object class="BrightcoveExperience"></object> node, this is passed to a new method of BrightcoveIE that builds a url to extract the video.

											
										
										
											12 years ago
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								from __future__ import unicode_literals
-												Move GenericIE into its own file

											
										
										
											12 years ago
+								import os
 								import re
-												[extractor/generic] Fix following redirect in Refresh HTTP header on python 2

											
										
										
											9 years ago
+								import sys
-												Move GenericIE into its own file

											
										
										
											12 years ago
 								from .common import InfoExtractor
-												[youtube] Support jwplayer with YouTube URLs (Closes #2075)

											
										
										
											11 years ago
+								from .youtube import YoutubeIE
-												[util] Move compatibility functions out of util

utils is large enough without these compatibility functions.

Everything that is present in newer versions of Python (i.e. with dev Python it's just an import) goes into compat.py .
Everything else (i.e. youtube-dl-specific helpers) goes into utils.py .

											
										
										
											10 years ago
+								from ..compat import (
-												[compat] compat_etree_fromstring: also decode the text attribute

Deletes parse_xml from utils, because it also does it.

											
										
										
											9 years ago
+								    compat_etree_fromstring,
-												[extractor/generic] Ensure format id is unicode string

											
										
										
											8 years ago
+								    compat_str,
-												[extractor/generic] Use compat_urllib_parse_unquote for unquoting video_id and title from URL

											
										
										
											10 years ago
+								    compat_urllib_parse_unquote,
-												[generic] simply use urljoin

											
										
										
											11 years ago
+								    compat_urlparse,
-												[generic] Fix on python 2.6

`ParseError` is not available, it raises `xml.parsers.expat.ExpatError`.
The webpage needs to be encoded.

											
										
										
											11 years ago
+								    compat_xml_parse_error,
-												[util] Move compatibility functions out of util

utils is large enough without these compatibility functions.

Everything that is present in newer versions of Python (i.e. with dev Python it's just an import) goes into compat.py .
Everything else (i.e. youtube-dl-specific helpers) goes into utils.py .

											
										
										
											10 years ago
+								)
 								from ..utils import (
-												fix up imports

											
										
										
											10 years ago
+								    determine_ext,
-												Move GenericIE into its own file

											
										
										
											12 years ago
+								    ExtractorError,
-												[generic] Add support for camtasia videos (Fixes #3574)

											
										
										
											10 years ago
+								    float_or_none,
-												[aparat] Add support (Fixes #2012)

											
										
										
											11 years ago
+								    HEADRequest,
-												[generic] Add support for BOMs (Fixes #4753)

											
										
										
											10 years ago
+								    is_html,
-												[generic] Try parsing JWPlayer embedded videos (closes #12030)

											
										
										
											8 years ago
+								    js_to_json,
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
+								    KNOWN_EXTENSIONS,
-												[utils] Introduce merge_dicts

											
										
										
											7 years ago
+								    merge_dicts,
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
+								    mimetype2ext,
-												[generic] Simplify playlist support (#2948)

											
										
										
											10 years ago
+								    orderedSet,
-												Switch codebase to use sanitized_Request instead of
compat_urllib_request.Request

[downloader/dash] Use sanitized_Request

[downloader/http] Use sanitized_Request

[atresplayer] Use sanitized_Request

[bambuser] Use sanitized_Request

[bliptv] Use sanitized_Request

[brightcove] Use sanitized_Request

[cbs] Use sanitized_Request

[ceskatelevize] Use sanitized_Request

[collegerama] Use sanitized_Request

[extractor/common] Use sanitized_Request

[crunchyroll] Use sanitized_Request

[dailymotion] Use sanitized_Request

[dcn] Use sanitized_Request

[dramafever] Use sanitized_Request

[dumpert] Use sanitized_Request

[eitb] Use sanitized_Request

[escapist] Use sanitized_Request

[everyonesmixtape] Use sanitized_Request

[extremetube] Use sanitized_Request

[facebook] Use sanitized_Request

[fc2] Use sanitized_Request

[flickr] Use sanitized_Request

[4tube] Use sanitized_Request

[gdcvault] Use sanitized_Request

[extractor/generic] Use sanitized_Request

[hearthisat] Use sanitized_Request

[hotnewhiphop] Use sanitized_Request

[hypem] Use sanitized_Request

[iprima] Use sanitized_Request

[ivi] Use sanitized_Request

[keezmovies] Use sanitized_Request

[letv] Use sanitized_Request

[lynda] Use sanitized_Request

[metacafe] Use sanitized_Request

[minhateca] Use sanitized_Request

[miomio] Use sanitized_Request

[meovideo] Use sanitized_Request

[mofosex] Use sanitized_Request

[moniker] Use sanitized_Request

[mooshare] Use sanitized_Request

[movieclips] Use sanitized_Request

[mtv] Use sanitized_Request

[myvideo] Use sanitized_Request

[neteasemusic] Use sanitized_Request

[nfb] Use sanitized_Request

[niconico] Use sanitized_Request

[noco] Use sanitized_Request

[nosvideo] Use sanitized_Request

[novamov] Use sanitized_Request

[nowness] Use sanitized_Request

[nuvid] Use sanitized_Request

[played] Use sanitized_Request

[pluralsight] Use sanitized_Request

[pornhub] Use sanitized_Request

[pornotube] Use sanitized_Request

[primesharetv] Use sanitized_Request

[promptfile] Use sanitized_Request

[qqmusic] Use sanitized_Request

[rtve] Use sanitized_Request

[safari] Use sanitized_Request

[sandia] Use sanitized_Request

[shared] Use sanitized_Request

[sharesix] Use sanitized_Request

[sina] Use sanitized_Request

[smotri] Use sanitized_Request

[sohu] Use sanitized_Request

[spankwire] Use sanitized_Request

[sportdeutschland] Use sanitized_Request

[streamcloud] Use sanitized_Request

[streamcz] Use sanitized_Request

[tapely] Use sanitized_Request

[tube8] Use sanitized_Request

[tubitv] Use sanitized_Request

[twitch] Use sanitized_Request

[twitter] Use sanitized_Request

[udemy] Use sanitized_Request

[vbox7] Use sanitized_Request

[veoh] Use sanitized_Request

[vessel] Use sanitized_Request

[vevo] Use sanitized_Request

[viddler] Use sanitized_Request

[videomega] Use sanitized_Request

[viewvster] Use sanitized_Request

[viki] Use sanitized_Request

[vk] Use sanitized_Request

[vodlocker] Use sanitized_Request

[voicerepublic] Use sanitized_Request

[wistia] Use sanitized_Request

[xfileshare] Use sanitized_Request

[xtube] Use sanitized_Request

[xvideos] Use sanitized_Request

[yandexmusic] Use sanitized_Request

[youku] Use sanitized_Request

[youporn] Use sanitized_Request

[youtube] Use sanitized_Request

[patreon] Use sanitized_Request

[extractor/common] Remove unused import

[nfb] PEP 8

											
										
										
											9 years ago
+								    sanitized_Request,
-												[generic] Support embedded vimeo videos (#1602)

											
										
										
											11 years ago
+								    smuggle_url,
 								    unescapeHTML,
-												Add support for direct links to a video (#1973)

											
										
										
											11 years ago
+								    unified_strdate,
-												[ministrygrid] Add extractor (Fixes #2900)

											
										
										
											10 years ago
+								    unsmuggle_url,
-												Add documentation about supported sites (Fixes #4503)

											
										
										
											10 years ago
+								    UnsupportedError,
-												[generic] Parse RSS enclosure URLs (Fixes #5091)

											
										
										
											10 years ago
+								    xpath_text,
-												Move GenericIE into its own file

											
										
										
											12 years ago
+								)
-												[extractor/generic] Improve rtmp support (closes #11993)

											
										
										
											8 years ago
+								from .commonprotocols import RtmpIE
-												[brightcove] add support for brightcove in page embed(fixes #6824)

											
										
										
											9 years ago
+								from .brightcove import (
-												[brightcove] Rename extractor to brightcove legacy

Old embedding approaches are now "Legacy Studio"

											
										
										
											9 years ago
+								    BrightcoveLegacyIE,
-												[brightcove:embedinpage] Rename extractor to brightcove new

It's not actually embed_in_page but "New Studio" and allows both iframe and embed_in_page embeds

											
										
										
											9 years ago
+								    BrightcoveNewIE,
-												[brightcove] add support for brightcove in page embed(fixes #6824)

											
										
										
											9 years ago
+								)
-												[nexx:embed] Add extractor for iframe embeds

											
										
										
											8 years ago
+								from .nexx import (
 								    NexxIE,
 								    NexxEmbedIE,
 								)
-												[NBC/ThePlatform/Generic] Add a generic detector for NBCSportsVPlayer and enhance error detection in ThePlatformIE

											
										
										
											10 years ago
+								from .nbc import NBCSportsVPlayerIE
-												[generic] Detect ooyala videos (fixes #2013)

											
										
										
											11 years ago
+								from .ooyala import OoyalaIE
-												[generic] Add support for embedded rutv player

											
										
										
											11 years ago
+								from .rutv import RUTVIE
-												[tvc] Refactor extractor names

											
										
										
											10 years ago
+								from .tvc import TVCIE
-												[generic] Add support for sportbox embeds

											
										
										
											10 years ago
+								from .sportbox import SportBoxEmbedIE
-												[smotri] Modernize and add support for emdebbed videos (Closes #2585)

											
										
										
											11 years ago
+								from .smotri import SmotriIE
-												[myvi:embed] Rename to myvi

											
										
										
											10 years ago
+								from .myvi import MyviIE
-												[condenast] Add support for embedded videos (Closes #3929)

											
										
										
											10 years ago
+								from .condenast import CondeNastIE
-												[udn] Add new extractor

											
										
										
											10 years ago
+								from .udn import UDNEmbedIE
-												[CSpan] Add detection for Senate ISVP. Closes #5302

											
										
										
											10 years ago
+								from .senateisvp import SenateISVPIE
-												[extractor/generic] Add support for svt embeds (Closes #5622)

											
										
										
											10 years ago
+								from .svt import SVTIE
-												[extractor/generic] Add support for pornhub embeds

											
										
										
											10 years ago
+								from .pornhub import PornHubIE
-												[generic] Add support for xhamster embeds

											
										
										
											10 years ago
+								from .xhamster import XHamsterEmbedIE
-												[extractor/generic] Add support for tnaflix network embeds (Closes #7505)

											
										
										
											9 years ago
+								from .tnaflix import TNAFlixNetworkEmbedIE
-												[extractor/generic] Add support for drtuber embds (closes #11098)

											
										
										
											8 years ago
+								from .drtuber import DrTuberIE
-												[extractor/generic] Add support for redtube embds (closes #11099)

											
										
										
											8 years ago
+								from .redtube import RedTubeIE
-												[generic] Add support for tube8 embeds

											
										
										
											7 years ago
+								from .tube8 import Tube8IE
-												[vimeo/generic] Move detection logic from GenericIE to VimeoIE

											
										
										
											10 years ago
+								from .vimeo import VimeoIE
-												[dailymotion] remove dailymotion cloud extractor(closes #6794)

https://web.archive.org/web/20160312110217/https://www.dmcloud.net/

											
										
										
											7 years ago
+								from .dailymotion import DailymotionIE
-												[dailymail] Add support for embeds

											
										
										
											8 years ago
+								from .dailymail import DailyMailIE
-												[extractor/generic] Add support for OnionStudios embeds (Closes #5841)

											
										
										
											10 years ago
+								from .onionstudios import OnionStudiosIE
-												[viewlift] replace SnagFilms extractors

- add support for other sites that use the same logic
- improve format extraction and sorting

											
										
										
											9 years ago
+								from .viewlift import ViewLiftEmbedIE
-												[extractor/generic] Use _extract_url for mtvservices

											
										
										
											9 years ago
+								from .mtv import MTVServicesEmbeddedIE
-												[extractor/generic] Use _extract_url for pladform

											
										
										
											9 years ago
+								from .pladform import PladformIE
-												[extractor/generic] Add support for videomore embeds

											
										
										
											9 years ago
+								from .videomore import VideomoreIE
-												[extractor/generic] Add support for webcaster.pro embeds

											
										
										
											8 years ago
+								from .webcaster import WebcasterFeedIE
-												[googledrive] Modernize

											
										
										
											9 years ago
+								from .googledrive import GoogleDriveIE
-												[makertv] improve extraction

											
										
										
											9 years ago
+								from .jwplatform import JWPlatformIE
-												[ultimedia] Rename to digiteka

											
										
										
											9 years ago
+								from .digiteka import DigitekaIE
-												[extractor/generic] Add support for arkena embeds

											
										
										
											9 years ago
+								from .arkena import ArkenaIE
-												[generic] Extract Instagram embeds (#8817)

											
										
										
											9 years ago
+								from .instagram import InstagramIE
-												[generic] Add support for LiveLeak embeds

											
										
										
											9 years ago
+								from .liveleak import LiveLeakIE
-												[extractor/generic:3qsdn] Add support for embeds

											
										
										
											9 years ago
+								from .threeqsdn import ThreeQSDNIE
-												[extractor/generic] Add support for theplatform embeds (Closes #8636, closes #9476)

											
										
										
											9 years ago
+								from .theplatform import ThePlatformIE
-												[extractor/generic] Add support vessel embeds (Closes #7083)

											
										
										
											9 years ago
+								from .vessel import VesselIE
-												[extractor/generic] Use _extract_url for kaltura embeds (Closes #9922)

											
										
										
											9 years ago
+								from .kaltura import KalturaIE
-												[eagleplatform] Improve embed detection and extract in separate routine (Closes #9926)

											
										
										
											9 years ago
+								from .eagleplatform import EaglePlatformIE
-												[facebook] Improve Facebook embedded detection

Related to #9938.

Another example comes from 9834872bf63b4e03b66c5e3b8f306556e735d8c5.

											
										
										
											9 years ago
+								from .facebook import FacebookIE
-												[extractor/generic] Extract all soundcloud embeds (Closes #10179)

											
										
										
											9 years ago
+								from .soundcloud import SoundcloudIE
-												[tunein] Add support for embeds (closes #11579)

											
										
										
											8 years ago
+								from .tunein import TuneInBaseIE
-												[vbox7:generic] Add support for vbox7 embeds

											
										
										
											8 years ago
+								from .vbox7 import Vbox7IE
-												[DBTV:generic] Add support for embeds

											
										
										
											8 years ago
+								from .dbtv import DBTVIE
-												[piksel] Add new extractor(closes #11246)

											
										
										
											8 years ago
+								from .piksel import PikselIE
-												[videa] Add support for videa embeds

											
										
										
											8 years ago
+								from .videa import VideaIE
-												[extractor/generic] Add support for 20 minuten embeds (closes #11683, closes #11751)

											
										
										
											8 years ago
+								from .twentymin import TwentyMinutenIE
-												[ustream] Add UstreamIE._extract_url()

Ref: #11547

											
										
										
											8 years ago
+								from .ustream import UstreamIE
-												[extractor/generic] Add support for openload embeds (closes #11536, closes #11812)

											
										
										
											8 years ago
+								from .openload import OpenloadIE
-												[videopress] Add extractor

											
										
										
											8 years ago
+								from .videopress import VideoPressIE
-												[generic] Add support for rutube embeds

											
										
										
											8 years ago
+								from .rutube import RutubeIE
-												[limelight] Improve embeds extraction (closes #12761)
* Move extraction code to extractor
* Add extraction for LimelightEmbeddedPlayerFlash embeds
* Extract multiple video

											
										
										
											8 years ago
+								from .limelight import LimelightBaseIE
-												[anvato] Improve extraction (closes #12913)
* Promote to regular shortcut based extractor
* Add mcp to access key mapping table
* Add support for embeds extraction
* Add support for anvato embeds in generic extractor

											
										
										
											8 years ago
+								from .anvato import AnvatoIE
-												[washingtonpost] Add support for embeds (closes #12699)

											
										
										
											8 years ago
+								from .washingtonpost import WashingtonPostIE
-												[extractor/generic] Extract wistia embed code into separate method

											
										
										
											8 years ago
+								from .wistia import WistiaIE
-												[extractor/generic] Add support for mediaset embeds

											
										
										
											8 years ago
+								from .mediaset import MediasetIE
-												[joj] Rewrite and add support for generic embeds (closes #13268)

											
										
										
											8 years ago
+								from .joj import JojIE
-												[megaphone] Add extractor

											
										
										
											8 years ago
+								from .megaphone import MegaphoneIE
-												[generic] Add support for vzaar embeds


											
										
										
											7 years ago
+								from .vzaar import VzaarIE
-												[generic] Add support for channel9 embeds (closes #14469)

											
										
										
											7 years ago
+								from .channel9 import Channel9IE
-												[vshare] Fix extraction (closes #14473)


											
										
										
											7 years ago
+								from .vshare import VShareIE
-												[mediasite] Improve extraction and code style, add support for DASH (closes #11185, closes #14343, refs #5428)

											
										
										
											7 years ago
+								from .mediasite import MediasiteIE
-												[springboardplatform] Add extractor

											
										
										
											7 years ago
+								from .springboardplatform import SpringboardPlatformIE
-												[yapfiles] Add extractor (closes #15726, refs #11085)

											
										
										
											7 years ago
+								from .yapfiles import YapFilesIE
-												[vice] Fix extraction and rework extractors (closes #11101, closes #13019, closes #13622, closes #13778)

											
										
										
											7 years ago
+								from .vice import ViceIE
-												[generic] Add support for xfileshare embeds (closes #15879)

											
										
										
											7 years ago
+								from .xfileshare import XFileShareIE
-												[cloudflarestream] Add support for cloudflare streams (closes #16375)

											
										
										
											7 years ago
+								from .cloudflarestream import CloudflareStreamIE
-												[peertube] Add support for generic embeds

											
										
										
											7 years ago
+								from .peertube import PeerTubeIE
-												[indavideo] Add support for generic embeds (closes #11989)

											
										
										
											7 years ago
+								from .indavideo import IndavideoEmbedIE
-												[apa] Add extractor (closes #15041, closes #15672)

											
										
										
											7 years ago
+								from .apa import APAIE
-												[foxnews] Add support for iframe embeds (closes #15810, closes #16711)

											
										
										
											7 years ago
+								from .foxnews import FoxNewsIE
-												[viqeo] Add extractor (closes #17066)

											
										
										
											7 years ago
+								from .viqeo import ViqeoIE
-												[generic] Add support for expressen embeds

											
										
										
											6 years ago
+								from .expressen import ExpressenIE
-												Move GenericIE into its own file

											
										
										
											12 years ago
-												[generic] Support double slash URLs (Fixes #1309)

											
										
										
											12 years ago
-												Move GenericIE into its own file

											
										
										
											12 years ago
+								class GenericIE(InfoExtractor):
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								    IE_DESC = 'Generic downloader that works on some sites'
-												Move GenericIE into its own file

											
										
										
											12 years ago
+								    _VALID_URL = r'.*'
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								    IE_NAME = 'generic'
-												GenericIE: Detect videos from Brightcove

Brightcove video info is usually found in an <object class="BrightcoveExperience"></object> node; this node is passed to a new method of BrightcoveIE that builds a URL to extract the video.

											
										
										
											12 years ago
+								    _TESTS = [
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											10 years ago
+								        # Direct link to a video
 								        {
 								            'url': 'http://media.w3.org/2010/05/sintel/trailer.mp4',
 								            'md5': '67d406c2bcb6af27fa886f31aa934bbe',
 								            'info_dict': {
 								                'id': 'trailer',
 								                'ext': 'mp4',
 								                'title': 'trailer',
 								                'upload_date': '20100513',
 								            }
 								        },
-												[extractor/generic] Clarify test comment

											
										
										
											10 years ago
+								        # Direct link to media delivered compressed (until Accept-Encoding is *)
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											10 years ago
+								        {
 								            'url': 'http://calimero.tk/muzik/FictionJunction-Parallel_Hearts.flac',
 								            'md5': '128c42e68b13950268b648275386fc74',
 								            'info_dict': {
 								                'id': 'FictionJunction-Parallel_Hearts',
 								                'ext': 'flac',
 								                'title': 'FictionJunction-Parallel_Hearts',
 								                'upload_date': '20140522',
 								            },
 								            'expected_warnings': [
 								                'URL could be a direct video link, returning it as such.'
-												[generic] Update some _TESTS

											
										
										
											8 years ago
+								            ],
 								            'skip': 'URL invalid',
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											10 years ago
+								        },
 								        # Direct download with broken HEAD
 								        {
 								            'url': 'http://ai-radio.org:8000/radio.opus',
 								            'info_dict': {
 								                'id': 'radio',
 								                'ext': 'opus',
 								                'title': 'radio',
 								            },
 								            'params': {
 								                'skip_download': True,  # infinite live stream
 								            },
 								            'expected_warnings': [
-												[generic] Fix test_Generic_2

Now a HEAD request returns 400 Bad Request

											
										
										
											9 years ago
+								                r'501.*Not Implemented',
 								                r'400.*Bad Request',
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											10 years ago
+								            ],
 								        },
 								        # Direct link with incorrect MIME type
 								        {
 								            'url': 'http://ftp.nluug.nl/video/nluug/2014-11-20_nj14/zaal-2/5_Lennart_Poettering_-_Systemd.webm',
 								            'md5': '4ccbebe5f36706d85221f204d7eb5913',
 								            'info_dict': {
 								                'url': 'http://ftp.nluug.nl/video/nluug/2014-11-20_nj14/zaal-2/5_Lennart_Poettering_-_Systemd.webm',
 								                'id': '5_Lennart_Poettering_-_Systemd',
 								                'ext': 'webm',
 								                'title': '5_Lennart_Poettering_-_Systemd',
 								                'upload_date': '20141120',
 								            },
 								            'expected_warnings': [
 								                'URL could be a direct video link, returning it as such.'
 								            ]
 								        },
 								        # RSS feed
 								        {
 								            'url': 'http://phihag.de/2014/youtube-dl/rss2.xml',
 								            'info_dict': {
 								                'id': 'http://phihag.de/2014/youtube-dl/rss2.xml',
 								                'title': 'Zero Punctuation',
 								                'description': 're:.*groundbreaking video review series.*'
 								            },
 								            'playlist_mincount': 11,
 								        },
 								        # RSS feed with enclosure
 								        {
 								            'url': 'http://podcastfeeds.nbcnews.com/audio/podcast/MSNBC-MADDOW-NETCAST-M4V.xml',
 								            'info_dict': {
 								                'id': 'pdv_maddow_netcast_m4v-02-27-2015-201624',
 								                'ext': 'm4v',
 								                'upload_date': '20150228',
 								                'title': 'pdv_maddow_netcast_m4v-02-27-2015-201624',
 								            }
 								        },
-												[generic] Prefer enclosures over links in RSS feeds


											
										
										
											7 years ago
+								        # RSS feed with enclosures and unsupported link URLs
 								        {
 								            'url': 'http://www.hellointernet.fm/podcast?format=rss',
 								            'info_dict': {
 								                'id': 'http://www.hellointernet.fm/podcast?format=rss',
 								                'description': 'CGP Grey and Brady Haran talk about YouTube, life, work, whatever.',
 								                'title': 'Hello Internet',
 								            },
 								            'playlist_mincount': 100,
 								        },
-												[extractor/generic] Add generic SMIL tests

											
										
										
											10 years ago
+								        # SMIL from http://videolectures.net/promogram_igor_mekjavic_eng
 								        {
 								            'url': 'http://videolectures.net/promogram_igor_mekjavic_eng/video/1/smil.xml',
 								            'info_dict': {
 								                'id': 'smil',
 								                'ext': 'mp4',
 								                'title': 'Automatics, robotics and biocybernetics',
 								                'description': 'md5:815fc1deb6b3a2bff99de2d5325be482',
-												[generic] Update test

											
										
										
											9 years ago
+								                'upload_date': '20130627',
-												[extractor/generic] Add generic SMIL tests

											
										
										
											10 years ago
+								                'formats': 'mincount:16',
 								                'subtitles': 'mincount:1',
 								            },
 								            'params': {
 								                'force_generic_extractor': True,
 								                'skip_download': True,
 								            },
 								        },
 								        # SMIL from http://www1.wdr.de/mediathek/video/livestream/index.html
 								        {
 								            'url': 'http://metafilegenerator.de/WDR/WDR_FS/hds/hds.smil',
 								            'info_dict': {
 								                'id': 'hds',
 								                'ext': 'flv',
 								                'title': 'hds',
 								                'formats': 'mincount:1',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
 								        # SMIL from https://www.restudy.dk/video/play/id/1637
 								        {
 								            'url': 'https://www.restudy.dk/awsmedia/SmilDirectory/video_1637.xml',
 								            'info_dict': {
 								                'id': 'video_1637',
 								                'ext': 'flv',
 								                'title': 'video_1637',
 								                'formats': 'mincount:3',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
 								        # SMIL from http://adventure.howstuffworks.com/5266-cool-jobs-iditarod-musher-video.htm
 								        {
 								            'url': 'http://services.media.howstuffworks.com/videos/450221/smil-service.smil',
 								            'info_dict': {
 								                'id': 'smil-service',
 								                'ext': 'flv',
 								                'title': 'smil-service',
 								                'formats': 'mincount:1',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
 								        # SMIL from http://new.livestream.com/CoheedandCambria/WebsterHall/videos/4719370
 								        {
 								            'url': 'http://api.new.livestream.com/accounts/1570303/events/1585861/videos/4719370.smil',
 								            'info_dict': {
 								                'id': '4719370',
 								                'ext': 'mp4',
 								                'title': '571de1fd-47bc-48db-abf9-238872a58d1f',
 								                'formats': 'mincount:3',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[extractor/generic] Add test for xspf playlist

											
										
										
											10 years ago
+								        # XSPF playlist from http://www.telegraaf.nl/tv/nieuws/binnenland/24353229/__Tikibad_ontruimd_wegens_brand__.html
 								        {
 								            'url': 'http://www.telegraaf.nl/xml/playlist/2015/8/7/mZlp2ctYIUEB.xspf',
 								            'info_dict': {
 								                'id': 'mZlp2ctYIUEB',
 								                'ext': 'mp4',
 								                'title': 'Tikibad ontruimd wegens brand',
 								                'description': 'md5:05ca046ff47b931f9b04855015e163a4',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											8 years ago
+								                'thumbnail': r're:^https?://.*\.jpg$',
-												[extractor/generic] Add test for xspf playlist

											
										
										
											10 years ago
+								                'duration': 33,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[extractor/generic] Add direct mpd url test

											
										
										
											9 years ago
+								        # MPD from http://dash-mse-test.appspot.com/media.html
 								        {
 								            'url': 'http://yt-dash-mse-test.commondatastorage.googleapis.com/media/car-20120827-manifest.mpd',
 								            'md5': '4b57baab2e30d6eb3a6a09f0ba57ef53',
 								            'info_dict': {
 								                'id': 'car-20120827-manifest',
 								                'ext': 'mp4',
 								                'title': 'car-20120827-manifest',
 								                'formats': 'mincount:9',
-												[ThePlatform] Fix tests failed since 79ba9140dc8fcf5883b7473596e8f20cba6b479f

											
										
										
											9 years ago
+								                'upload_date': '20130904',
-												[extractor/generic] Add direct mpd url test

											
										
										
											9 years ago
+								            },
 								            'params': {
 								                'format': 'bestvideo',
 								            },
 								        },
-												[extractor/generic] Add another test for generic m3u8

											
										
										
											9 years ago
+								        # m3u8 served with Content-Type: audio/x-mpegURL; charset=utf-8
 								        {
 								            'url': 'http://once.unicornmedia.com/now/master/playlist/bb0b18ba-64f5-4b1b-a29f-0ac252f06b68/77a785f3-5188-4806-b788-0893a61634ed/93677179-2d99-4ef4-9e17-fe70d49abfbf/content.m3u8',
 								            'info_dict': {
 								                'id': 'content',
 								                'ext': 'mp4',
 								                'title': 'content',
 								                'formats': 'mincount:8',
 								            },
 								            'params': {
 								                # m3u8 downloads
 								                'skip_download': True,
-												[generic] Update some _TESTS

											
										
										
											8 years ago
+								            },
 								            'skip': 'video gone',
-												[extractor/generic] Add another test for generic m3u8

											
										
										
											9 years ago
+								        },
-												[extractor/generic] Add a test for m3u playlist served without proper Content-Type

											
										
										
											9 years ago
+								        # m3u8 served with Content-Type: text/plain
 								        {
 								            'url': 'http://www.nacentapps.com/m3u8/index.m3u8',
 								            'info_dict': {
 								                'id': 'index',
 								                'ext': 'mp4',
 								                'title': 'index',
 								                'upload_date': '20140720',
 								                'formats': 'mincount:11',
 								            },
 								            'params': {
 								                # m3u8 downloads
 								                'skip_download': True,
-												[generic] Update some _TESTS

											
										
										
											8 years ago
+								            },
 								            'skip': 'video gone',
-												[extractor/generic] Add a test for m3u playlist served without proper Content-Type

											
										
										
											9 years ago
+								        },
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											10 years ago
+								        # google redirect
 								        {
 								            'url': 'http://www.google.com/url?sa=t&rct=j&q=&esrc=s&source=web&cd=1&cad=rja&ved=0CCUQtwIwAA&url=http%3A%2F%2Fwww.youtube.com%2Fwatch%3Fv%3DcmQHVoWB5FY&ei=F-sNU-LLCaXk4QT52ICQBQ&usg=AFQjCNEw4hL29zgOohLXvpJ-Bdh2bils1Q&bvm=bv.61965928,d.bGE',
 								            'info_dict': {
 								                'id': 'cmQHVoWB5FY',
 								                'ext': 'mp4',
 								                'upload_date': '20130224',
 								                'uploader_id': 'TheVerge',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											8 years ago
+								                'description': r're:^Chris Ziegler takes a look at the\.*',
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											10 years ago
+								                'uploader': 'The Verge',
 								                'title': 'First Firefox OS phones side-by-side',
 								            },
 								            'params': {
 								                'skip_download': False,
 								            }
 								        },
-												[extractor/generic] Fix following redirect in Refresh HTTP header on python 2

											
										
										
											9 years ago
+								        {
 								            # redirect in Refresh HTTP header
 								            'url': 'https://www.facebook.com/l.php?u=https%3A%2F%2Fwww.youtube.com%2Fwatch%3Fv%3DpO8h3EaFRdo&h=TAQHsoToz&enc=AZN16h-b6o4Zq9pZkCCdOLNKMN96BbGMNtcFwHSaazus4JHT_MFYkAA-WARTX2kvsCIdlAIyHZjl6d33ILIJU7Jzwk_K3mcenAXoAzBNoZDI_Q7EXGDJnIhrGkLXo_LJ_pAa2Jzbx17UHMd3jAs--6j2zaeto5w9RTn8T_1kKg3fdC5WPX9Dbb18vzH7YFX0eSJmoa6SP114rvlkw6pkS1-T&s=1',
 								            'info_dict': {
 								                'id': 'pO8h3EaFRdo',
 								                'ext': 'mp4',
 								                'title': 'Tripeo Boiler Room x Dekmantel Festival DJ Set',
 								                'description': 'md5:6294cc1af09c4049e0652b51a2df10d5',
 								                'upload_date': '20150917',
 								                'uploader_id': 'brtvofficial',
 								                'uploader': 'Boiler Room',
 								            },
 								            'params': {
 								                'skip_download': False,
 								            },
 								        },
-												GenericIE: Detect videos from Brightcove

Brightcove video info is usually found in an <object class="BrightcoveExperience"></object> node; this node is passed to a new method of BrightcoveIE that builds a URL to extract the video.

											
										
										
											12 years ago
+								        {
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								            'url': 'http://www.hodiho.fr/2013/02/regis-plante-sa-jeep.html',
-												[generic] Update test

											
										
										
											11 years ago
+								            'md5': '85b90ccc9d73b4acd9138d3af4c27f89',
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								            'info_dict': {
-												[generic] Update test

											
										
										
											11 years ago
+								                'id': '13601338388002',
 								                'ext': 'mp4',
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								                'uploader': 'www.hodiho.fr',
 								                'title': 'R\u00e9gis plante sa Jeep',
-												GenericIE: Detect videos from Brightcove

Brightcove video info is usually found in an <object class="BrightcoveExperience"></object> node; this node is passed to a new method of BrightcoveIE that builds a URL to extract the video.

											
										
										
											12 years ago
+								            }
 								        },
-												[generic] Detect bandcamp pages that use custom domains (closes #1662)

They embed the original url in the 'og:url' property.

											
										
										
											11 years ago
+								        # bandcamp page with custom domain
 								        {
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								            'add_ie': ['Bandcamp'],
 								            'url': 'http://bronyrock.com/track/the-pony-mash',
 								            'info_dict': {
-												[generic] Modernize tests

											
										
										
											11 years ago
+								                'id': '3235767654',
 								                'ext': 'mp3',
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								                'title': 'The Pony Mash',
 								                'uploader': 'M_Pallante',
-												[generic] Detect bandcamp pages that use custom domains (closes #1662)

They embed the original url in the 'og:url' property.

											
										
										
											11 years ago
+								            },
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								            'skip': 'There is a limit of 200 free downloads / month for the test song',
-												[generic] Detect bandcamp pages that use custom domains (closes #1662)

They embed the original url in the 'og:url' property.

											
										
										
											11 years ago
+								        },
-												[brightcove] Add the extraction of the url from generic

											
										
										
											11 years ago
+								        {
-												[brightcove:legacy] Improve embeds detection (closes #11523)

											
										
										
											8 years ago
+								            # embedded brightcove video
 								            # it also tests brightcove videos that need to set the 'Referer'
 								            # in the http requests
-												Rename all references to legacy studio Brightcove extractor

											
										
										
											9 years ago
+								            'add_ie': ['BrightcoveLegacy'],
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								            'url': 'http://www.bfmtv.com/video/bfmbusiness/cours-bourse/cours-bourse-l-analyse-technique-154522/',
 								            'info_dict': {
 								                'id': '2765128793001',
 								                'ext': 'mp4',
 								                'title': 'Le cours de bourse : l’analyse technique',
 								                'description': 'md5:7e9ad046e968cb2d1114004aba466fd9',
 								                'uploader': 'BFM BUSINESS',
-												[brightcove] Add the extraction of the url from generic

											
										
										
											11 years ago
+								            },
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								            'params': {
 								                'skip_download': True,
-												[brightcove] Add the extraction of the url from generic

											
										
										
											11 years ago
+								            },
 								        },
-												[brightcove:legacy] Improve embeds detection (closes #11523)

											
										
										
											8 years ago
+								        {
 								            # embedded with itemprop embedURL and video id spelled as `idVideo`
 								            'add_id': ['BrightcoveLegacy'],
 								            'url': 'http://bfmbusiness.bfmtv.com/mediaplayer/chroniques/olivier-delamarche/',
 								            'info_dict': {
 								                'id': '5255628253001',
 								                'ext': 'mp4',
 								                'title': 'md5:37c519b1128915607601e75a87995fc0',
 								                'description': 'md5:37f7f888b434bb8f8cc8dbd4f7a4cf26',
 								                'uploader': 'BFM BUSINESS',
 								                'uploader_id': '876450612001',
 								                'timestamp': 1482255315,
 								                'upload_date': '20161220',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[brightcove] Move test to generic

											
										
										
											11 years ago
+								        {
 								            # https://github.com/rg3/youtube-dl/issues/2253
 								            'url': 'http://bcove.me/i6nfkrc3',
 								            'md5': '0ba9446db037002366bab3b3eb30c88c',
 								            'info_dict': {
-												[generic] Modernize tests

											
										
										
											11 years ago
+								                'id': '3101154703001',
 								                'ext': 'mp4',
-												[brightcove] Move test to generic

											
										
										
											11 years ago
+								                'title': 'Still no power',
 								                'uploader': 'thestar.com',
 								                'description': 'Mississauga resident David Farmer is still out of power as a result of the ice storm a month ago. To keep the house warm, Farmer cuts wood from his property for a wood burning stove downstairs.',
 								            },
-												Rename all references to legacy studio Brightcove extractor

											
										
										
											9 years ago
+								            'add_ie': ['BrightcoveLegacy'],
-												[generic] Update some _TESTS

											
										
										
											8 years ago
+								            'skip': 'video gone',
-												[brightcove] Move test to generic

											
										
										
											11 years ago
+								        },
-												[brightcove] Encode object_str with utf-8

											
										
										
											11 years ago
+								        {
 								            'url': 'http://www.championat.com/video/football/v/87/87499.html',
 								            'md5': 'fb973ecf6e4a78a67453647444222983',
 								            'info_dict': {
 								                'id': '3414141473001',
 								                'ext': 'mp4',
 								                'title': 'Видео. Удаление Дзагоева (ЦСКА)',
 								                'description': 'Онлайн-трансляция матча ЦСКА - "Волга"',
 								                'uploader': 'Championat',
 								            },
 								        },
-												[generic/brightcove] Add a new test case for kijk.nl (#3541)

											
										
										
											10 years ago
+								        {
-												[brightcove] Extract m3u8 formats (#3541)

											
										
										
											10 years ago
+								            # https://github.com/rg3/youtube-dl/issues/3541
-												Rename all references to legacy studio Brightcove extractor

											
										
										
											9 years ago
+								            'add_ie': ['BrightcoveLegacy'],
-												[generic/brightcove] Add a new test case for kijk.nl (#3541)

											
										
										
											10 years ago
+								            'url': 'http://www.kijk.nl/sbs6/leermijvrouwenkennen/videos/jqMiXKAYan2S/aflevering-1',
 								            'info_dict': {
 								                'id': '3866516442001',
-												[brightcove] Extract m3u8 formats (#3541)

											
										
										
											10 years ago
+								                'ext': 'mp4',
-												[generic/brightcove] Add a new test case for kijk.nl (#3541)

											
										
										
											10 years ago
+								                'title': 'Leer mij vrouwen kennen: Aflevering 1',
 								                'description': 'Leer mij vrouwen kennen: Aflevering 1',
 								                'uploader': 'SBS Broadcasting',
 								            },
-												[brightcove] Extract m3u8 formats (#3541)

											
										
										
											10 years ago
+								            'skip': 'Restricted to Netherlands',
-												[generic/brightcove] Add a new test case for kijk.nl (#3541)

											
										
										
											10 years ago
+								            'params': {
-												[brightcove] Extract m3u8 formats (#3541)

											
										
										
											10 years ago
+								                'skip_download': True,  # m3u8 download
-												[generic/brightcove] Add a new test case for kijk.nl (#3541)

											
										
										
											10 years ago
+								            },
 								        },
-												[brightcove] Support URLs with bcpid instead of playerID

Fixes #12482

											
										
										
											8 years ago
+								        {
 								            # Brightcove video in <iframe>
 								            'url': 'http://www.un.org/chinese/News/story.asp?NewsID=27724',
 								            'md5': '36d74ef5e37c8b4a2ce92880d208b968',
 								            'info_dict': {
 								                'id': '5360463607001',
 								                'ext': 'mp4',
 								                'title': '叙利亚失明儿童在废墟上演唱《心跳》  呼吁获得正常童年生活',
 								                'description': '联合国儿童基金会中东和北非区域大使、作曲家扎德·迪拉尼（Zade Dirani）在3月15日叙利亚冲突爆发7周年纪念日之际发布了为叙利亚谱写的歌曲《心跳》（HEARTBEAT），为受到六年冲突影响的叙利亚儿童发出强烈呐喊，呼吁世界做出共同努力，使叙利亚儿童重新获得享有正常童年生活的权利。',
 								                'uploader': 'United Nations',
 								                'uploader_id': '1362235914001',
 								                'timestamp': 1489593889,
 								                'upload_date': '20170315',
 								            },
 								            'add_ie': ['BrightcoveLegacy'],
 								        },
-												[brightcove] Recognize another player ID

Closes #11688

											
										
										
											8 years ago
+								        {
 								            # Brightcove with alternative playerID key
 								            'url': 'http://www.nature.com/nmeth/journal/v9/n7/fig_tab/nmeth.2062_SV1.html',
 								            'info_dict': {
 								                'id': 'nmeth.2062_SV1',
 								                'title': 'Simultaneous multiview imaging of the Drosophila syncytial blastoderm : Quantitative high-speed imaging of entire developing embryos with simultaneous multiview light-sheet microscopy : Nature Methods : Nature Research',
 								            },
 								            'playlist': [{
 								                'info_dict': {
 								                    'id': '2228375078001',
 								                    'ext': 'mp4',
 								                    'title': 'nmeth.2062-sv1',
 								                    'description': 'nmeth.2062-sv1',
 								                    'timestamp': 1363357591,
 								                    'upload_date': '20130315',
 								                    'uploader': 'Nature Publishing Group',
 								                    'uploader_id': '1964492299001',
 								                },
 								            }],
 								        },
-												[brightcove] Relax video tag embeds extraction

BrightcoveNewIE.extract_urls(): Handle player data when it is all in
attributes of the <video> tag, and also the id is
data-brightcove-video-id not data-video-id.

Add test to generic extractor, note HEAD gives 404, no checksum computed(?).

											
										
										
											8 years ago
+								        {
 								            # Brightcove with UUID in videoPlayer
 								            'url': 'http://www8.hp.com/cn/zh/home.html',
 								            'info_dict': {
 								                'id': '5255815316001',
 								                'ext': 'mp4',
 								                'title': 'Sprocket Video - China',
 								                'description': 'Sprocket Video - China',
 								                'uploader': 'HP-Video Gallery',
 								                'timestamp': 1482263210,
 								                'upload_date': '20161220',
 								                'uploader_id': '1107601872001',
 								            },
 								            'params': {
 								                'skip_download': True,  # m3u8 download
 								            },
 								            'skip': 'video rotates...weekly?',
 								        },
 								        {
 								            # Brightcove:new type [2].
 								            'url': 'http://www.delawaresportszone.com/video-st-thomas-more-earns-first-trip-to-basketball-semis',
 								            'md5': '2b35148fcf48da41c9fb4591650784f3',
 								            'info_dict': {
 								                'id': '5348741021001',
 								                'ext': 'mp4',
 								                'upload_date': '20170306',
 								                'uploader_id': '4191638492001',
 								                'timestamp': 1488769918,
 								                'title': 'VIDEO:  St. Thomas More earns first trip to basketball semis',
 								            },
 								        },
 								        {
 								            # Alternative brightcove <video> attributes
 								            'url': 'http://www.programme-tv.net/videos/extraits/81095-guillaume-canet-evoque-les-rumeurs-d-infidelite-de-marion-cotillard-avec-brad-pitt-dans-vivement-dimanche/',
 								            'info_dict': {
 								                'id': '81095-guillaume-canet-evoque-les-rumeurs-d-infidelite-de-marion-cotillard-avec-brad-pitt-dans-vivement-dimanche',
 								                'title': "Guillaume Canet évoque les rumeurs d'infidélité de Marion Cotillard avec Brad Pitt dans Vivement Dimanche, Extraits : toutes les vidéos avec Télé-Loisirs",
 								            },
 								            'playlist': [{
 								                'md5': '732d22ba3d33f2f3fc253c39f8f36523',
 								                'info_dict': {
 								                    'id': '5311302538001',
 								                    'ext': 'mp4',
 								                    'title': "Guillaume Canet évoque les rumeurs d'infidélité de Marion Cotillard avec Brad Pitt dans Vivement Dimanche",
 								                    'description': "Guillaume Canet évoque les rumeurs d'infidélité de Marion Cotillard avec Brad Pitt dans Vivement Dimanche (France 2, 5 février 2017)",
 								                    'timestamp': 1486321708,
 								                    'upload_date': '20170205',
 								                    'uploader_id': '800000640001',
 								                },
 								                'only_matching': True,
 								            }],
 								        },
-												[extractor/generic] Add test for brightcove UUID-like videoPlayer

											
										
										
											8 years ago
+								        {
 								            # Brightcove with UUID in videoPlayer
 								            'url': 'http://www8.hp.com/cn/zh/home.html',
 								            'info_dict': {
 								                'id': '5255815316001',
 								                'ext': 'mp4',
 								                'title': 'Sprocket Video - China',
 								                'description': 'Sprocket Video - China',
 								                'uploader': 'HP-Video Gallery',
 								                'timestamp': 1482263210,
 								                'upload_date': '20161220',
 								                'uploader_id': '1107601872001',
 								            },
 								            'params': {
 								                'skip_download': True,  # m3u8 download
 								            },
 								        },
-												[generic] Detect ooyala videos (fixes #2013)

											
										
										
											11 years ago
+								        # ooyala video
 								        {
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								            'url': 'http://www.rollingstone.com/music/videos/norwegian-dj-cashmere-cat-goes-spartan-on-with-me-premiere-20131219',
-												[generic] Update some tests

											
										
										
											10 years ago
+								            'md5': '166dd577b433b4d4ebfee10b0824d8ff',
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								            'info_dict': {
 								                'id': 'BwY2RxaTrTkslxOfcan0UCf0YqyvWysJ',
 								                'ext': 'mp4',
-												[generic] Improve testcase

											
										
										
											11 years ago
+								                'title': '2cc213299525360.mov',  # that's what we get
-												[ooyala] fix duration scale

											
										
										
											9 years ago
+								                'duration': 238.231,
-												[generic] Detect ooyala videos (fixes #2013)

											
										
										
											11 years ago
+								            },
-												[generic] Update some tests

											
										
										
											10 years ago
+								            'add_ie': ['Ooyala'],
-												[generic] Detect ooyala videos (fixes #2013)

											
										
										
											11 years ago
+								        },
-												[extractor/generic] Add test for #6485

											
										
										
											10 years ago
+								        {
 								            # ooyala video embedded with http://player.ooyala.com/iframe.js
 								            'url': 'http://www.macrumors.com/2015/07/24/steve-jobs-the-man-in-the-machine-first-trailer/',
 								            'info_dict': {
 								                'id': 'p0MGJndjoG5SOKqO_hZJuZFPB-Tr5VgB',
 								                'ext': 'mp4',
 								                'title': '"Steve Jobs: Man in the Machine" trailer',
 								                'description': 'The first trailer for the Alex Gibney documentary "Steve Jobs: Man in the Machine."',
-												[ooyala] fix duration scale

											
										
										
											9 years ago
+								                'duration': 135.427,
-												[extractor/generic] Add test for #6485

											
										
										
											10 years ago
+								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[generic] Update some _TESTS

											
										
										
											8 years ago
+								            'skip': 'movie expired',
-												[extractor/generic] Add test for #6485

											
										
										
											10 years ago
+								        },
-												[generic] Add support for another ooyala embed pattern (closes #13727)


											
										
										
											8 years ago
+								        # ooyala video embedded with http://player.ooyala.com/static/v4/production/latest/core.min.js
 								        {
 								            'url': 'http://wnep.com/2017/07/22/steampunk-fest-comes-to-honesdale/',
 								            'info_dict': {
 								                'id': 'lwYWYxYzE6V5uJMjNGyKtwwiw9ZJD7t2',
 								                'ext': 'mp4',
 								                'title': 'Steampunk Fest Comes to Honesdale',
 								                'duration': 43.276,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            }
 								        },
-												Add support for embed.ly

											
										
										
											11 years ago
+								        # embed.ly video
 								        {
 								            'url': 'http://www.tested.com/science/weird/460206-tested-grinding-coffee-2000-frames-second/',
 								            'info_dict': {
 								                'id': '9ODmcdjQcHQ',
 								                'ext': 'mp4',
-												[generic] Add all test attributes for embedly (#2447)

In the future, we may want to not only print something, but throw an error for untested properties.

											
										
										
											11 years ago
+								                'title': 'Tested: Grinding Coffee at 2000 Frames Per Second',
 								                'upload_date': '20140225',
 								                'description': 'md5:06a40fbf30b220468f1e0957c0f558ff',
 								                'uploader': 'Tested',
 								                'uploader_id': 'testedcom',
-												Add support for embed.ly

											
										
										
											11 years ago
+								            },
 								            # No need to test YoutubeIE here
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[generic/funnyordie] Add support for funnyordie embeds (Fixes #2546)

											
										
										
											11 years ago
+								        # funnyordie embed
 								        {
 								            'url': 'http://www.theguardian.com/world/2014/mar/11/obama-zach-galifianakis-between-two-ferns',
 								            'info_dict': {
 								                'id': '18e820ec3f',
 								                'ext': 'mp4',
 								                'title': 'Between Two Ferns with Zach Galifianakis: President Barack Obama',
 								                'description': 'Episode 18: President Barack Obama sits down with Zach Galifianakis for his most memorable interview yet.',
-												[generic] Add support for embedded rutv player

											
										
										
											11 years ago
+								            },
-												[generic] Update some _TESTS

											
										
										
											8 years ago
+								            # HEAD requests lead to endless 301, while GET is OK
 								            'expected_warnings': ['301'],
-												[generic/funnyordie] Add support for funnyordie embeds (Fixes #2546)

											
										
										
											11 years ago
+								        },
-												[generic] Add support for embedded rutv player

											
										
										
											11 years ago
+								        # RUTV embed
 								        {
 								            'url': 'http://www.rg.ru/2014/03/15/reg-dfo/anklav-anons.html',
 								            'info_dict': {
 								                'id': '776940',
 								                'ext': 'mp4',
 								                'title': 'Охотское море стало целиком российским',
 								                'description': 'md5:5ed62483b14663e2a95ebbe115eb8f43',
 								            },
 								            'params': {
 								                # m3u8 download
 								                'skip_download': True,
 								            },
-												[ted] Simplify embed code (#2587)

											
										
										
											11 years ago
+								        },
-												[extractor/generic] Add test for tvc embed

											
										
										
											10 years ago
+								        # TVC embed
 								        {
 								            'url': 'http://sch1298sz.mskobr.ru/dou_edu/karamel_ki/filial_galleries/video/iframe_src_http_tvc_ru_video_iframe_id_55304_isplay_false_acc_video_id_channel_brand_id_11_show_episodes_episode_id_32307_frameb/',
 								            'info_dict': {
 								                'id': '55304',
 								                'ext': 'mp4',
 								                'title': 'Дошкольное воспитание',
 								            },
 								        },
-												[generic] Add test for sportbox embeds

											
										
										
											10 years ago
+								        # SportBox embed
 								        {
 								            'url': 'http://www.vestifinance.ru/articles/25753',
 								            'info_dict': {
 								                'id': '25753',
-												[generic] Fix an MTV test and another test that breaks nosetests

											
										
										
											9 years ago
+								                'title': 'Прямые трансляции с Форума-выставки "Госзаказ-2013"',
-												[generic] Add test for sportbox embeds

											
										
										
											10 years ago
+								            },
 								            'playlist': [{
 								                'info_dict': {
 								                    'id': '370908',
 								                    'title': 'Госзаказ. День 3',
 								                    'ext': 'mp4',
 								                }
 								            }, {
 								                'info_dict': {
 								                    'id': '370905',
 								                    'title': 'Госзаказ. День 2',
 								                    'ext': 'mp4',
 								                }
 								            }, {
 								                'info_dict': {
 								                    'id': '370902',
 								                    'title': 'Госзаказ. День 1',
 								                    'ext': 'mp4',
 								                }
 								            }],
 								            'params': {
 								                # m3u8 download
 								                'skip_download': True,
 								            },
 								        },
-												[extractor/generic] Add test for myvi embed

											
										
										
											10 years ago
+								        # Myvi.ru embed
 								        {
 								            'url': 'http://www.kinomyvi.tv/news/detail/Pervij-dublirovannij-trejler--Uzhastikov-_nOw1',
 								            'info_dict': {
 								                'id': 'f4dafcad-ff21-423d-89b5-146cfd89fa1e',
 								                'ext': 'mp4',
 								                'title': 'Ужастики, русский трейлер (2015)',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											8 years ago
+								                'thumbnail': r're:^https?://.*\.jpg$',
-												[extractor/generic] Add test for myvi embed

											
										
										
											10 years ago
+								                'duration': 153,
 								            }
 								        },
-												[extractor/generic] Add test for xhamster embed

											
										
										
											10 years ago
+								        # XHamster embed
 								        {
 								            'url': 'http://www.numisc.com/forum/showthread.php?11696-FM15-which-pumiscer-was-this-%28-vid-%29-%28-alfa-as-fuck-srx-%29&s=711f5db534502e22260dec8c5e2d66d8',
 								            'info_dict': {
 								                'id': 'showthread',
 								                'title': '[NSFL] [FM15] which pumiscer was this ( vid ) ( alfa as fuck srx )',
 								            },
 								            'playlist_mincount': 7,
-												[generic] Update some _TESTS

											
										
										
											8 years ago
+								            # This forum does not allow <iframe> syntaxes anymore
 								            # Now HTML tags are displayed as-is
 								            'skip': 'No videos on this page',
-												[extractor/generic] Add test for xhamster embed

											
										
										
											10 years ago
+								        },
-												[ted] Simplify embed code (#2587)

											
										
										
											11 years ago
+								        # Embedded TED video
 								        {
 								            'url': 'http://en.support.wordpress.com/videos/ted-talks/',
-												[generic] Fix testcases

											
										
										
											10 years ago
+								            'md5': '65fdff94098e4a607385a60c5177c638',
-												[ted] Simplify embed code (#2587)

											
										
										
											11 years ago
+								            'info_dict': {
-												[generic] Fix testcases

											
										
										
											10 years ago
+								                'id': '1969',
-												[ted] Simplify embed code (#2587)

											
										
										
											11 years ago
+								                'ext': 'mp4',
-												[generic] Fix testcases

											
										
										
											10 years ago
+								                'title': 'Hidden miracles of the natural world',
 								                'uploader': 'Louie Schwartzberg',
 								                'description': 'md5:8145d19d320ff3e52f28401f4c4283b9',
-												[ted] Simplify embed code (#2587)

											
										
										
											11 years ago
+								            }
-												[generic/funnyordie] Add support for funnyordie embeds (Fixes #2546)

											
										
										
											11 years ago
+								        },
-												[generic] Add nowvideo test hidden behind percent encoding

											
										
										
											11 years ago
+								        # nowvideo embed hidden behind percent encoding
 								        {
 								            'url': 'http://www.waoanime.tv/the-super-dimension-fortress-macross-episode-1/',
 								            'md5': '2baf4ddd70f697d94b1c18cf796d5107',
 								            'info_dict': {
 								                'id': '06e53103ca9aa',
 								                'ext': 'flv',
 								                'title': 'Macross Episode 001  Watch Macross Episode 001 onl',
 								                'description': 'No description',
 								            },
-												Merge remote-tracking branch 'dstftw/generic-webpage-unescape'

Conflicts:
	youtube_dl/extractor/generic.py

											
										
										
											11 years ago
+								        },
-												[arte] Add support for embedded videos (Fixes #2620)

											
										
										
											11 years ago
+								        # arte embed
 								        {
 								            'url': 'http://www.tv-replay.fr/redirection/20-03-14/x-enius-arte-10753389.html',
 								            'md5': '7653032cbb25bf6c80d80f217055fa43',
 								            'info_dict': {
 								                'id': '048195-004_PLUS7-F',
 								                'ext': 'flv',
 								                'title': 'X:enius',
 								                'description': 'md5:d5fdf32ef6613cdbfd516ae658abf168',
 								                'upload_date': '20140320',
 								            },
 								            'params': {
 								                'skip_download': 'Requires rtmpdump'
-												[generic] Update some _TESTS

											
										
										
											8 years ago
+								            },
 								            'skip': 'video gone',
-												[arte] Add support for embedded videos (Fixes #2620)

											
										
										
											11 years ago
+								        },
-												[extractor/generic] Add support for francetv embeds

											
										
										
											10 years ago
+								        # francetv embed
 								        {
 								            'url': 'http://www.tsprod.com/replay-du-concert-alcaline-de-calogero',
 								            'info_dict': {
 								                'id': 'EV_30231',
 								                'ext': 'mp4',
 								                'title': 'Alcaline, le concert avec Calogero',
 								                'description': 'md5:61f08036dcc8f47e9cfc33aed08ffaff',
 								                'upload_date': '20150226',
 								                'timestamp': 1424989860,
 								                'duration': 5400,
 								            },
 								            'params': {
 								                # m3u8 downloads
 								                'skip_download': True,
 								            },
 								            'expected_warnings': [
 								                'Forbidden'
 								            ]
 								        },
-												[condenast|generic] Add support for condenast embeds (Fixes #2783)

											
										
										
											11 years ago
+								        # Condé Nast embed
 								        {
 								            'url': 'http://www.wired.com/2014/04/honda-asimo/',
 								            'md5': 'ba0dfe966fa007657bd1443ee672db0f',
 								            'info_dict': {
 								                'id': '53501be369702d3275860000',
 								                'ext': 'mp4',
 								                'title': 'Honda’s  New Asimo Robot Is More Human Than Ever',
 								            }
-												[generic] Add support for protocol-independent URLs (Fixes #2810)

											
										
										
											11 years ago
+								        },
 								        # Dailymotion embed
 								        {
 								            'url': 'http://www.spi0n.com/zap-spi0n-com-n216/',
 								            'md5': '441aeeb82eb72c422c7f14ec533999cd',
 								            'info_dict': {
 								                'id': 'k2mm4bCdJ6CQ2i7c8o2',
 								                'ext': 'mp4',
 								                'title': 'Le Zap de Spi0n n°216 - Zapping du Web',
-												[ThePlatform] Fix tests failed since 79ba9140dc8fcf5883b7473596e8f20cba6b479f

											
										
										
											9 years ago
+								                'description': 'md5:faf028e48a461b8b7fad38f1e104b119',
-												[generic] Add support for protocol-independent URLs (Fixes #2810)

											
										
										
											11 years ago
+								                'uploader': 'Spi0n',
-												[ThePlatform] Fix tests failed since 79ba9140dc8fcf5883b7473596e8f20cba6b479f

											
										
										
											9 years ago
+								                'uploader_id': 'xgditw',
 								                'upload_date': '20140425',
 								                'timestamp': 1398441542,
-												[generic] Add support for protocol-independent URLs (Fixes #2810)

											
										
										
											11 years ago
+								            },
 								            'add_ie': ['Dailymotion'],
-												[generic] Add support for <embed YouTube

											
										
										
											11 years ago
+								        },
-												[dailymail] Add support for embeds

											
										
										
											8 years ago
+								        # DailyMail embed
 								        {
 								            'url': 'http://www.bumm.sk/krimi/2017/07/05/biztonsagi-kamera-buktatta-le-az-agg-ferfit-utlegelo-apolot',
 								            'info_dict': {
 								                'id': '1495629',
 								                'ext': 'mp4',
 								                'title': 'Care worker punches elderly dementia patient in head 11 times',
 								                'description': 'md5:3a743dee84e57e48ec68bf67113199a5',
 								            },
 								            'add_ie': ['DailyMail'],
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[generic] Add support for <embed YouTube

											
										
										
											11 years ago
+								        # YouTube embed
 								        {
 								            'url': 'http://www.badzine.de/ansicht/datum/2014/06/09/so-funktioniert-die-neue-englische-badminton-liga.html',
 								            'info_dict': {
 								                'id': 'FXRb4ykk4S0',
 								                'ext': 'mp4',
 								                'title': 'The NBL Auction 2014',
 								                'uploader': 'BADMINTON England',
 								                'uploader_id': 'BADMINTONEvents',
 								                'upload_date': '20140603',
 								                'description': 'md5:9ef128a69f1e262a700ed83edb163a73',
 								            },
 								            'add_ie': ['Youtube'],
 								            'params': {
 								                'skip_download': True,
 								            }
 								        },
-												[generic] Extract mtvservices embedded videos

											
										
										
											11 years ago
+								        # MTVServices embed
 								        {
-												[generic] Update test_Generic_40

The original link now redirects to a YouTube user channel.

											
										
										
											9 years ago
+								            'url': 'http://www.vulture.com/2016/06/new-key-peele-sketches-released.html',
 								            'md5': 'ca1aef97695ef2c1d6973256a57e5252',
-												[generic] Extract mtvservices embedded videos

											
										
										
											11 years ago
+								            'info_dict': {
-												[generic] Update test_Generic_40

The original link now redirects to a YouTube user channel.

											
										
										
											9 years ago
+								                'id': '769f7ec0-0692-4d62-9b45-0d88074bffc1',
-												[generic] Extract mtvservices embedded videos

											
										
										
											11 years ago
+								                'ext': 'mp4',
-												[generic] Update test_Generic_40

The original link now redirects to a YouTube user channel.

											
										
										
											9 years ago
+								                'title': 'Key and Peele|October 10, 2012|2|203|Liam Neesons - Uncensored',
 								                'description': 'Two valets share their love for movie star Liam Neesons.',
-												[generic] Fix an MTV test and another test that breaks nosetests

											
										
										
											9 years ago
+								                'timestamp': 1349922600,
 								                'upload_date': '20121011',
-												[generic] Extract mtvservices embedded videos

											
										
										
											11 years ago
+								            },
 								        },
-												Add a _TEST_

											
										
										
											11 years ago
+								        # YouTube embed via <data-embed-url="">
 								        {
 								            'url': 'https://play.google.com/store/apps/details?id=com.gameloft.android.ANMP.GloftA8HM',
 								            'info_dict': {
-												[generic] Fix testcases

											
										
										
											10 years ago
+								                'id': '4vAffPZIT44',
-												Add a _TEST_

											
										
										
											11 years ago
+								                'ext': 'mp4',
-												[generic] Fix testcases

											
										
										
											10 years ago
+								                'title': 'Asphalt 8: Airborne - Update - Welcome to Dubai!',
-												[generic] Simplify playlist support (#2948)

											
										
										
											10 years ago
+								                'uploader': 'Gameloft',
 								                'uploader_id': 'gameloft',
-												[generic] Fix testcases

											
										
										
											10 years ago
+								                'upload_date': '20140828',
 								                'description': 'md5:c80da9ed3d83ae6d1876c834de03e1c4',
-												[generic] Simplify playlist support (#2948)

											
										
										
											10 years ago
+								            },
 								            'params': {
 								                'skip_download': True,
-												Add a _TEST_

											
										
										
											11 years ago
+								            }
-												[generic] Add support for camtasia videos (Fixes #3574)

											
										
										
											10 years ago
+								        },
-												[generic] Add support for <object> youtube embeds (closes #12637)


											
										
										
											8 years ago
+								        # YouTube <object> embed
 								        {
 								            'url': 'http://www.improbable.com/2017/04/03/untrained-modern-youths-and-ancient-masters-in-selfie-portraits/',
 								            'md5': '516718101ec834f74318df76259fb3cc',
 								            'info_dict': {
 								                'id': 'msN87y-iEx0',
 								                'ext': 'webm',
 								                'title': 'Feynman: Mirrors FUN TO IMAGINE 6',
 								                'upload_date': '20080526',
 								                'description': 'md5:0ffc78ea3f01b2e2c247d5f8d1d3c18d',
 								                'uploader': 'Christopher Sykes',
 								                'uploader_id': 'ChristopherJSykes',
 								            },
 								            'add_ie': ['Youtube'],
 								        },
-												[generic] Add support for camtasia videos (Fixes #3574)

											
										
										
											10 years ago
+								        # Camtasia studio
 								        {
 								            'url': 'http://www.ll.mit.edu/workshops/education/videocourses/antennas/lecture1/video/',
 								            'playlist': [{
 								                'md5': '0c5e352edabf715d762b0ad4e6d9ee67',
 								                'info_dict': {
 								                    'id': 'Fenn-AA_PA_Radar_Course_Lecture_1c_Final',
 								                    'title': 'Fenn-AA_PA_Radar_Course_Lecture_1c_Final - video1',
 								                    'ext': 'flv',
 								                    'duration': 2235.90,
 								                }
 								            }, {
 								                'md5': '10e4bb3aaca9fd630e273ff92d9f3c63',
 								                'info_dict': {
 								                    'id': 'Fenn-AA_PA_Radar_Course_Lecture_1c_Final_PIP',
 								                    'title': 'Fenn-AA_PA_Radar_Course_Lecture_1c_Final - pip',
 								                    'ext': 'flv',
 								                    'duration': 2235.93,
 								                }
 								            }],
 								            'info_dict': {
 								                'title': 'Fenn-AA_PA_Radar_Course_Lecture_1c_Final',
 								            }
-												[generic] Automatic detection of flow player and age_limit (Fixes #3576)

											
										
										
											10 years ago
+								        },
 								        # Flowplayer
 								        {
 								            'url': 'http://www.handjobhub.com/video/busty-blonde-siri-tit-fuck-while-wank-6313.html',
 								            'md5': '9d65602bf31c6e20014319c7d07fba27',
 								            'info_dict': {
 								                'id': '5123ea6d5e5a7',
 								                'ext': 'mp4',
 								                'age_limit': 18,
 								                'uploader': 'www.handjobhub.com',
-												[generic] Fix test title

											
										
										
											10 years ago
+								                'title': 'Busty Blonde Siri Tit Fuck While Wank at HandjobHub.com',
-												[generic] Automatic detection of flow player and age_limit (Fixes #3576)

											
										
										
											10 years ago
+								            }
-												[generic] Fix rss under Python 2.x and move test to extractor

											
										
										
											10 years ago
+								        },
-												Move playlist tests to extractors.

From now on, test_download will run these tests. That means we benefit not only from the networking setup in there, but also from the other tests (for example test_all_urls to find problems with _VALID_URLs).

											
										
										
											10 years ago
+								        # Multiple brightcove videos
 								        # https://github.com/rg3/youtube-dl/issues/2283
 								        {
 								            'url': 'http://www.newyorker.com/online/blogs/newsdesk/2014/01/always-never-nuclear-command-and-control.html',
 								            'info_dict': {
 								                'id': 'always-never',
 								                'title': 'Always / Never - The New Yorker',
 								            },
 								            'playlist_count': 3,
 								            'params': {
 								                'extract_flat': False,
 								                'skip_download': True,
 								            }
-												[mlb] Add support for embedded videos (Closes #3653)

											
										
										
											10 years ago
+								        },
 								        # MLB embed
 								        {
 								            'url': 'http://umpire-empire.com/index.php/topic/58125-laz-decides-no-thats-low/',
 								            'md5': '96f09a37e44da40dd083e12d9a683327',
 								            'info_dict': {
 								                'id': '33322633',
 								                'ext': 'mp4',
 								                'title': 'Ump changes call to ball',
 								                'description': 'md5:71c11215384298a172a6dcb4c2e20685',
 								                'duration': 48,
 								                'timestamp': 1401537900,
 								                'upload_date': '20140531',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											8 years ago
+								                'thumbnail': r're:^https?://.*\.jpg$',
-												[mlb] Add support for embedded videos (Closes #3653)

											
										
										
											10 years ago
+								            },
 								        },
-												[wistia] Use API and make more generic

											
										
										
											10 years ago
+								        # Wistia embed
 								        {
-												[extractor/generic] Remove generic id and title from wistia extraction and update tests

											
										
										
											9 years ago
+								            'url': 'http://study.com/academy/lesson/north-american-exploration-failed-colonies-of-spain-france-england.html#lesson',
 								            'md5': '1953f3a698ab51cfc948ed3992a0b7ff',
-												[wistia] Use API and make more generic

											
										
										
											10 years ago
+								            'info_dict': {
-												[extractor/generic] Remove generic id and title from wistia extraction and update tests

											
										
										
											9 years ago
+								                'id': '6e2wtrbdaf',
-												[wistia] Use API and make more generic

											
										
										
											10 years ago
+								                'ext': 'mov',
-												[extractor/generic] Remove generic id and title from wistia extraction and update tests

											
										
										
											9 years ago
+								                'title': 'paywall_north-american-exploration-failed-colonies-of-spain-france-england',
 								                'description': 'a Paywall Videos video from Remilon',
 								                'duration': 644.072,
 								                'uploader': 'study.com',
 								                'timestamp': 1459678540,
 								                'upload_date': '20160403',
 								                'filesize': 24687186,
-												[wistia] Use API and make more generic

											
										
										
											10 years ago
+								            },
 								        },
-												[thoughtworks] wistia support added

											
										
										
											10 years ago
+								        {
 								            'url': 'http://thoughtworks.wistia.com/medias/uxjb0lwrcz',
 								            'md5': 'baf49c2baa8a7de5f3fc145a8506dcd4',
 								            'info_dict': {
 								                'id': 'uxjb0lwrcz',
 								                'ext': 'mp4',
-												[extractor/generic] Remove generic id and title from wistia extraction and update tests

											
										
										
											9 years ago
+								                'title': 'Conversation about Hexagonal Rails Part 1',
-												[ThePlatform] Fix tests failed since 79ba9140dc8fcf5883b7473596e8f20cba6b479f

											
										
										
											9 years ago
+								                'description': 'a Martin Fowler video from ThoughtWorks',
-												[thoughtworks] wistia support added

											
										
										
											10 years ago
+								                'duration': 1715.0,
-												[thoughtworks] wistia regex modified

											
										
										
											10 years ago
+								                'uploader': 'thoughtworks.wistia.com',
-												[ThePlatform] Fix tests failed since 79ba9140dc8fcf5883b7473596e8f20cba6b479f

											
										
										
											9 years ago
+								                'timestamp': 1401832161,
-												[extractor/generic] Remove generic id and title from wistia extraction and update tests

											
										
										
											9 years ago
+								                'upload_date': '20140603',
-												[generic] Add a test case for direct links with broken HEAD (#4032)

											
										
										
											10 years ago
+								            },
-												[thoughtworks] wistia support added

											
										
										
											10 years ago
+								        },
-												[extractor/generic] Add test for wistia standard embed

											
										
										
											9 years ago
+								        # Wistia standard embed (async)
 								        {
 								            'url': 'https://www.getdrip.com/university/brennan-dunn-drip-workshop/',
 								            'info_dict': {
 								                'id': '807fafadvk',
 								                'ext': 'mp4',
 								                'title': 'Drip Brennan Dunn Workshop',
 								                'description': 'a JV Webinars video from getdrip-1',
 								                'duration': 4986.95,
 								                'timestamp': 1463607249,
-												[extractor/generic] Remove generic id and title from wistia extraction and update tests

											
										
										
											9 years ago
+								                'upload_date': '20160518',
-												[extractor/generic] Add test for wistia standard embed

											
										
										
											9 years ago
+								            },
 								            'params': {
 								                'skip_download': True,
 								            }
 								        },
-												[generic] Allow soundcloud embeds with additional attributes

											
										
										
											10 years ago
+								        # Soundcloud embed
 								        {
 								            'url': 'http://nakedsecurity.sophos.com/2014/10/29/sscc-171-are-you-sure-that-1234-is-a-bad-password-podcast/',
 								            'info_dict': {
 								                'id': '174391317',
 								                'ext': 'mp3',
 								                'description': 'md5:ff867d6b555488ad3c52572bb33d432c',
 								                'uploader': 'Sophos Security',
 								                'title': 'Chet Chat 171 - Oct 29, 2014',
 								                'upload_date': '20141029',
 								            }
-												[generic] Add support for livestream embeds (Fixes #4185)

											
										
										
											10 years ago
+								        },
-												[extractor/generic] Add test for #10179

											
										
										
											9 years ago
+								        # Soundcloud multiple embeds
 								        {
 								            'url': 'http://www.guitarplayer.com/lessons/1014/legato-workout-one-hour-to-more-fluid-performance---tab/52809',
 								            'info_dict': {
 								                'id': '52809',
 								                'title': 'Guitar Essentials: Legato Workout—One-Hour to Fluid Performance  | TAB + AUDIO',
 								            },
 								            'playlist_mincount': 7,
 								        },
-												[tunein] Add support for embeds (closes #11579)

											
										
										
											8 years ago
+								        # TuneIn station embed
 								        {
 								            'url': 'http://radiocnrv.com/promouvoir-radio-cnrv/',
 								            'info_dict': {
 								                'id': '204146',
 								                'ext': 'mp3',
 								                'title': 'CNRV',
 								                'location': 'Paris, France',
 								                'is_live': True,
 								            },
 								            'params': {
 								                # Live stream
 								                'skip_download': True,
 								            },
 								        },
-												[generic] Add support for livestream embeds (Fixes #4185)

											
										
										
											10 years ago
+								        # Livestream embed
 								        {
 								            'url': 'http://www.esa.int/Our_Activities/Space_Science/Rosetta/Philae_comet_touch-down_webcast',
 								            'info_dict': {
 								                'id': '67864563',
 								                'ext': 'flv',
 								                'upload_date': '20141112',
 								                'title': 'Rosetta #CometLanding webcast HL 10',
 								            }
 								        },
-												[generic] Improve Livestream detection (closes #2234)

											
										
										
											9 years ago
+								        # Another Livestream embed, without 'new.' in URL
 								        {
 								            'url': 'https://www.freespeech.org/',
 								            'info_dict': {
 								                'id': '123537347',
 								                'ext': 'mp4',
 								                'title': 're:^FSTV [0-9]{4}-[0-9]{2}-[0-9]{2} [0-9]{2}:[0-9]{2}$',
 								            },
 								            'params': {
 								                # Live stream
 								                'skip_download': True,
 								            },
 								        },
-												[generic] Add support for LazyYT embeds (Fixes #4306)

											
										
										
											10 years ago
+								        # LazyYT
 								        {
-												[generic] Replace LazyYT test with skiplagged

discourse.ubuntu.com has gone away, replace with skiplagged.com.
Be nice to have a non-frontpage URL that might be more stable,
though I don't have one. Maybe this should move to html
in test/test_InfoExtractor.py?

											
										
										
											8 years ago
+								            'url': 'https://skiplagged.com/',
-												[generic] Add support for LazyYT embeds (Fixes #4306)

											
										
										
											10 years ago
+								            'info_dict': {
-												[generic] Replace LazyYT test with skiplagged

discourse.ubuntu.com has gone away, replace with skiplagged.com.
Be nice to have a non-frontpage URL that might be more stable,
though I don't have one. Maybe this should move to html
in test/test_InfoExtractor.py?

											
										
										
											8 years ago
+								                'id': 'skiplagged',
 								                'title': 'Skiplagged: The smart way to find cheap flights',
-												[generic] Add support for LazyYT embeds (Fixes #4306)

											
										
										
											10 years ago
+								            },
-												[generic] Replace LazyYT test with skiplagged

discourse.ubuntu.com has gone away, replace with skiplagged.com.
Be nice to have a non-frontpage URL that might be more stable,
though I don't have one. Maybe this should move to html
in test/test_InfoExtractor.py?

											
										
										
											8 years ago
+								            'playlist_mincount': 1,
 								            'add_ie': ['Youtube'],
-												[generic] Detect direct video links (Fixes #4149, #4313)

											
										
										
											10 years ago
+								        },
-												[cinchcast] Add new extractor (Fixes #4428)

											
										
										
											10 years ago
+								        # Cinchcast embed
 								        {
 								            'url': 'http://undergroundwellness.com/podcasts/306-5-steps-to-permanent-gut-healing/',
 								            'info_dict': {
 								                'id': '7141703',
 								                'ext': 'mp3',
 								                'upload_date': '20141126',
 								                'title': 'Jack Tips: 5 Steps to Permanent Gut Healing',
 								            }
 								        },
-												[generic] Add support for Cinerama player (Fixes #4752)

											
										
										
											10 years ago
+								        # Cinerama player
 								        {
 								            'url': 'http://www.abc.net.au/7.30/content/2015/s4164797.htm',
 								            'info_dict': {
 								                'id': '730m_DandD_1901_512k',
 								                'ext': 'mp4',
 								                'uploader': 'www.abc.net.au',
 								                'title': 'Game of Thrones with dice - Dungeons and Dragons fantasy role-playing game gets new life - 19/01/2015',
 								            }
-												fixed viddler support - needed a Referer header; also added a viddler
generic extractor

											
										
										
											10 years ago
+								        },
 								        # embedded viddler video
 								        {
 								            'url': 'http://deadspin.com/i-cant-stop-watching-john-wall-chop-the-nuggets-with-th-1681801597',
 								            'info_dict': {
 								                'id': '4d03aad9',
 								                'ext': 'mp4',
 								                'uploader': 'deadspin',
 								                'title': 'WALL-TO-GORTAT',
 								                'timestamp': 1422285291,
 								                'upload_date': '20150126',
 								            },
 								            'add_ie': ['Viddler'],
-												[generic] Add support for jwPlayer YouTube videos

This makes nationalarchives.gov.uk work (Fixes #4907, fixes #4876)

											
										
										
											10 years ago
+								        },
-												[extractor/generic] Add test for Libsyn embed

											
										
										
											10 years ago
+								        # Libsyn embed
 								        {
 								            'url': 'http://thedailyshow.cc.com/podcast/episodetwelve',
 								            'info_dict': {
 								                'id': '3377616',
 								                'ext': 'mp3',
 								                'title': "The Daily Show Podcast without Jon Stewart - Episode 12: Bassem Youssef: Egypt's Jon Stewart",
 								                'description': 'md5:601cb790edd05908957dae8aaa866465',
 								                'upload_date': '20150220',
 								            },
-												[generic] Skip an invalid test

											
										
										
											9 years ago
+								            'skip': 'All The Daily Show URLs now redirect to http://www.cc.com/shows/',
-												[extractor/generic] Add test for Libsyn embed

											
										
										
											10 years ago
+								        },
-												[generic] Add support for jwPlayer YouTube videos

This makes nationalarchives.gov.uk work (Fixes #4907, fixes #4876)

											
										
										
											10 years ago
+								        # jwplayer YouTube
 								        {
 								            'url': 'http://media.nationalarchives.gov.uk/index.php/webinar-using-discovery-national-archives-online-catalogue/',
 								            'info_dict': {
 								                'id': 'Mrj4DVp2zeA',
 								                'ext': 'mp4',
-												[generic] Correct test case

Video has been reuploaded / edited

											
										
										
											10 years ago
+								                'upload_date': '20150212',
-												[generic] Add support for jwPlayer YouTube videos

This makes nationalarchives.gov.uk work (Fixes #4907, fixes #4876)

											
										
										
											10 years ago
+								                'uploader': 'The National Archives UK',
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								                'description': 'md5:8078af856dca76edc42910b61273dbbf',
-												[generic] Add support for jwPlayer YouTube videos

This makes nationalarchives.gov.uk work (Fixes #4907, fixes #4876)

											
										
										
											10 years ago
+								                'uploader_id': 'NationalArchives08',
 								                'title': 'Webinar: Using Discovery, The National Archives’ online catalogue',
 								            },
-												[rtlnl|generic] Add support for rtl.nl embeds (Fixes #4959)

											
										
										
											10 years ago
+								        },
-												[extractor/generic] Add test for #11993 and more metadata for rtmp

											
										
										
											8 years ago
+								        # jwplayer rtmp
 								        {
-												[Generic] Update test 69 (suffolk/sjc)

suffolk.edu/sjc => suffolk.edu/sjc/live.php

Unfortunately it only transmits video a few mornings per month, so
leaving the 'skip' is probably appropriate. Updating the 'skip' to
include the calendar information though.

											
										
										
											7 years ago
+								            'url': 'http://www.suffolk.edu/sjc/live.php',
-												[extractor/generic] Add test for #11993 and more metadata for rtmp

											
										
										
											8 years ago
+								            'info_dict': {
-												[Generic] Update test 69 (suffolk/sjc)

suffolk.edu/sjc => suffolk.edu/sjc/live.php

Unfortunately it only transmits video a few mornings per month, so
leaving the 'skip' is probably appropriate. Updating the 'skip' to
include the calendar information though.

											
										
										
											7 years ago
+								                'id': 'live',
-												[extractor/generic] Add test for #11993 and more metadata for rtmp

											
										
										
											8 years ago
+								                'ext': 'flv',
 								                'title': 'Massachusetts Supreme Judicial Court Oral Arguments',
 								                'uploader': 'www.suffolk.edu',
 								            },
 								            'params': {
 								                'skip_download': True,
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								            },
-												[Generic] Update test 69 (suffolk/sjc)

suffolk.edu/sjc => suffolk.edu/sjc/live.php

Unfortunately it only transmits video a few mornings per month, so
leaving the 'skip' is probably appropriate. Updating the 'skip' to
include the calendar information though.

											
										
										
											7 years ago
+								            'skip': 'Only has video a few mornings per month, see http://www.suffolk.edu/sjc/',
-												[extractor/generic] Add test for #11993 and more metadata for rtmp

											
										
										
											8 years ago
+								        },
-												[generic] Try parsing JWPlayer embedded videos (closes #12030)

											
										
										
											8 years ago
+								        # Complex jwplayer
 								        {
 								            'url': 'http://www.indiedb.com/games/king-machine/videos',
 								            'info_dict': {
 								                'id': 'videos',
 								                'ext': 'mp4',
 								                'title': 'king machine trailer 1',
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								                'description': 'Browse King Machine videos & audio for sweet media. Your eyes will thank you.',
-												[generic] Try parsing JWPlayer embedded videos (closes #12030)

											
										
										
											8 years ago
+								                'thumbnail': r're:^https?://.*\.jpg$',
 								            },
 								        },
-												Add test for JWPlayer where config is passed as variable

											
										
										
											8 years ago
+								        {
 								            # JWPlayer config passed as variable
 								            'url': 'http://www.txxx.com/videos/3326530/ariele/',
 								            'info_dict': {
 								                'id': '3326530_hq',
 								                'ext': 'mp4',
 								                'title': 'ARIELE | Tube Cup',
 								                'uploader': 'www.txxx.com',
 								                'age_limit': 18,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            }
 								        },
-												[JWPlatform] Support iframes

Support content.jwplatform... src attributes inside <iframe> tags in
addition to <script> tags. Just a regexp change.

Add a test (currently Generic_72).

											
										
										
											7 years ago
+								        {
 								            # JWPlatform iframe
 								            'url': 'https://www.mediaite.com/tv/dem-senator-claims-gary-cohn-faked-a-bad-connection-during-trump-call-to-get-him-off-the-phone/',
 								            'md5': 'ca00a040364b5b439230e7ebfd02c4e9',
 								            'info_dict': {
 								                'id': 'O0c5JcKT',
 								                'ext': 'mp4',
 								                'upload_date': '20171122',
 								                'timestamp': 1511366290,
 								                'title': 'Dem Senator Claims Gary Cohn Faked a Bad Connection During Trump Call to Get Him Off the Phone',
 								            },
-												[Generic] ie_key in JWPlatform test 72

											
										
										
											7 years ago
+								            'add_ie': [JWPlatformIE.ie_key()],
-												[JWPlatform] Support iframes

Support content.jwplatform... src attributes inside <iframe> tags in
addition to <script> tags. Just a regexp change.

Add a test (currently Generic_72).

											
										
										
											7 years ago
+								        },
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
+								        {
-												[generic] Add support for single format Video.js embeds (closes #14371)

											
										
										
											7 years ago
+								            # Video.js embed, multiple formats
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
+								            'url': 'http://ortcam.com/solidworks-урок-6-настройка-чертежа_33f9b7351.html',
 								            'info_dict': {
 								                'id': 'yygqldloqIk',
 								                'ext': 'mp4',
 								                'title': 'SolidWorks. Урок 6 Настройка чертежа',
 								                'description': 'md5:baf95267792646afdbf030e4d06b2ab3',
 								                'upload_date': '20130314',
 								                'uploader': 'PROстое3D',
 								                'uploader_id': 'PROstoe3D',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[generic] Add support for single format Video.js embeds (closes #14371)

											
										
										
											7 years ago
+								        {
 								            # Video.js embed, single format
 								            'url': 'https://www.vooplayer.com/v3/watch/watch.php?v=NzgwNTg=',
 								            'info_dict': {
 								                'id': 'watch',
 								                'ext': 'mp4',
 								                'title': 'Step 1 -  Good Foundation',
 								                'description': 'md5:d1e7ff33a29fc3eb1673d6c270d344f4',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[rtlnl|generic] Add support for rtl.nl embeds (Fixes #4959)

											
										
										
											10 years ago
+								        # rtl.nl embed
 								        {
 								            'url': 'http://www.rtlnieuws.nl/nieuws/buitenland/aanslagen-kopenhagen',
 								            'playlist_mincount': 5,
 								            'info_dict': {
 								                'id': 'aanslagen-kopenhagen',
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								                'title': 'Aanslagen Kopenhagen',
-												[rtlnl|generic] Add support for rtl.nl embeds (Fixes #4959)

											
										
										
											10 years ago
+								            }
-												[generic] Add support for Zapiks embeds (#5014)

											
										
										
											10 years ago
+								        },
 								        # Zapiks embed
 								        {
 								            'url': 'http://www.skipass.com/news/116090-bon-appetit-s5ep3-baqueira-mi-cor.html',
 								            'info_dict': {
 								                'id': '118046',
 								                'ext': 'mp4',
 								                'title': 'EP3S5 - Bon Appétit - Baqueira Mi Corazon !',
 								            }
 								        },
-												[extractor/generic] Improve kaltura embeds support (Closes #6137)

											
										
										
											10 years ago
+								        # Kaltura embed (different embed code)
 								        {
 								            'url': 'http://www.premierchristianradio.com/Shows/Saturday/Unbelievable/Conference-Videos/Os-Guinness-Is-It-Fools-Talk-Unbelievable-Conference-2014',
 								            'info_dict': {
 								                'id': '1_a52wc67y',
 								                'ext': 'flv',
 								                'upload_date': '20150127',
 								                'uploader_id': 'PremierMedia',
 								                'timestamp': int,
 								                'title': 'Os Guinness // Is It Fools Talk? // Unbelievable? Conference 2014',
 								            },
 								        },
-												[generic] Improve Kaltura detection

Closes #4004

											
										
										
											9 years ago
+								        # Kaltura embed with single quotes
 								        {
 								            'url': 'http://fod.infobase.com/p_ViewPlaylist.aspx?AssignmentID=NUN8ZY',
 								            'info_dict': {
 								                'id': '0_izeg5utt',
 								                'ext': 'mp4',
 								                'title': '35871',
 								                'timestamp': 1355743100,
 								                'upload_date': '20121217',
-												[kaltura] Improve embeds detection (closes #16201)

											
										
										
											7 years ago
+								                'uploader_id': 'cplapp@learn360.com',
-												[generic] Improve Kaltura detection

Closes #4004

											
										
										
											9 years ago
+								            },
 								            'add_ie': ['Kaltura'],
 								        },
-												[extractor/generic] Improve kaltura embed detection (Closes #9911)

											
										
										
											9 years ago
+								        {
 								            # Kaltura embedded via quoted entry_id
 								            'url': 'https://www.oreilly.com/ideas/my-cloud-makes-pretty-pictures',
 								            'info_dict': {
 								                'id': '0_utuok90b',
 								                'ext': 'mp4',
 								                'title': '06_matthew_brender_raj_dutt',
 								                'timestamp': 1466638791,
 								                'upload_date': '20160622',
 								            },
 								            'add_ie': ['Kaltura'],
 								            'expected_warnings': [
 								                'Could not send HEAD request'
 								            ],
 								            'params': {
 								                'skip_download': True,
 								            }
 								        },
-												[kaltura] Improve widget ID extraction (closes #11480)

											
										
										
											8 years ago
+								        {
 								            # Kaltura embedded, some fileExt broken (#11480)
 								            'url': 'http://www.cornell.edu/video/nima-arkani-hamed-standard-models-of-particle-physics',
 								            'info_dict': {
 								                'id': '1_sgtvehim',
 								                'ext': 'mp4',
 								                'title': 'Our "Standard Models" of particle physics and cosmology',
 								                'description': 'md5:67ea74807b8c4fea92a6f38d6d323861',
 								                'timestamp': 1321158993,
 								                'upload_date': '20111113',
 								                'uploader_id': 'kps1',
 								            },
 								            'add_ie': ['Kaltura'],
 								        },
-												[kaltura] Add support for iframe embeds


											
										
										
											8 years ago
+								        {
 								            # Kaltura iframe embed
 								            'url': 'http://www.gsd.harvard.edu/event/i-m-pei-a-centennial-celebration/',
 								            'md5': 'ae5ace8eb09dc1a35d03b579a9c2cc44',
 								            'info_dict': {
 								                'id': '0_f2cfbpwy',
 								                'ext': 'mp4',
 								                'title': 'I. M. Pei: A Centennial Celebration',
 								                'description': 'md5:1db8f40c69edc46ca180ba30c567f37c',
 								                'upload_date': '20170403',
 								                'uploader_id': 'batchUser',
 								                'timestamp': 1491232186,
 								            },
 								            'add_ie': ['Kaltura'],
 								        },
-												[kaltura] Improve iframe embeds detection (closes #16337)

											
										
										
											7 years ago
+								        {
 								            # Kaltura iframe embed, more sophisticated
 								            'url': 'http://www.cns.nyu.edu/~eero/math-tools/Videos/lecture-05sep2017.html',
 								            'info_dict': {
 								                'id': '1_9gzouybz',
 								                'ext': 'mp4',
 								                'title': 'lecture-05sep2017',
 								                'description': 'md5:40f347d91fd4ba047e511c5321064b49',
 								                'upload_date': '20170913',
 								                'uploader_id': 'eps2',
 								                'timestamp': 1505340777,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								            'add_ie': ['Kaltura'],
 								        },
-												[kaltura] Improve embeds detection (closes #16201)

											
										
										
											7 years ago
+								        {
 								            # meta twitter:player
 								            'url': 'http://thechive.com/2017/12/08/all-i-want-for-christmas-is-more-twerk/',
 								            'info_dict': {
 								                'id': '0_01b42zps',
 								                'ext': 'mp4',
 								                'title': 'Main Twerk (Video)',
 								                'upload_date': '20171208',
 								                'uploader_id': 'sebastian.salinas@thechive.com',
 								                'timestamp': 1512713057,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								            'add_ie': ['Kaltura'],
 								        },
-												[generic] Add tests for #13557

											
										
										
											8 years ago
+								        # referrer protected EaglePlatform embed
 								        {
 								            'url': 'https://tvrain.ru/lite/teleshow/kak_vse_nachinalos/namin-418921/',
 								            'info_dict': {
 								                'id': '582306',
 								                'ext': 'mp4',
 								                'title': 'Стас Намин: «Мы нарушили девственность Кремля»',
 								                'thumbnail': r're:^https?://.*\.jpg$',
 								                'duration': 3382,
 								                'view_count': int,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[eagleplatform] Add support for embeds

											
										
										
											10 years ago
+								        },
-												[eagleplatform] Add support for referrer protected videos (closes #13557)

											
										
										
											8 years ago
+								        # ClipYou (EaglePlatform) embed (custom URL)
-												[eagleplatform] Add support for ClipYou embeds

											
										
										
											10 years ago
+								        {
 								            'url': 'http://muz-tv.ru/play/7129/',
-												[eagleplatform] Checking direct HTTP links

Sometimes they fail with 404

											
										
										
											9 years ago
+								            # Not checking MD5 as sometimes the direct HTTP link results in 404 and HLS is used
-												[eagleplatform] Add support for ClipYou embeds

											
										
										
											10 years ago
+								            'info_dict': {
 								                'id': '12820',
 								                'ext': 'mp4',
 								                'title': "'O Sole Mio",
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											8 years ago
+								                'thumbnail': r're:^https?://.*\.jpg$',
-												[eagleplatform] Add support for ClipYou embeds

											
										
										
											10 years ago
+								                'duration': 216,
 								                'view_count': int,
 								            },
-												[generic] Add tests for #13557

											
										
										
											8 years ago
+								            'params': {
 								                'skip_download': True,
 								            },
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								            'skip': 'This video is unavailable.',
-												[eagleplatform] Add support for ClipYou embeds

											
										
										
											10 years ago
+								        },
-												[pladform] Add support for embeds

											
										
										
											10 years ago
+								        # Pladform embed
 								        {
 								            'url': 'http://muz-tv.ru/kinozal/view/7400/',
 								            'info_dict': {
 								                'id': '100183293',
 								                'ext': 'mp4',
-												[generic] Update pladform embed test

											
										
										
											10 years ago
+								                'title': 'Тайны перевала Дятлова • 1 серия 2 часть',
-												[pladform] Add support for embeds

											
										
										
											10 years ago
+								                'description': 'Документальный сериал-расследование одной из самых жутких тайн ХХ века',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											8 years ago
+								                'thumbnail': r're:^https?://.*\.jpg$',
-												[pladform] Add support for embeds

											
										
										
											10 years ago
+								                'duration': 694,
 								                'age_limit': 0,
 								            },
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								            'skip': 'HTTP Error 404: Not Found',
-												[pladform] Add support for embeds

											
										
										
											10 years ago
+								        },
-												[generic] Add test for playwire embed (#5430)

											
										
										
											10 years ago
+								        # Playwire embed
 								        {
 								            'url': 'http://www.cinemablend.com/new/First-Joe-Dirt-2-Trailer-Teaser-Stupid-Greatness-70874.html',
 								            'info_dict': {
 								                'id': '3519514',
 								                'ext': 'mp4',
 								                'title': 'Joe Dirt 2 Beautiful Loser Teaser Trailer',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											8 years ago
+								                'thumbnail': r're:^https?://.*\.png$',
-												[generic] Add test for playwire embed (#5430)

											
										
										
											10 years ago
+								                'duration': 45.115,
 								            },
 								        },
-												[generic] Add support for 5min embeds (#5310)

											
										
										
											10 years ago
+								        # 5min embed
 								        {
 								            'url': 'http://techcrunch.com/video/facebook-creates-on-this-day-crunch-report/518726732/',
 								            'md5': '4c6f127a30736b59b3e2c19234ee2bf7',
 								            'info_dict': {
 								                'id': '518726732',
 								                'ext': 'mp4',
 								                'title': 'Facebook Creates "On This Day" | Crunch Report',
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								                'description': 'Amazon updates Fire TV line, Tesla\'s Model X spotted in the wild',
 								                'timestamp': 1427237531,
 								                'uploader': 'Crunch Report',
 								                'upload_date': '20150324',
 								            },
 								            'params': {
 								                # m3u8 download
 								                'skip_download': True,
-												[generic] Add support for 5min embeds (#5310)

											
										
										
											10 years ago
+								            },
 								        },
-												[generic] Add tests for Crooks and Liars embeds

											
										
										
											10 years ago
+								        # Crooks and Liars embed
 								        {
 								            'url': 'http://crooksandliars.com/2015/04/fox-friends-says-protecting-atheists',
 								            'info_dict': {
 								                'id': '8RUoRhRi',
 								                'ext': 'mp4',
 								                'title': "Fox & Friends Says Protecting Atheists From Discrimination Is Anti-Christian!",
 								                'description': 'md5:e1a46ad1650e3a5ec7196d432799127f',
 								                'timestamp': 1428207000,
 								                'upload_date': '20150405',
 								                'uploader': 'Heather',
 								            },
 								        },
 								        # Crooks and Liars external embed
 								        {
 								            'url': 'http://theothermccain.com/2010/02/02/video-proves-that-bill-kristol-has-been-watching-glenn-beck/comment-page-1/',
 								            'info_dict': {
 								                'id': 'MTE3MjUtMzQ2MzA',
 								                'ext': 'mp4',
 								                'title': 'md5:5e3662a81a4014d24c250d76d41a08d5',
 								                'description': 'md5:9b8e9542d6c3c5de42d6451b7d780cec',
 								                'timestamp': 1265032391,
 								                'upload_date': '20100201',
 								                'uploader': 'Heather',
 								            },
 								        },
-												[generic] Add working NBC Sports vplayer test

											
										
										
											10 years ago
+								        # NBC Sports vplayer embed
-												[NBC/ThePlatform/Generic] Add a generic detector for NBCSportsVPlayer and enhance error detection in ThePlatformIE

											
										
										
											10 years ago
+								        {
-												[generic] Add working NBC Sports vplayer test

											
										
										
											10 years ago
+								            'url': 'http://www.riderfans.com/forum/showthread.php?121827-Freeman&s=e98fa1ea6dc08e886b1678d35212494a',
-												[NBC/ThePlatform/Generic] Add a generic detector for NBCSportsVPlayer and enhance error detection in ThePlatformIE

											
										
										
											10 years ago
+								            'info_dict': {
-												[generic] Add working NBC Sports vplayer test

											
										
										
											10 years ago
+								                'id': 'ln7x1qSThw4k',
 								                'ext': 'flv',
 								                'title': "PFT Live: New leader in the 'new-look' defense",
 								                'description': 'md5:65a19b4bbfb3b0c0c5768bed1dfad74e',
-												[ThePlatform] Fix tests failed since 79ba9140dc8fcf5883b7473596e8f20cba6b479f

											
										
										
											9 years ago
+								                'uploader': 'NBCU-SPORTS',
 								                'upload_date': '20140107',
 								                'timestamp': 1389118457,
-												[NBC/ThePlatform/Generic] Add a generic detector for NBCSportsVPlayer and enhance error detection in ThePlatformIE

											
										
										
											10 years ago
+								            },
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								            'skip': 'Invalid Page URL',
-												[udn] Add new extractor

											
										
										
											10 years ago
+								        },
-												[generic] Detect NBC News embeds

											
										
										
											9 years ago
+								        # NBC News embed
 								        {
 								            'url': 'http://www.vulture.com/2016/06/letterman-couldnt-care-less-about-late-night.html',
 								            'md5': '1aa589c675898ae6d37a17913cf68d66',
 								            'info_dict': {
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								                'id': 'x_dtl_oa_LettermanliftPR_160608',
-												[generic] Detect NBC News embeds

											
										
										
											9 years ago
+								                'ext': 'mp4',
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								                'title': 'David Letterman: A Preview',
-												[generic] Detect NBC News embeds

											
										
										
											9 years ago
+								                'description': 'A preview of Tom Brokaw\'s interview with David Letterman as part of the On Assignment series powered by Dateline. Airs Sunday June 12 at 7/6c.',
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								                'upload_date': '20160609',
 								                'timestamp': 1465431544,
 								                'uploader': 'NBCU-NEWS',
-												[generic] Detect NBC News embeds

											
										
										
											9 years ago
+								            },
 								        },
-												[udn] Add new extractor

											
										
										
											10 years ago
+								        # UDN embed
 								        {
-												[generic] Update the UDNEmbed test case

											
										
										
											9 years ago
+								            'url': 'https://video.udn.com/news/300346',
-												[generic] Fix test generic_51

The website replaced the original video with a new one

											
										
										
											10 years ago
+								            'md5': 'fd2060e988c326991037b9aff9df21a6',
-												[udn] Add new extractor

											
										
										
											10 years ago
+								            'info_dict': {
-												[generic] Fix test generic_51

The website replaced the original video with a new one

											
										
										
											10 years ago
+								                'id': '300346',
-												[udn] Add new extractor

											
										
										
											10 years ago
+								                'ext': 'mp4',
-												[generic] Fix test generic_51

The website replaced the original video with a new one

											
										
										
											10 years ago
+								                'title': '中一中男師變性 全校師生力挺',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											8 years ago
+								                'thumbnail': r're:^https?://.*\.jpg$',
-												[generic] Update the UDNEmbed test case

											
										
										
											9 years ago
+								            },
 								            'params': {
 								                # m3u8 download
 								                'skip_download': True,
 								            },
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								            'expected_warnings': ['Failed to parse JSON Expecting value'],
-												[generic] Support another type of Ooyala embedded video

											
										
										
											10 years ago
+								        },
-												[brightcove] Allow single quotes in Brightcove URLs (fixes #5901)

											
										
										
											10 years ago
+								        # Brightcove URL in single quotes
 								        {
 								            'url': 'http://www.sportsnet.ca/baseball/mlb/sn-presents-russell-martin-world-citizen/',
 								            'md5': '4ae374f1f8b91c889c4b9203c8c752af',
 								            'info_dict': {
 								                'id': '4255764656001',
 								                'ext': 'mp4',
 								                'title': 'SN Presents: Russell Martin, World Citizen',
 								                'description': 'To understand why he was the Toronto Blue Jays’ top off-season priority is to appreciate his background and upbringing in Montreal, where he first developed his baseball skills. Written and narrated by Stephen Brunt.',
 								                'uploader': 'Rogers Sportsnet',
-												[ThePlatform] Fix tests failed since 79ba9140dc8fcf5883b7473596e8f20cba6b479f

											
										
										
											9 years ago
+								                'uploader_id': '1704050871',
 								                'upload_date': '20150525',
 								                'timestamp': 1432570283,
-												[brightcove] Allow single quotes in Brightcove URLs (fixes #5901)

											
										
										
											10 years ago
+								            },
-												[dailymotion/generic] Add DailymotionCloudIE

											
										
										
											10 years ago
+								        },
-												[extractor/generic] Add test for OnionStudios embeds

											
										
										
											10 years ago
+								        # OnionStudios embed
 								        {
 								            'url': 'http://www.clickhole.com/video/dont-understand-bitcoin-man-will-mumble-explanatio-2537',
 								            'info_dict': {
 								                'id': '2855',
 								                'ext': 'mp4',
 								                'title': 'Don’t Understand Bitcoin? This Man Will Mumble An Explanation At You',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											8 years ago
+								                'thumbnail': r're:^https?://.*\.jpe?g$',
-												[extractor/generic] Add test for OnionStudios embeds

											
										
										
											10 years ago
+								                'uploader': 'ClickHole',
 								                'uploader_id': 'clickhole',
 								            }
 								        },
-												[extractor/generic] Add test for snagfilms embeds

											
										
										
											10 years ago
+								        # SnagFilms embed
 								        {
 								            'url': 'http://whilewewatch.blogspot.ru/2012/06/whilewewatch-whilewewatch-gripping.html',
 								            'info_dict': {
 								                'id': '74849a00-85a9-11e1-9660-123139220831',
 								                'ext': 'mp4',
 								                'title': '#whilewewatch',
 								            }
 								        },
-												[generic/adobetv] Support AdobeTVVideo embeds (#6039)

											
										
										
											10 years ago
+								        # AdobeTVVideo embed
 								        {
 								            'url': 'https://helpx.adobe.com/acrobat/how-to/new-experience-acrobat-dc.html?set=acrobat--get-started--essential-beginners',
 								            'md5': '43662b577c018ad707a63766462b1e87',
 								            'info_dict': {
 								                'id': '2456',
 								                'ext': 'mp4',
 								                'title': 'New experience with Acrobat DC',
 								                'description': 'New experience with Acrobat DC',
 								                'duration': 248.667,
 								            },
-												[generic] Add test for screenwavemedia embed

											
										
										
											9 years ago
+								        },
-												[brightcove] add support for brightcove in page embed(fixes #6824)

											
										
										
											9 years ago
+								        # BrightcoveInPageEmbed embed
 								        {
 								            'url': 'http://www.geekandsundry.com/tabletop-bonus-wils-final-thoughts-on-dread/',
 								            'info_dict': {
 								                'id': '4238694884001',
 								                'ext': 'flv',
 								                'title': 'Tabletop: Dread, Last Thoughts',
 								                'description': 'Tabletop: Dread, Last Thoughts',
 								                'duration': 51690,
 								            },
-												[generic] Extract M3U8 formats (closes #7582)

											
										
										
											9 years ago
+								        },
-												[generic] Add a test case for brightcove embed

Closes #8862

											
										
										
											9 years ago
+								        # Brightcove embed, with no valid 'renditions' but valid 'IOSRenditions'
 								        # This video can't be played in browsers if Flash is disabled and the UA is set to iPhone, which is actually a false alarm
 								        {
 								            'url': 'https://dl.dropboxusercontent.com/u/29092637/interview.html',
 								            'info_dict': {
 								                'id': '4785848093001',
 								                'ext': 'mp4',
 								                'title': 'The Cardinal Pell Interview',
 								                'description': 'Sky News Contributor Andrew Bolt interviews George Pell in Rome, following the Cardinal\'s evidence before the Royal Commission into Child Abuse. ',
 								                'uploader': 'GlobeCast Australia - GlobeStream',
-												[ThePlatform] Fix tests failed since 79ba9140dc8fcf5883b7473596e8f20cba6b479f

											
										
										
											9 years ago
+								                'uploader_id': '2733773828001',
 								                'upload_date': '20160304',
 								                'timestamp': 1457083087,
-												[generic] Add a test case for brightcove embed

Closes #8862

											
										
										
											9 years ago
+								            },
 								            'params': {
 								                # m3u8 downloads
 								                'skip_download': True,
 								            },
 								        },
-												[brightcove] Allow whitespace around attribute names in embedded code

											
										
										
											8 years ago
+								        {
 								            # Brightcove embed with whitespace around attribute names
 								            'url': 'http://www.stack.com/video/3167554373001/learn-to-hit-open-three-pointers-with-damian-lillard-s-baseline-drift-drill',
 								            'info_dict': {
 								                'id': '3167554373001',
 								                'ext': 'mp4',
 								                'title': "Learn to Hit Open Three-Pointers With Damian Lillard's Baseline Drift Drill",
 								                'description': 'md5:57bacb0e0f29349de4972bfda3191713',
 								                'uploader_id': '1079349493',
 								                'upload_date': '20140207',
 								                'timestamp': 1391810548,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[arte.tv:embed] Extended support (#2620)

											
										
										
											9 years ago
+								        # Another form of arte.tv embed
 								        {
 								            'url': 'http://www.tv-replay.fr/redirection/09-04-16/arte-reportage-arte-11508975.html',
 								            'md5': '850bfe45417ddf221288c88a0cffe2e2',
 								            'info_dict': {
 								                'id': '030273-562_PLUS7-F',
 								                'ext': 'mp4',
 								                'title': 'ARTE Reportage - Nulle part, en France',
 								                'description': 'md5:e3a0e8868ed7303ed509b9e3af2b870d',
 								                'upload_date': '20160409',
 								            },
 								        },
-												[generic] Add support for LiveLeak embeds

											
										
										
											9 years ago
+								        # LiveLeak embed
 								        {
 								            'url': 'http://www.wykop.pl/link/3088787/',
-												[liveleak] Support another liveleak embedding pattern (closes #13336)

											
										
										
											7 years ago
+								            'md5': '7619da8c820e835bef21a1efa2a0fc71',
-												[generic] Add support for LiveLeak embeds

											
										
										
											9 years ago
+								            'info_dict': {
 								                'id': '874_1459135191',
 								                'ext': 'mp4',
 								                'title': 'Man shows poor quality of new apartment building',
 								                'description': 'The wall is like a sand pile.',
 								                'uploader': 'Lake8737',
-												[liveleak] Support another liveleak embedding pattern (closes #13336)

											
										
										
											7 years ago
+								            },
 								            'add_ie': [LiveLeakIE.ie_key()],
 								        },
 								        # Another LiveLeak embed pattern (#13336)
 								        {
 								            'url': 'https://milo.yiannopoulos.net/2017/06/concealed-carry-robbery/',
 								            'info_dict': {
 								                'id': '2eb_1496309988',
 								                'ext': 'mp4',
 								                'title': 'Thief robs place where everyone was armed',
 								                'description': 'md5:694d73ee79e535953cf2488562288eee',
 								                'uploader': 'brazilwtf',
 								            },
 								            'add_ie': [LiveLeakIE.ie_key()],
-												[generic] Add support for LiveLeak embeds

											
										
										
											9 years ago
+								        },
-												[genric] Eliminate duplicated video URLs (closes #6562)

											
										
										
											9 years ago
+								        # Duplicated embedded video URLs
 								        {
 								            'url': 'http://www.hudl.com/athlete/2538180/highlights/149298443',
 								            'info_dict': {
 								                'id': '149298443_480_16c25b74_2',
 								                'ext': 'mp4',
 								                'title': 'vs. Blue Orange Spring Game',
 								                'uploader': 'www.hudl.com',
 								            },
 								        },
-												[extractor/generic] Change twitter:player embeds priority to lowest (Closes #10090)

											
										
										
											9 years ago
+								        # twitter:player:stream embed
 								        {
 								            'url': 'http://www.rtl.be/info/video/589263.aspx?CategoryID=288',
 								            'info_dict': {
 								                'id': 'master',
 								                'ext': 'mp4',
 								                'title': 'Une nouvelle espèce de dinosaure découverte en Argentine',
 								                'uploader': 'www.rtl.be',
 								            },
 								            'params': {
 								                # m3u8 downloads
 								                'skip_download': True,
 								            },
 								        },
-												[generic] add generic support for twitter:player embeds

											
										
										
											9 years ago
+								        # twitter:player embed
 								        {
 								            'url': 'http://www.theatlantic.com/video/index/484130/what-do-black-holes-sound-like/',
 								            'md5': 'a3e0df96369831de324f0778e126653c',
 								            'info_dict': {
 								                'id': '4909620399001',
 								                'ext': 'mp4',
 								                'title': 'What Do Black Holes Sound Like?',
 								                'description': 'what do black holes sound like',
 								                'upload_date': '20160524',
 								                'uploader_id': '29913724001',
 								                'timestamp': 1464107587,
 								                'uploader': 'TheAtlantic',
 								            },
 								            'add_ie': ['BrightcoveLegacy'],
-												[facebook] Improve Facebook embedded detection

Related to #9938.

Another example comes from 9834872bf63b4e03b66c5e3b8f306556e735d8c5.

											
										
										
											9 years ago
+								        },
 								        # Facebook <iframe> embed
 								        {
 								            'url': 'https://www.hostblogger.de/blog/archives/6181-Auto-jagt-Betonmischer.html',
-												[generic] Add MD5 checksums

											
										
										
											9 years ago
+								            'md5': 'fbcde74f534176ecb015849146dd3aee',
-												[facebook] Improve Facebook embedded detection

Related to #9938.

Another example comes from 9834872bf63b4e03b66c5e3b8f306556e735d8c5.

											
										
										
											9 years ago
+								            'info_dict': {
 								                'id': '599637780109885',
 								                'ext': 'mp4',
 								                'title': 'Facebook video #599637780109885',
 								            },
 								        },
-												[facebook] Add test for plugin video embed (#13493)

											
										
										
											8 years ago
+								        # Facebook <iframe> embed, plugin video
 								        {
 								            'url': 'http://5pillarsuk.com/2017/06/07/tariq-ramadan-disagrees-with-pr-exercise-by-imams-refusing-funeral-prayers-for-london-attackers/',
 								            'info_dict': {
 								                'id': '1754168231264132',
 								                'ext': 'mp4',
 								                'title': 'About the Imams and Religious leaders refusing to perform funeral prayers for...',
 								                'uploader': 'Tariq Ramadan (official)',
 								                'timestamp': 1496758379,
 								                'upload_date': '20170606',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[facebook] Improve Facebook embedded detection

Related to #9938.

Another example comes from 9834872bf63b4e03b66c5e3b8f306556e735d8c5.

											
										
										
											9 years ago
+								        # Facebook API embed
 								        {
 								            'url': 'http://www.lothype.com/blue-stars-2016-preview-standstill-full-show/',
-												[generic] Add MD5 checksums

											
										
										
											9 years ago
+								            'md5': 'a47372ee61b39a7b90287094d447d94e',
-												[facebook] Improve Facebook embedded detection

Related to #9938.

Another example comes from 9834872bf63b4e03b66c5e3b8f306556e735d8c5.

											
										
										
											9 years ago
+								            'info_dict': {
 								                'id': '10153467542406923',
 								                'ext': 'mp4',
 								                'title': 'Facebook video #10153467542406923',
 								            },
-												[generic] Support Wordpress "YouTube Video Importer" plugin

Closes #9938

											
										
										
											9 years ago
+								        },
 								        # Wordpress "YouTube Video Importer" plugin
 								        {
 								            'url': 'http://www.lothype.com/blue-devils-drumline-stanford-lot-2016/',
-												[generic] Add MD5 checksums

											
										
										
											9 years ago
+								            'md5': 'd16797741b560b485194eddda8121b48',
-												[generic] Support Wordpress "YouTube Video Importer" plugin

Closes #9938

											
										
										
											9 years ago
+								            'info_dict': {
 								                'id': 'HNTXWDXV9Is',
 								                'ext': 'mp4',
 								                'title': 'Blue Devils Drumline Stanford lot 2016',
 								                'upload_date': '20160627',
 								                'uploader_id': 'GENOCIDE8GENERAL10',
 								                'uploader': 'cylus cyrus',
 								            },
 								        },
-												[kaltura] add support videos stored on custom kaltura servers(closes #5557)

											
										
										
											9 years ago
+								        {
 								            # video stored on custom kaltura server
 								            'url': 'http://www.expansion.com/multimedia/videos.html?media=EQcM30NHIPv',
 								            'md5': '537617d06e64dfed891fa1593c4b30cc',
 								            'info_dict': {
 								                'id': '0_1iotm5bh',
 								                'ext': 'mp4',
 								                'title': 'Elecciones británicas: 5 lecciones para Rajoy',
 								                'description': 'md5:435a89d68b9760b92ce67ed227055f16',
 								                'uploader_id': 'videos.expansion@el-mundo.net',
 								                'upload_date': '20150429',
 								                'timestamp': 1430303472,
 								            },
 								            'add_ie': ['Kaltura'],
 								        },
-												[generic] Add the test. Closes #1638

											
										
										
											9 years ago
+								        {
 								            # Non-standard Vimeo embed
 								            'url': 'https://openclassrooms.com/courses/understanding-the-web',
 								            'md5': '64d86f1c7d369afd9a78b38cbb88d80a',
 								            'info_dict': {
 								                'id': '148867247',
 								                'ext': 'mp4',
 								                'title': 'Understanding the web - Teaser',
 								                'description': 'This is "Understanding the web - Teaser" by openclassrooms on Vimeo, the home for high quality videos and the people who love them.',
 								                'upload_date': '20151214',
 								                'uploader': 'OpenClassrooms',
 								                'uploader_id': 'openclassrooms',
 								            },
 								            'add_ie': ['Vimeo'],
 								        },
-												[extractor/generic] Add vimeo embed that requires Referer passed

											
										
										
											8 years ago
+								        {
 								            # generic vimeo embed that requires original URL passed as Referer
 								            'url': 'http://racing4everyone.eu/2016/07/30/formula-1-2016-round12-germany/',
 								            'only_matching': True,
 								        },
-												[extractor/generic] Add support for arkena embeds

											
										
										
											9 years ago
+								        {
 								            'url': 'https://support.arkena.com/display/PLAY/Ways+to+embed+your+video',
 								            'md5': 'b96f2f71b359a8ecd05ce4e1daa72365',
 								            'info_dict': {
 								                'id': 'b41dda37-d8e7-4d3f-b1b5-9a9db578bdfe',
 								                'ext': 'mp4',
 								                'title': 'Big Buck Bunny',
 								                'description': 'Royalty free test video',
 								                'timestamp': 1432816365,
 								                'upload_date': '20150528',
 								                'is_live': False,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								            'add_ie': [ArkenaIE.ie_key()],
 								        },
-												[vbox7:generic] Add support for vbox7 embeds

											
										
										
											8 years ago
+								        {
 								            'url': 'http://nova.bg/news/view/2016/08/16/156543/%D0%BD%D0%B0-%D0%BA%D0%BE%D1%81%D1%8A%D0%BC-%D0%BE%D1%82-%D0%B2%D0%B7%D1%80%D0%B8%D0%B2-%D0%BE%D1%82%D1%86%D0%B5%D0%BF%D0%B8%D1%85%D0%B0-%D1%86%D1%8F%D0%BB-%D0%BA%D0%B2%D0%B0%D1%80%D1%82%D0%B0%D0%BB-%D0%B7%D0%B0%D1%80%D0%B0%D0%B4%D0%B8-%D0%B8%D0%B7%D1%82%D0%B8%D1%87%D0%B0%D0%BD%D0%B5-%D0%BD%D0%B0-%D0%B3%D0%B0%D0%B7-%D0%B2-%D0%BF%D0%BB%D0%BE%D0%B2%D0%B4%D0%B8%D0%B2/',
 								            'info_dict': {
 								                'id': '1c7141f46c',
 								                'ext': 'mp4',
 								                'title': 'НА КОСЪМ ОТ ВЗРИВ: Изтичане на газ на бензиностанция в Пловдив',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								            'add_ie': [Vbox7IE.ie_key()],
 								        },
-												[DBTV:generic] Add support for embeds

											
										
										
											8 years ago
+								        {
 								            # DBTV embeds
 								            'url': 'http://www.dagbladet.no/2016/02/23/nyheter/nordlys/ski/troms/ver/43254897/',
-												[generic] Fix dbtv test (Closes #10364)

											
										
										
											8 years ago
+								            'info_dict': {
 								                'id': '43254897',
 								                'title': 'Etter ett års planlegging, klaffet endelig alt: - Jeg måtte ta en liten dans',
 								            },
-												[DBTV:generic] Add support for embeds

											
										
										
											8 years ago
+								            'playlist_mincount': 3,
 								        },
-												[videa] Add support for videa embeds

											
										
										
											8 years ago
+								        {
 								            # Videa embeds
 								            'url': 'http://forum.dvdtalk.com/movie-talk/623756-deleted-magic-star-wars-ot-deleted-alt-scenes-docu-style.html',
 								            'info_dict': {
 								                'id': '623756-deleted-magic-star-wars-ot-deleted-alt-scenes-docu-style',
 								                'title': 'Deleted Magic - Star Wars: OT Deleted / Alt. Scenes Docu. Style - DVD Talk Forum',
 								            },
 								            'playlist_mincount': 2,
 								        },
-												[extractor/generic] Add support for 20 minuten embeds (closes #11683, closes #11751)

											
										
										
											8 years ago
+								        {
 								            # 20 minuten embed
 								            'url': 'http://www.20min.ch/schweiz/news/story/So-kommen-Sie-bei-Eis-und-Schnee-sicher-an-27032552',
 								            'info_dict': {
 								                'id': '523629',
 								                'ext': 'mp4',
 								                'title': 'So kommen Sie bei Eis und Schnee sicher an',
 								                'description': 'md5:117c212f64b25e3d95747e5276863f7d',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								            'add_ie': [TwentyMinutenIE.ie_key()],
-												[videopress] Add extractor

											
										
										
											8 years ago
+								        },
 								        {
 								            # VideoPress embed
 								            'url': 'https://en.support.wordpress.com/videopress/',
 								            'info_dict': {
 								                'id': 'OcobLTqC',
 								                'ext': 'm4v',
 								                'title': 'IMG_5786',
 								                'timestamp': 1435711927,
 								                'upload_date': '20150701',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								            'add_ie': [VideoPressIE.ie_key()],
-												[theplatform] Recognize URLs with whitespaces (closes #12044)

											
										
										
											8 years ago
+								        },
-												[generic] Add support for rutube embeds

											
										
										
											8 years ago
+								        {
 								            # Rutube embed
 								            'url': 'http://magazzino.friday.ru/videos/vipuski/kazan-2',
 								            'info_dict': {
 								                'id': '9b3d5bee0a8740bf70dfd29d3ea43541',
 								                'ext': 'flv',
 								                'title': 'Магаззино: Казань 2',
 								                'description': 'md5:99bccdfac2269f0e8fdbc4bbc9db184a',
 								                'uploader': 'Магаззино',
 								                'upload_date': '20170228',
 								                'uploader_id': '996642',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								            'add_ie': [RutubeIE.ie_key()],
 								        },
-												[theplatform] Recognize URLs with whitespaces (closes #12044)

											
										
										
											8 years ago
+								        {
 								            # ThePlatform embedded with whitespaces in URLs
 								            'url': 'http://www.golfchannel.com/topics/shows/golftalkcentral.htm',
 								            'only_matching': True,
 								        },
-												[generic] Add test for Senate ISVP iframe embed


											
										
										
											8 years ago
+								        {
 								            # Senate ISVP iframe https
 								            'url': 'https://www.hsgac.senate.gov/hearings/canadas-fast-track-refugee-plan-unanswered-questions-and-implications-for-us-national-security',
 								            'md5': 'fb8c70b0b515e5037981a2492099aab8',
 								            'info_dict': {
 								                'id': 'govtaff020316',
 								                'ext': 'mp4',
 								                'title': 'Integrated Senate Video Player',
 								            },
 								            'add_ie': [SenateISVPIE.ie_key()],
 								        },
-												[extractor/generic] Add test for #12761

											
										
										
											8 years ago
+								        {
 								            # Limelight embeds (1 channel embed + 4 media embeds)
 								            'url': 'http://www.sedona.com/FacilitatorTraining2017',
 								            'info_dict': {
 								                'id': 'FacilitatorTraining2017',
 								                'title': 'Facilitator Training 2017',
 								            },
 								            'playlist_mincount': 5,
 								        },
-												[generic] Add test for #13895

											
										
										
											7 years ago
+								        {
 								            # Limelight embed (LimelightPlayerUtil.embed)
 								            'url': 'https://tv5.ca/videos?v=xuu8qowr291ri',
 								            'info_dict': {
 								                'id': '95d035dc5c8a401588e9c0e6bd1e9c92',
 								                'ext': 'mp4',
 								                'title': '07448641',
 								                'timestamp': 1499890639,
 								                'upload_date': '20170712',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								            'add_ie': ['LimelightMedia'],
 								        },
-												[anvato] Improve extraction (closes #12913)
* Promote to regular shortcut based extractor
* Add mcp to access key mapping table
* Add support for embeds extraction
* Add support for anvato embeds in generic extractor

											
										
										
											8 years ago
+								        {
 								            'url': 'http://kron4.com/2017/04/28/standoff-with-walnut-creek-murder-suspect-ends-with-arrest/',
 								            'info_dict': {
 								                'id': 'standoff-with-walnut-creek-murder-suspect-ends-with-arrest',
 								                'title': 'Standoff with Walnut Creek murder suspect ends',
 								                'description': 'md5:3ccc48a60fc9441eeccfc9c469ebf788',
 								            },
 								            'playlist_mincount': 4,
 								        },
-												[washingtonpost] Add support for embeds (closes #12699)

											
										
										
											8 years ago
+								        {
 								            # WashingtonPost embed
 								            'url': 'http://www.vanityfair.com/hollywood/2017/04/donald-trump-tv-pitches',
 								            'info_dict': {
 								                'id': '8caf6e88-d0ec-11e5-90d3-34c2c42653ac',
 								                'ext': 'mp4',
 								                'title': "No one has seen the drama series based on Trump's life \u2014 until now",
 								                'description': 'Donald Trump wanted a weekly TV drama based on his life. It never aired. But The Washington Post recently obtained a scene from the pilot script — and enlisted actors.',
 								                'timestamp': 1455216756,
 								                'uploader': 'The Washington Post',
 								                'upload_date': '20160211',
 								            },
 								            'add_ie': [WashingtonPostIE.ie_key()],
 								        },
-												[extractor/generic] Add test for mediaset embed

											
										
										
											8 years ago
+								        {
 								            # Mediaset embed
 								            'url': 'http://www.tgcom24.mediaset.it/politica/serracchiani-voglio-vivere-in-una-societa-aperta-reazioni-sproporzionate-_3071354-201702a.shtml',
 								            'info_dict': {
 								                'id': '720642',
 								                'ext': 'mp4',
 								                'title': 'Serracchiani: "Voglio vivere in una società aperta, con tutela del patto di fiducia"',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								            'add_ie': [MediasetIE.ie_key()],
 								        },
-												[joj] Rewrite and add support for generic embeds (closes #13268)

											
										
										
											8 years ago
+								        {
 								            # JOJ.sk embeds
 								            'url': 'https://www.noviny.sk/slovensko/238543-slovenskom-sa-prehnala-vlna-silnych-burok',
 								            'info_dict': {
 								                'id': '238543-slovenskom-sa-prehnala-vlna-silnych-burok',
 								                'title': 'Slovenskom sa prehnala vlna silných búrok',
 								            },
 								            'playlist_mincount': 5,
 								            'add_ie': [JojIE.ie_key()],
 								        },
-												[extractor/common] Add support for AMP tags in _parse_html5_media_entries

											
										
										
											8 years ago
+								        {
 								            # AMP embed (see https://www.ampproject.org/docs/reference/components/amp-video)
 								            'url': 'https://tvrain.ru/amp/418921/',
 								            'md5': 'cc00413936695987e8de148b67d14f1d',
 								            'info_dict': {
 								                'id': '418921',
 								                'ext': 'mp4',
 								                'title': 'Стас Намин: «Мы нарушили девственность Кремля»',
 								            },
 								        },
-												[generic] Add support for vzaar embeds


											
										
										
											7 years ago
+								        {
 								            # vzaar embed
-												[generic] Replace vzaar embed test

											
										
										
											7 years ago
+								            'url': 'http://help.vzaar.com/article/165-embedding-video',
 								            'md5': '7e3919d9d2620b89e3e00bec7fe8c9d4',
-												[generic] Add support for vzaar embeds


											
										
										
											7 years ago
+								            'info_dict': {
-												[generic] Replace vzaar embed test

											
										
										
											7 years ago
+								                'id': '8707641',
-												[generic] Add support for vzaar embeds


											
										
										
											7 years ago
+								                'ext': 'mp4',
-												[generic] Replace vzaar embed test

											
										
										
											7 years ago
+								                'title': 'Building A Business Online: Principal Chairs Q & A',
-												[generic] Add support for vzaar embeds


											
										
										
											7 years ago
+								            },
 								        },
-												[generic] Fix support for multiple HTML5 videos on one page (closes #14080)


											
										
										
											7 years ago
+								        {
 								            # multiple HTML5 videos on one page
 								            'url': 'https://www.paragon-software.com/home/rk-free/keyscenarios.html',
 								            'info_dict': {
 								                'id': 'keyscenarios',
 								                'title': 'Rescue Kit 14 Free Edition - Getting started',
 								            },
 								            'playlist_count': 4,
-												[vshare] Fix extraction (closes #14473)


											
										
										
											7 years ago
+								        },
 								        {
 								            # vshare embed
 								            'url': 'https://youtube-dl-demo.neocities.org/vshare.html',
 								            'md5': '17b39f55b5497ae8b59f5fbce8e35886',
 								            'info_dict': {
 								                'id': '0f64ce6',
 								                'title': 'vl14062007715967',
 								                'ext': 'mp4',
 								            }
-												[mediasite] Improve extraction and code style, add support for DASH (closes #11185, closes #14343, refs #5428)

											
										
										
											7 years ago
+								        },
 								        {
 								            'url': 'http://www.heidelberg-laureate-forum.org/blog/video/lecture-friday-september-23-2016-sir-c-antony-r-hoare/',
 								            'md5': 'aecd089f55b1cb5a59032cb049d3a356',
 								            'info_dict': {
 								                'id': '90227f51a80c4d8f86c345a7fa62bd9a1d',
 								                'ext': 'mp4',
 								                'title': 'Lecture: Friday, September 23, 2016 - Sir Tony Hoare',
 								                'description': 'md5:5a51db84a62def7b7054df2ade403c6c',
 								                'timestamp': 1474354800,
 								                'upload_date': '20160920',
 								            }
-												[springboardplatform] Add extractor

											
										
										
											7 years ago
+								        },
 								        {
 								            'url': 'http://www.kidzworld.com/article/30935-trolls-the-beat-goes-on-interview-skylar-astin-and-amanda-leighton',
 								            'info_dict': {
 								                'id': '1731611',
 								                'ext': 'mp4',
 								                'title': 'Official Trailer | TROLLS: THE BEAT GOES ON!',
 								                'description': 'md5:eb5f23826a027ba95277d105f248b825',
 								                'timestamp': 1516100691,
 								                'upload_date': '20180116',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								            'add_ie': [SpringboardPlatformIE.ie_key()],
-												[youtube] Handle shared URLs with generic extractor (closes #14303)

											
										
										
											7 years ago
+								        },
 								        {
 								            'url': 'https://www.youtube.com/shared?ci=1nEzmT-M4fU',
 								            'info_dict': {
 								                'id': 'uPDB5I9wfp8',
 								                'ext': 'webm',
 								                'title': 'Pocoyo: 90 minutos de episódios completos Português para crianças - PARTE 3',
 								                'description': 'md5:d9e4d9346a2dfff4c7dc4c8cec0f546d',
 								                'upload_date': '20160219',
 								                'uploader': 'Pocoyo - Português (BR)',
 								                'uploader_id': 'PocoyoBrazil',
 								            },
 								            'add_ie': [YoutubeIE.ie_key()],
 								            'params': {
 								                'skip_download': True,
 								            },
-												[yapfiles] Add extractor (closes #15726, refs #11085)

											
										
										
											7 years ago
+								        },
 								        {
 								            'url': 'https://www.yapfiles.ru/show/1872528/690b05d3054d2dbe1e69523aa21bb3b1.mp4.html',
 								            'info_dict': {
 								                'id': 'vMDE4NzI1Mjgt690b',
 								                'ext': 'mp4',
 								                'title': 'Котята',
 								            },
 								            'add_ie': [YapFilesIE.ie_key()],
 								            'params': {
 								                'skip_download': True,
 								            },
-												[generic] Add support for share-videos.se embeds (closes #16089)


											
										
										
											7 years ago
+								        },
-												[cloudflarestream] Add support for cloudflare streams (closes #16375)

											
										
										
											7 years ago
+								        {
 								            # CloudflareStream embed
 								            'url': 'https://www.cloudflare.com/products/cloudflare-stream/',
 								            'info_dict': {
 								                'id': '31c9291ab41fac05471db4e73aa11717',
 								                'ext': 'mp4',
 								                'title': '31c9291ab41fac05471db4e73aa11717',
 								            },
 								            'add_ie': [CloudflareStreamIE.ie_key()],
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[peertube] Add support for generic embeds

											
										
										
											7 years ago
+								        {
 								            # PeerTube embed
 								            'url': 'https://joinpeertube.org/fr/home/',
 								            'info_dict': {
 								                'id': 'home',
 								                'title': 'Reprenez le contrôle de vos vidéos ! #JoinPeertube',
 								            },
 								            'playlist_count': 2,
 								        },
-												[indavideo] Add support for generic embeds (closes #11989)

											
										
										
											7 years ago
+								        {
 								            # Indavideo embed
 								            'url': 'https://streetkitchen.hu/receptek/igy_kell_otthon_hamburgert_sutni/',
 								            'info_dict': {
 								                'id': '1693903',
 								                'ext': 'mp4',
 								                'title': 'Így kell otthon hamburgert sütni',
 								                'description': 'md5:f5a730ecf900a5c852e1e00540bbb0f7',
 								                'timestamp': 1426330212,
 								                'upload_date': '20150314',
 								                'uploader': 'StreetKitchen',
 								                'uploader_id': '546363',
 								            },
 								            'add_ie': [IndavideoEmbedIE.ie_key()],
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[apa] Add extractor (closes #15041, closes #15672)

											
										
										
											7 years ago
+								        {
 								            # APA embed via JWPlatform embed
 								            'url': 'http://www.vol.at/blue-man-group/5593454',
 								            'info_dict': {
 								                'id': 'jjv85FdZ',
 								                'ext': 'mp4',
 								                'title': '"Blau ist mysteriös": Die Blue Man Group im Interview',
 								                'description': 'md5:d41d8cd98f00b204e9800998ecf8427e',
 								                'thumbnail': r're:^https?://.*\.jpg$',
 								                'duration': 254,
 								                'timestamp': 1519211149,
 								                'upload_date': '20180221',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[generic] Add support for share-videos.se embeds (closes #16089)


											
										
										
											7 years ago
+								        {
 								            'url': 'http://share-videos.se/auto/video/83645793?uid=13',
 								            'md5': 'b68d276de422ab07ee1d49388103f457',
 								            'info_dict': {
 								                'id': '83645793',
 								                'title': 'Lock up and get excited',
 								                'ext': 'mp4'
-												[generic] Restrict share-videos.se embeds regex to filter bogus URLs (#16115)

											
										
										
											7 years ago
+								            },
 								            'skip': 'TODO: fix nested playlists processing in tests',
 								        },
-												[viqeo] Add extractor (closes #17066)

											
										
										
											7 years ago
+								        {
 								            # Viqeo embeds
 								            'url': 'https://viqeo.tv/',
 								            'info_dict': {
 								                'id': 'viqeo',
 								                'title': 'All-new video platform',
 								            },
 								            'playlist_count': 6,
 								        },
-												[generic] Allow relative src for videojs embeds (closes #17324)

											
										
										
											6 years ago
+								        {
 								            # videojs embed
 								            'url': 'https://video.sibnet.ru/shell.php?videoid=3422904',
 								            'info_dict': {
 								                'id': 'shell',
 								                'ext': 'mp4',
 								                'title': 'Доставщик пиццы спросил разрешения сыграть на фортепиано',
 								                'description': 'md5:89209cdc587dab1e4a090453dbaa2cb1',
 								                'thumbnail': r're:^https?://.*\.jpg$',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								            'expected_warnings': ['Failed to download MPD manifest'],
 								        },
-												[extractor/generic] Properly comment out a test

											
										
										
											9 years ago
+								        # {
 								        #     # TODO: find another test
 								        #     # http://schema.org/VideoObject
 								        #     'url': 'https://flipagram.com/f/nyvTSJMKId',
 								        #     'md5': '888dcf08b7ea671381f00fab74692755',
 								        #     'info_dict': {
 								        #         'id': 'nyvTSJMKId',
 								        #         'ext': 'mp4',
 								        #         'title': 'Flipagram by sjuria101 featuring Midnight Memories by One Direction',
 								        #         'description': '#love for cats.',
 								        #         'timestamp': 1461244995,
 								        #         'upload_date': '20160421',
 								        #     },
 								        #     'params': {
 								        #         'force_generic_extractor': True,
 								        #     },
 								        # }
-												GenericIE: Detect videos from Brightcove

Brightcove videos info is usually found in an <object class="BrightcoveExperience"></object> node, this is passed to a new method of BrightcoveIE that builds a url to extract the video.

											
										
										
											12 years ago
+								    ]
-												Move GenericIE into its own file

											
										
										
											12 years ago
 								    def report_following_redirect(self, new_url):
 								        """Print a '[redirect]' notice naming the URL that is now being followed."""
 								        notice = '[redirect] Following redirect to %s' % new_url
 								        self._downloader.to_screen(notice)
-												Move GenericIE into its own file

											
										
										
											12 years ago
-												[generic] Add support for RSS feeds (Fixes #667)

											
										
										
											11 years ago
+								    def _extract_rss(self, url, video_id, doc):
 								        playlist_title = doc.find('./channel/title').text
 								        playlist_desc_el = doc.find('./channel/description')
 								        playlist_desc = None if playlist_desc_el is None else playlist_desc_el.text
-												[generic] Parse RSS enclosure URLs (Fixes #5091)

											
										
										
											10 years ago
+								        entries = []
 								        for it in doc.findall('./channel/item'):
-												[generic] Prefer enclosures over links in RSS feeds


											
										
										
											7 years ago
+								            next_url = None
 								            enclosure_nodes = it.findall('./enclosure')
 								            for e in enclosure_nodes:
 								                next_url = e.attrib.get('url')
 								                if next_url:
 								                    break
-												[generic] Parse RSS enclosure URLs (Fixes #5091)

											
										
										
											10 years ago
+								            if not next_url:
-												[generic] Prefer enclosures over links in RSS feeds


											
										
										
											7 years ago
+								                next_url = xpath_text(it, 'link', fatal=False)
-												[generic] Parse RSS enclosure URLs (Fixes #5091)

											
										
										
											10 years ago
 								            if not next_url:
 								                continue
 								            entries.append({
-												[extractor/generic] Extract RSS entries as url_transparent (#11163)

											
										
										
											8 years ago
+								                '_type': 'url_transparent',
-												[generic] Parse RSS enclosure URLs (Fixes #5091)

											
										
										
											10 years ago
+								                'url': next_url,
 								                'title': it.find('title').text,
 								            })
-												[generic] Add support for RSS feeds (Fixes #667)

											
										
										
											11 years ago
 								        return {
 								            '_type': 'playlist',
 								            'id': url,
 								            'title': playlist_title,
 								            'description': playlist_desc,
 								            'entries': entries,
 								        }
-												[generic] Add support for camtasia videos (Fixes #3574)

											
										
										
											10 years ago
+								    def _extract_camtasia(self, url, video_id, webpage):
 								        """ Returns None if no camtasia video can be found. """
 								        camtasia_cfg = self._search_regex(
 								            r'fo\.addVariable\(\s*"csConfigFile",\s*"([^"]+)"\s*\);',
 								            webpage, 'camtasia configuration file', default=None)
 								        if camtasia_cfg is None:
 								            return None
 								        title = self._html_search_meta('DC.title', webpage, fatal=True)
 								        camtasia_url = compat_urlparse.urljoin(url, camtasia_cfg)
 								        camtasia_cfg = self._download_xml(
 								            camtasia_url, video_id,
 								            note='Downloading camtasia configuration',
 								            errnote='Failed to download camtasia configuration')
 								        fileset_node = camtasia_cfg.find('./playlist/array/fileset')
 								        entries = []
 								        for n in fileset_node.getchildren():
 								            url_n = n.find('./uri')
 								            if url_n is None:
 								                continue
 								            entries.append({
 								                'id': os.path.splitext(url_n.text.rpartition('/')[2])[0],
 								                'title': '%s - %s' % (title, n.tag),
 								                'url': compat_urlparse.urljoin(url, url_n.text),
 								                'duration': float_or_none(n.find('./duration').text),
 								            })
 								        return {
 								            '_type': 'playlist',
 								            'entries': entries,
 								            'title': title,
 								        }
-												Move GenericIE into its own file

											
										
										
											12 years ago
+								    def _real_extract(self, url):
-												[generic] Add support for protocol-independent URLs (Fixes #2810)

											
										
										
											11 years ago
+								        if url.startswith('//'):
 								            return {
 								                '_type': 'url',
-												[soundcloud/generic] Add support for playlists

											
										
										
											11 years ago
+								                'url': self.http_scheme() + url,
-												[generic] Add support for protocol-independent URLs (Fixes #2810)

											
										
										
											11 years ago
+								            }
-												[generic] If the url doesn't specify the protocol, then try to extract prepending 'http://'

											
										
										
											11 years ago
+								        parsed_url = compat_urlparse.urlparse(url)
 								        if not parsed_url.scheme:
-												Add new --default-search option (#2193)

											
										
										
											11 years ago
+								            default_search = self._downloader.params.get('default_search')
 								            if default_search is None:
-												[generic] Add --default-search fixup_error

This restores the ability to enter URLs without a scheme (and default to http), but still fail if the input is a search term.

											
										
										
											11 years ago
+								                default_search = 'fixup_error'
-												Add new --default-search option (#2193)

											
										
										
											11 years ago
-												[generic] Add --default-search fixup_error

This restores the ability to enter URLs without a scheme (and default to http), but still fail if the input is a search term.

											
										
										
											11 years ago
+								            if default_search in ('auto', 'auto_warning', 'fixup_error'):
-												Add new --default-search option (#2193)

											
										
										
											11 years ago
+								                if '/' in url:
 								                    self._downloader.report_warning('The url doesn\'t specify the protocol, trying with http')
 								                    return self.url_result('http://' + url)
-												[generic] Add --default-search fixup_error

This restores the ability to enter URLs without a scheme (and default to http), but still fail if the input is a search term.

											
										
										
											11 years ago
+								                elif default_search != 'fixup_error':
-												[generic] Warn before fallback to automatic search

											
										
										
											11 years ago
+								                    if default_search == 'auto_warning':
-												[generic] Abort if user passes in URL "url" (#2942)

											
										
										
											11 years ago
+								                        if re.match(r'^(?:url|URL)$', url):
 								                            raise ExtractorError(
 								                                'Invalid URL:  %r . Call youtube-dl like this:  youtube-dl -v "https://www.youtube.com/watch?v=BaW_jenozKc"  ' % url,
 								                                expected=True)
 								                        else:
 								                            self._downloader.report_warning(
-												[generic] Set default-search to error

This prevents users from submitting bug reports where they mistyped a URL, and prevents me from getting a weird video when holding shift and thus searching for :Tds

											
										
										
											11 years ago
+								                                'Falling back to youtube search for  %s . Set --default-search "auto" to suppress this warning.' % url)
-												Add new --default-search option (#2193)

											
										
										
											11 years ago
+								                    return self.url_result('ytsearch:' + url)
-												[generic] Add --default-search fixup_error

This restores the ability to enter URLs without a scheme (and default to http), but still fail if the input is a search term.

											
										
										
											11 years ago
 								            if default_search in ('error', 'fixup_error'):
-												[generic] Set default-search to error

This prevents users from submitting bug reports where they mistyped a URL, and prevents me from getting a weird video when holding shift and thus searching for :Tds

											
										
										
											11 years ago
+								                raise ExtractorError(
-												Fix all PEP8 issues except E501

											
										
										
											10 years ago
+								                    '%r is not a valid URL. '
 								                    'Set --default-search "ytsearch" (or run  youtube-dl "ytsearch:%s" ) to search YouTube'
 								                    % (url, url), expected=True)
-												Add new --default-search option (#2193)

											
										
										
											11 years ago
+								            else:
-												[generic] Allow --default-search without colon

											
										
										
											10 years ago
+								                if ':' not in default_search:
 								                    default_search += ':'
-												Add new --default-search option (#2193)

											
										
										
											11 years ago
+								                return self.url_result(default_search + url)
-												[ministrygrid] Add extractor (Fixes #2900)

											
										
										
											10 years ago
 								        url, smuggled_data = unsmuggle_url(url)
 								        force_videoid = None
-												[vimeo:likes] Add new extractor (Fixes #3835)

											
										
										
											10 years ago
+								        is_intentional = smuggled_data and smuggled_data.get('to_generic')
-												[ministrygrid] Add extractor (Fixes #2900)

											
										
										
											10 years ago
+								        if smuggled_data and 'force_videoid' in smuggled_data:
 								            force_videoid = smuggled_data['force_videoid']
 								            video_id = force_videoid
 								        else:
-												[generic,commonprotocols] Move mms support from GenericIE

And use _generic_* helpers in those extractors

											
										
										
											8 years ago
+								            video_id = self._generic_id(url)
-												[generic] Support direct MMS links (closes #10838)

											
										
										
											8 years ago
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								        self.to_screen('%s: Requesting header' % video_id)
-												[generic] Output something before making network requests

											
										
										
											11 years ago
-												[generic] Use default opener for HEAD request (Fixes #3528)

											
										
										
											10 years ago
+								        head_req = HEADRequest(url)
-												[generic] Handle audio streams that do not implement HEAD (Fixes #4032)

											
										
										
											10 years ago
+								        head_response = self._request_webpage(
-												[generic] Use default opener for HEAD request (Fixes #3528)

											
										
										
											10 years ago
+								            head_req, video_id,
 								            note=False, errnote='Could not send HEAD request to %s' % url,
 								            fatal=False)
-												Add support for direct links to a video (#1973)

											
										
										
											11 years ago
-												[generic] Handle audio streams that do not implement HEAD (Fixes #4032)

											
										
										
											10 years ago
+								        if head_response is not False:
-												Add support for direct links to a video (#1973)

											
										
										
											11 years ago
+								            # Check for redirect
-												[generic] Convert redirect URLs to unicode strings (closes #13951)

											
										
										
											7 years ago
+								            new_url = compat_str(head_response.geturl())
-												Add support for direct links to a video (#1973)

											
										
										
											11 years ago
+								            if url != new_url:
 								                self.report_following_redirect(new_url)
-												[ministrygrid] Add extractor (Fixes #2900)

											
										
										
											10 years ago
+								                if force_videoid:
 								                    new_url = smuggle_url(
 								                        new_url, {'force_videoid': force_videoid})
-												[generic] Do not use compatibility result fallback

											
										
										
											11 years ago
+								                return self.url_result(new_url)
-												Add support for direct links to a video (#1973)

											
										
										
											11 years ago
-												[generic] Handle audio streams that do not implement HEAD (Fixes #4032)

											
										
										
											10 years ago
+								        full_response = None
 								        if head_response is False:
-												Switch codebase to use sanitized_Request instead of
compat_urllib_request.Request

[downloader/dash] Use sanitized_Request

[downloader/http] Use sanitized_Request

[atresplayer] Use sanitized_Request

[bambuser] Use sanitized_Request

[bliptv] Use sanitized_Request

[brightcove] Use sanitized_Request

[cbs] Use sanitized_Request

[ceskatelevize] Use sanitized_Request

[collegerama] Use sanitized_Request

[extractor/common] Use sanitized_Request

[crunchyroll] Use sanitized_Request

[dailymotion] Use sanitized_Request

[dcn] Use sanitized_Request

[dramafever] Use sanitized_Request

[dumpert] Use sanitized_Request

[eitb] Use sanitized_Request

[escapist] Use sanitized_Request

[everyonesmixtape] Use sanitized_Request

[extremetube] Use sanitized_Request

[facebook] Use sanitized_Request

[fc2] Use sanitized_Request

[flickr] Use sanitized_Request

[4tube] Use sanitized_Request

[gdcvault] Use sanitized_Request

[extractor/generic] Use sanitized_Request

[hearthisat] Use sanitized_Request

[hotnewhiphop] Use sanitized_Request

[hypem] Use sanitized_Request

[iprima] Use sanitized_Request

[ivi] Use sanitized_Request

[keezmovies] Use sanitized_Request

[letv] Use sanitized_Request

[lynda] Use sanitized_Request

[metacafe] Use sanitized_Request

[minhateca] Use sanitized_Request

[miomio] Use sanitized_Request

[meovideo] Use sanitized_Request

[mofosex] Use sanitized_Request

[moniker] Use sanitized_Request

[mooshare] Use sanitized_Request

[movieclips] Use sanitized_Request

[mtv] Use sanitized_Request

[myvideo] Use sanitized_Request

[neteasemusic] Use sanitized_Request

[nfb] Use sanitized_Request

[niconico] Use sanitized_Request

[noco] Use sanitized_Request

[nosvideo] Use sanitized_Request

[novamov] Use sanitized_Request

[nowness] Use sanitized_Request

[nuvid] Use sanitized_Request

[played] Use sanitized_Request

[pluralsight] Use sanitized_Request

[pornhub] Use sanitized_Request

[pornotube] Use sanitized_Request

[primesharetv] Use sanitized_Request

[promptfile] Use sanitized_Request

[qqmusic] Use sanitized_Request

[rtve] Use sanitized_Request

[safari] Use sanitized_Request

[sandia] Use sanitized_Request

[shared] Use sanitized_Request

[sharesix] Use sanitized_Request

[sina] Use sanitized_Request

[smotri] Use sanitized_Request

[sohu] Use sanitized_Request

[spankwire] Use sanitized_Request

[sportdeutschland] Use sanitized_Request

[streamcloud] Use sanitized_Request

[streamcz] Use sanitized_Request

[tapely] Use sanitized_Request

[tube8] Use sanitized_Request

[tubitv] Use sanitized_Request

[twitch] Use sanitized_Request

[twitter] Use sanitized_Request

[udemy] Use sanitized_Request

[vbox7] Use sanitized_Request

[veoh] Use sanitized_Request

[vessel] Use sanitized_Request

[vevo] Use sanitized_Request

[viddler] Use sanitized_Request

[videomega] Use sanitized_Request

[viewvster] Use sanitized_Request

[viki] Use sanitized_Request

[vk] Use sanitized_Request

[vodlocker] Use sanitized_Request

[voicerepublic] Use sanitized_Request

[wistia] Use sanitized_Request

[xfileshare] Use sanitized_Request

[xtube] Use sanitized_Request

[xvideos] Use sanitized_Request

[yandexmusic] Use sanitized_Request

[youku] Use sanitized_Request

[youporn] Use sanitized_Request

[youtube] Use sanitized_Request

[patreon] Use sanitized_Request

[extractor/common] Remove unused import

[nfb] PEP 8

											
										
										
											9 years ago
+								            request = sanitized_Request(url)
-												[extractor/generic] Force Accept-Encoding to any for extraction pass

											
										
										
											10 years ago
+								            request.add_header('Accept-Encoding', '*')
 								            full_response = self._request_webpage(request, video_id)
-												[generic] Handle audio streams that do not implement HEAD (Fixes #4032)

											
										
										
											10 years ago
+								            head_response = full_response
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											9 years ago
+								        info_dict = {
 								            'id': video_id,
-												[generic,commonprotocols] Move mms support from GenericIE

And use _generic_* helpers in those extractors

											
										
										
											8 years ago
+								            'title': self._generic_title(url),
-												[extractor/generic] Simplify upload_date extraction

											
										
										
											9 years ago
+								            'upload_date': unified_strdate(head_response.headers.get('Last-Modified'))
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											9 years ago
+								        }
-												[generic] Handle audio streams that do not implement HEAD (Fixes #4032)

											
										
										
											10 years ago
+								        # Check for direct link to a video
-												[extractor/generic] Force Content-Type to lowercase

											
										
										
											9 years ago
+								        content_type = head_response.headers.get('Content-Type', '').lower()
-												[extractor/generic] Properly extract format id from Content-Type

Fixes extraction for cases like: audio/x-mpegURL; charset=utf-8

											
										
										
											9 years ago
+								        m = re.match(r'^(?P<type>audio|video|application(?=/(?:ogg$|(?:vnd\.apple\.|x-)?mpegurl)))/(?P<format_id>[^;\s]+)', content_type)
-												[generic] Handle audio streams that do not implement HEAD (Fixes #4032)

											
										
										
											10 years ago
+								        if m:
-												[extractor/generic] Ensure format id is unicode string

											
										
										
											8 years ago
+								            format_id = compat_str(m.group('format_id'))
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											9 years ago
+								            if format_id.endswith('mpegurl'):
-												[generic] extract m3u8 formats when mpegurl content type detected

											
										
										
											9 years ago
+								                formats = self._extract_m3u8_formats(url, video_id, 'mp4')
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											9 years ago
+								            elif format_id == 'f4m':
 								                formats = self._extract_f4m_formats(url, video_id)
-												[generic] extract m3u8 formats when mpegurl content type detected

											
										
										
											9 years ago
+								            else:
 								                formats = [{
-												[extractor/generic] Ensure format id is unicode string

											
										
										
											8 years ago
+								                    'format_id': format_id,
-												[generic] extract m3u8 formats when mpegurl content type detected

											
										
										
											9 years ago
+								                    'url': url,
 								                    'vcodec': 'none' if m.group('type') == 'audio' else None
 								                }]
-												[extractor/generic] Fix direct link semantics

											
										
										
											9 years ago
+								                info_dict['direct'] = True
-												Remove _sort_formats from _extract_*_formats methods

Now _sort_formats should be called explicitly.
_sort_formats has been added to all the necessary places in code.

Closes #8051

											
										
										
											9 years ago
+								            self._sort_formats(formats)
-												[extractor/generic] Fix direct link semantics

											
										
										
											9 years ago
+								            info_dict['formats'] = formats
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											9 years ago
+								            return info_dict
-												Add support for direct links to a video (#1973)

											
										
										
											11 years ago
-												[vimeo:likes] Add new extractor (Fixes #3835)

											
										
										
											10 years ago
+								        if not self._downloader.params.get('test', False) and not is_intentional:
-												[extractor/generic] Clarify generic extraction warning

											
										
										
											10 years ago
+								            force = self._downloader.params.get('force_generic_extractor', False)
 								            self._downloader.report_warning(
 								                '%s on generic information extractor.' % ('Forcing' if force else 'Falling back'))
-												[vimeo:likes] Add new extractor (Fixes #3835)

											
										
										
											10 years ago
-												[generic] Detect direct video links (Fixes #4149, #4313)

											
										
										
											10 years ago
+								        if not full_response:
-												Switch codebase to use sanitized_Request instead of
compat_urllib_request.Request

[downloader/dash] Use sanitized_Request

[downloader/http] Use sanitized_Request

[atresplayer] Use sanitized_Request

[bambuser] Use sanitized_Request

[bliptv] Use sanitized_Request

[brightcove] Use sanitized_Request

[cbs] Use sanitized_Request

[ceskatelevize] Use sanitized_Request

[collegerama] Use sanitized_Request

[extractor/common] Use sanitized_Request

[crunchyroll] Use sanitized_Request

[dailymotion] Use sanitized_Request

[dcn] Use sanitized_Request

[dramafever] Use sanitized_Request

[dumpert] Use sanitized_Request

[eitb] Use sanitized_Request

[escapist] Use sanitized_Request

[everyonesmixtape] Use sanitized_Request

[extremetube] Use sanitized_Request

[facebook] Use sanitized_Request

[fc2] Use sanitized_Request

[flickr] Use sanitized_Request

[4tube] Use sanitized_Request

[gdcvault] Use sanitized_Request

[extractor/generic] Use sanitized_Request

[hearthisat] Use sanitized_Request

[hotnewhiphop] Use sanitized_Request

[hypem] Use sanitized_Request

[iprima] Use sanitized_Request

[ivi] Use sanitized_Request

[keezmovies] Use sanitized_Request

[letv] Use sanitized_Request

[lynda] Use sanitized_Request

[metacafe] Use sanitized_Request

[minhateca] Use sanitized_Request

[miomio] Use sanitized_Request

[meovideo] Use sanitized_Request

[mofosex] Use sanitized_Request

[moniker] Use sanitized_Request

[mooshare] Use sanitized_Request

[movieclips] Use sanitized_Request

[mtv] Use sanitized_Request

[myvideo] Use sanitized_Request

[neteasemusic] Use sanitized_Request

[nfb] Use sanitized_Request

[niconico] Use sanitized_Request

[noco] Use sanitized_Request

[nosvideo] Use sanitized_Request

[novamov] Use sanitized_Request

[nowness] Use sanitized_Request

[nuvid] Use sanitized_Request

[played] Use sanitized_Request

[pluralsight] Use sanitized_Request

[pornhub] Use sanitized_Request

[pornotube] Use sanitized_Request

[primesharetv] Use sanitized_Request

[promptfile] Use sanitized_Request

[qqmusic] Use sanitized_Request

[rtve] Use sanitized_Request

[safari] Use sanitized_Request

[sandia] Use sanitized_Request

[shared] Use sanitized_Request

[sharesix] Use sanitized_Request

[sina] Use sanitized_Request

[smotri] Use sanitized_Request

[sohu] Use sanitized_Request

[spankwire] Use sanitized_Request

[sportdeutschland] Use sanitized_Request

[streamcloud] Use sanitized_Request

[streamcz] Use sanitized_Request

[tapely] Use sanitized_Request

[tube8] Use sanitized_Request

[tubitv] Use sanitized_Request

[twitch] Use sanitized_Request

[twitter] Use sanitized_Request

[udemy] Use sanitized_Request

[vbox7] Use sanitized_Request

[veoh] Use sanitized_Request

[vessel] Use sanitized_Request

[vevo] Use sanitized_Request

[viddler] Use sanitized_Request

[videomega] Use sanitized_Request

[viewvster] Use sanitized_Request

[viki] Use sanitized_Request

[vk] Use sanitized_Request

[vodlocker] Use sanitized_Request

[voicerepublic] Use sanitized_Request

[wistia] Use sanitized_Request

[xfileshare] Use sanitized_Request

[xtube] Use sanitized_Request

[xvideos] Use sanitized_Request

[yandexmusic] Use sanitized_Request

[youku] Use sanitized_Request

[youporn] Use sanitized_Request

[youtube] Use sanitized_Request

[patreon] Use sanitized_Request

[extractor/common] Remove unused import

[nfb] PEP 8

											
										
										
											9 years ago
+								            request = sanitized_Request(url)
-												[extractor/generic] Force Accept-Encoding to any for extraction pass

											
										
										
											10 years ago
+								            # Some webservers may serve compressed content of rather big size (e.g. gzipped flac)
 								            # making it impossible to download only chunk of the file (yet we need only 512kB to
 								            # test whether it's HTML or not). According to youtube-dl default Accept-Encoding
 								            # that will always result in downloading the whole file that is not desirable.
 								            # Therefore for extraction pass we have to override Accept-Encoding to any in order
 								            # to accept raw bytes and being able to download only a chunk.
 								            # It may probably better to solve this by checking Content-Type for application/octet-stream
 								            # after HEAD request finishes, but not sure if we can rely on this.
 								            request.add_header('Accept-Encoding', '*')
 								            full_response = self._request_webpage(request, video_id)
-												[generic] Detect direct video links (Fixes #4149, #4313)

											
										
										
											10 years ago
-												[extractor/generic] Detect m3u playlists served without proper Content-Type

											
										
										
											9 years ago
+								        first_bytes = full_response.read(512)
 								        # Is it an M3U playlist?
-												[extractor/generic] Fix missing byte literal prefix

											
										
										
											9 years ago
+								        if first_bytes.startswith(b'#EXTM3U'):
-												[extractor/generic] Detect m3u playlists served without proper Content-Type

											
										
										
											9 years ago
+								            info_dict['formats'] = self._extract_m3u8_formats(url, video_id, 'mp4')
-												Remove _sort_formats from _extract_*_formats methods

Now _sort_formats should be called explicitly.
_sort_formats has been added to all the necessary places in code.

Closes #8051

											
										
										
											9 years ago
+								            self._sort_formats(info_dict['formats'])
-												[extractor/generic] Detect m3u playlists served without proper Content-Type

											
										
										
											9 years ago
+								            return info_dict
-												[generic] Detect direct video links (Fixes #4149, #4313)

											
										
										
											10 years ago
+								        # Maybe it's a direct link to a video?
 								        # Be careful not to download the whole thing!
-												[generic] Add support for BOMs (Fixes #4753)

											
										
										
											10 years ago
+								        if not is_html(first_bytes):
-												[generic] Detect direct video links (Fixes #4149, #4313)

											
										
										
											10 years ago
+								            self._downloader.report_warning(
 								                'URL could be a direct video link, returning it as such.')
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											9 years ago
+								            info_dict.update({
-												[generic] Detect direct video links (Fixes #4149, #4313)

											
										
										
											10 years ago
+								                'direct': True,
 								                'url': url,
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											9 years ago
+								            })
 								            return info_dict
-												[generic] Detect direct video links (Fixes #4149, #4313)

											
										
										
											10 years ago
 								        webpage = self._webpage_read_content(
 								            full_response, url, video_id, prefix=first_bytes)
-												Move GenericIE into its own file

											
										
										
											12 years ago
+								        self.report_extraction(video_id)
-												Support multiple embedded YouTube URLs (Fixes #1787)

											
										
										
											11 years ago
-												[extractor/generic] Detect DASH manifests and extract mpd formats

											
										
										
											9 years ago
+								        # Is it an RSS feed, a SMIL file, an XSPF playlist or a MPD manifest?
-												[generic] Add support for RSS feeds (Fixes #667)

											
										
										
											11 years ago
+								        try:
-												[compat] compat_etree_fromstring: also decode the text attribute

Deletes parse_xml from utils, because it also does it.

											
										
										
											9 years ago
+								            doc = compat_etree_fromstring(webpage.encode('utf-8'))
-												[generic] Add support for RSS feeds (Fixes #667)

											
										
										
											11 years ago
+								            if doc.tag == 'rss':
 								                return self._extract_rss(url, video_id, doc)
-												[extractor/generic] Add support for ISM manifests

											
										
										
											8 years ago
+								            elif doc.tag == 'SmoothStreamingMedia':
 								                info_dict['formats'] = self._parse_ism_formats(doc, url)
 								                self._sort_formats(info_dict['formats'])
 								                return info_dict
-												[extractor/generic] Improve generic SMIL detection

											
										
										
											10 years ago
+								            elif re.match(r'^(?:{[^}]+})?smil$', doc.tag):
-												Remove _sort_formats from _extract_*_formats methods

Now _sort_formats should be called explicitly.
_sort_formats has been added to all the necessary places in code.

Closes #8051

											
										
										
											9 years ago
+								                smil = self._parse_smil(doc, url, video_id)
 								                self._sort_formats(smil['formats'])
 								                return smil
-												[extractor/generic] Add support for xspf playlists

											
										
										
											10 years ago
+								            elif doc.tag == '{http://xspf.org/ns/0/}playlist':
-												[extractor/generic] Support relative URIs in _parse_xspf

<location> can have relative URIs, not just absolute.

											
										
										
											7 years ago
+								                return self.playlist_result(
-												Generalize XML manifest processing code and improve XSPF parsing (closes #15794)

											
										
										
											7 years ago
+								                    self._parse_xspf(
 								                        doc, video_id, xspf_url=url,
 								                        xspf_base_url=compat_str(full_response.geturl())),
-												[extractor/generic] Support relative URIs in _parse_xspf

<location> can have relative URIs, not just absolute.

											
										
										
											7 years ago
+								                    video_id)
-												[extractor/generic] Detect DASH manifests and extract mpd formats

											
										
										
											9 years ago
+								            elif re.match(r'(?i)^(?:{[^}]+})?MPD$', doc.tag):
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											9 years ago
+								                info_dict['formats'] = self._parse_mpd_formats(
-												[extractor/generic] Fix typo (closes #14902)
Don't pass video_id as mpd_id

											
										
										
											7 years ago
+								                    doc,
-												[generic] Convert redirect URLs to unicode strings (closes #13951)

											
										
										
											7 years ago
+								                    mpd_base_url=compat_str(full_response.geturl()).rpartition('/')[0],
-												Refactor fragments interface and dash segments downloader
- Eliminate segment_urls and initialization_url
+ Introduce manifest_url (manifest may contain unfragmented data in this case url will be used for direct media URL and manifest_url for manifest itself correspondingly)
* Rewrite dashsegments downloader to use fragments data
* Improve generic mpd extraction

											
										
										
											8 years ago
+								                    mpd_url=url)
-												Remove _sort_formats from _extract_*_formats methods

Now _sort_formats should be called explicitly.
_sort_formats has been added to all the necessary places in code.

Closes #8051

											
										
										
											9 years ago
+								                self._sort_formats(info_dict['formats'])
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											9 years ago
+								                return info_dict
 								            elif re.match(r'^{http://ns\.adobe\.com/f4m/[12]\.0}manifest$', doc.tag):
 								                info_dict['formats'] = self._parse_f4m_formats(doc, url, video_id)
-												Remove _sort_formats from _extract_*_formats methods

Now _sort_formats should be called explicitly.
_sort_formats has been added to all the necessary places in code.

Closes #8051

											
										
										
											9 years ago
+								                self._sort_formats(info_dict['formats'])
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											9 years ago
+								                return info_dict
-												[generic] Fix on python 2.6

`ParseError` is not available, it raises `xml.parsers.expat.ExpatError`.
The webpage needs to be encoded.

											
										
										
											11 years ago
+								        except compat_xml_parse_error:
-												[generic] Add support for RSS feeds (Fixes #667)

											
										
										
											11 years ago
+								            pass
-												[generic] Add support for camtasia videos (Fixes #3574)

											
										
										
											10 years ago
+								        # Is it a Camtasia project?
 								        camtasia_res = self._extract_camtasia(url, video_id, webpage)
 								        if camtasia_res is not None:
 								            return camtasia_res
-												[generic] Add comment for unescaping webpage contents

											
										
										
											11 years ago
+								        # Sometimes embedded video player is hidden behind percent encoding
 								        # (e.g. https://github.com/rg3/youtube-dl/issues/2448)
 								        # Unescaping the whole page allows to handle those cases in a generic way
-												Generic: use compat_urllib_parse_unquote to prevent utf8 mangling
of the entire page in python 2.

-requires- fixed compat_urllib_parse_unquote

example - the following will save with a mangled playlist title,
 instead of the kanji for 'tsunami'. This affects all utf8encoded
 urls as well

youtube-dl -f18 -o '%(playlist_title)s-%(title)s.%(ext)s' \
  https://gist.githubusercontent.com/atomicdryad/fcb97465e6060fc519e1/raw/61c14c1e3a4985471dcf56c281d24d7e781a4e0e/tsunami.html

											
										
										
											10 years ago
+								        webpage = compat_urllib_parse_unquote(webpage)
-												[generic] Unescape webpage contents
											
										
										
											11 years ago
-												Support multiple embedded YouTube URLs (Fixes #1787)

											
										
										
											11 years ago
+								        # it's tempting to parse this further, but you would
 								        # have to take into account all the variations like
 								        #   Video Title - Site Name
 								        #   Site Name | Video Title
 								        #   Video Title - Tagline | Site Name
 								        # and so on and so forth; it's just not practical
-												[extractor/generic] Improve 3qsdn embeds support (Closes #9453)

											
										
										
											9 years ago
+								        video_title = self._og_search_title(
 								            webpage, default=None) or self._html_search_regex(
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								            r'(?s)<title>(.*?)</title>', webpage, 'video title',
 								            default='video')
-												[wistia] Add extractor

											
										
										
											11 years ago
-												[generic] Automatic detection of flow player and age_limit (Fixes #3576)

											
										
										
											10 years ago
+								        # Try to detect age limit automatically
 								        age_limit = self._rta_search(webpage)
 								        # And then there are the jokers who advertise that they use RTA,
 								        # but actually don't.
 								        AGE_LIMIT_MARKERS = [
-												Fix some regexes

											
										
										
											7 years ago
+								            r'Proudly Labeled <a href="http://www\.rtalabel\.org/" title="Restricted to Adults">RTA</a>',
-												[generic] Automatic detection of flow player and age_limit (Fixes #3576)

											
										
										
											10 years ago
+								        ]
 								        if any(re.search(marker, webpage) for marker in AGE_LIMIT_MARKERS):
 								            age_limit = 18
-												[wistia] Add extractor

											
										
										
											11 years ago
+								        # video uploader is domain name
 								        video_uploader = self._search_regex(
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								            r'^(?:https?://)?([^/]*)/.*', url, 'video uploader')
-												Support multiple embedded YouTube URLs (Fixes #1787)

											
										
										
											11 years ago
-												[extractor/generic] Improve 3qsdn embeds support (Closes #9453)

											
										
										
											9 years ago
+								        video_description = self._og_search_description(webpage, default=None)
 								        video_thumbnail = self._og_search_thumbnail(webpage, default=None)
-												[generic] Extract more generic metadata (closes #13527)

											
										
										
											8 years ago
+								        info_dict.update({
 								            'title': video_title,
 								            'description': video_description,
 								            'thumbnail': video_thumbnail,
 								            'age_limit': age_limit,
 								        })
-												[generic] Clarify Brightcove Legacy Studio comment

											
										
										
											9 years ago
+								        # Look for Brightcove Legacy Studio embeds
-												[brightcove] Rename extractor to brightcove legacy

Old embedding approaches are now "Legacy Studio"

											
										
										
											9 years ago
+								        bc_urls = BrightcoveLegacyIE._extract_brightcove_urls(webpage)
-												[generic] Add support for multiple brightcove URLs (Fixes #2283)

											
										
										
											11 years ago
+								        if bc_urls:
 								            entries = [{
 								                '_type': 'url',
 								                'url': smuggle_url(bc_url, {'Referer': url}),
-												Rename all references to legacy studio Brightcove extractor

											
										
										
											9 years ago
+								                'ie_key': 'BrightcoveLegacy'
-												[generic] Add support for multiple brightcove URLs (Fixes #2283)

											
										
										
											11 years ago
+								            } for bc_url in bc_urls]
 								            return {
 								                '_type': 'playlist',
 								                'title': video_title,
 								                'id': video_id,
 								                'entries': entries,
 								            }
-												GenericIE: Detect videos from Brightcove

Brightcove videos info is usually found in an <object class="BrightcoveExperience"></object> node, this is passed to a new method of BrightcoveIE that builds a url to extract the video.

											
										
										
											12 years ago
-												[generic] Extract Brightcove New Studio embeds

											
										
										
											9 years ago
+								        # Look for Brightcove New Studio embeds
-												[brightcove] Validate ambiguous embeds' URLs (closes #9163, closes #12005, closes #12178, closes #12480)

											
										
										
											8 years ago
+								        bc_urls = BrightcoveNewIE._extract_urls(self, webpage)
-												[generic] Extract Brightcove New Studio embeds

											
										
										
											9 years ago
+								        if bc_urls:
-												[brightcove] Pass embed page URL as referrer (closes #15486)

											
										
										
											7 years ago
+								            return self.playlist_from_matches(
 								                bc_urls, video_id, video_title,
 								                getter=lambda x: smuggle_url(x, {'referrer': url}),
 								                ie='BrightcoveNew')
-												[brightcove] add support for brightcove in page embed(fixes #6824)

											
										
										
											9 years ago
-												[nexx] Add extractor (closes #10807, closes #13465)

											
										
										
											8 years ago
+								        # Look for Nexx embeds
 								        nexx_urls = NexxIE._extract_urls(webpage)
 								        if nexx_urls:
 								            return self.playlist_from_matches(nexx_urls, video_id, video_title, ie=NexxIE.ie_key())
-												[nexx:embed] Add extractor for iframe embeds

											
										
										
											8 years ago
+								        # Look for Nexx iFrame embeds
 								        nexx_embed_urls = NexxEmbedIE._extract_urls(webpage)
 								        if nexx_embed_urls:
 								            return self.playlist_from_matches(nexx_embed_urls, video_id, video_title, ie=NexxEmbedIE.ie_key())
-												[extractor/generic] Add support for theplatform embeds (Closes #8636, closes #9476)

											
										
										
											9 years ago
+								        # Look for ThePlatform embeds
 								        tp_urls = ThePlatformIE._extract_urls(webpage)
 								        if tp_urls:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								            return self.playlist_from_matches(tp_urls, video_id, video_title, ie='ThePlatform')
-												[extractor/generic] Add support for theplatform embeds (Closes #8636, closes #9476)

											
										
										
											9 years ago
-												[extractor/generic] Add support for vessel embeds (Closes #7083)

											
										
										
											9 years ago
+								        # Look for Vessel embeds
 								        vessel_urls = VesselIE._extract_urls(webpage)
 								        if vessel_urls:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								            return self.playlist_from_matches(vessel_urls, video_id, video_title, ie=VesselIE.ie_key())
-												[extractor/generic] Add support for vessel embeds (Closes #7083)

											
										
										
											9 years ago
-												[rtlnl|generic] Add support for rtl.nl embeds (Fixes #4959)

											
										
										
											10 years ago
+								        # Look for embedded rtl.nl player
 								        matches = re.findall(
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								            r'<iframe[^>]+?src="((?:https?:)?//(?:(?:www|static)\.)?rtl\.nl/(?:system/videoplayer/[^"]+(?:video_)?)?embed[^"]+)"',
-												[rtlnl|generic] Add support for rtl.nl embeds (Fixes #4959)

											
										
										
											10 years ago
+								            webpage)
 								        if matches:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								            return self.playlist_from_matches(matches, video_id, video_title, ie='RtlNl')
-												[rtlnl|generic] Add support for rtl.nl embeds (Fixes #4959)

											
										
										
											10 years ago
-												[generic] Add support for multiple vimeo embeds (Closes #10862)

											
										
										
											8 years ago
+								        vimeo_urls = VimeoIE._extract_urls(url, webpage)
 								        if vimeo_urls:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								            return self.playlist_from_matches(vimeo_urls, video_id, video_title, ie=VimeoIE.ie_key())
-												[vimeo/generic] Add support for embedded SWF vimeo videos

											
										
										
											11 years ago
-												[extractor/generic] Support vid.me embeds

											
										
										
											10 years ago
+								        vid_me_embed_url = self._search_regex(
 								            r'src=[\'"](https?://vid\.me/[^\'"]+)[\'"]',
 								            webpage, 'vid.me embed', default=None)
 								        if vid_me_embed_url is not None:
 								            return self.url_result(vid_me_embed_url, 'Vidme')
-												[youtube] Separate methods for embeds extraction

											
										
										
											7 years ago
+								        # Look for YouTube embeds
 								        youtube_urls = YoutubeIE._extract_urls(webpage)
 								        if youtube_urls:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								            return self.playlist_from_matches(
-												[youtube] Separate methods for embeds extraction

											
										
										
											7 years ago
+								                youtube_urls, video_id, video_title, ie=YoutubeIE.ie_key())
-												[generic] Support Wordpress "YouTube Video Importer" plugin

Closes #9938

											
										
										
											9 years ago
-												[francetv] Recognize more Dailymotion embedded videos

Closes #9955

											
										
										
											9 years ago
+								        matches = DailymotionIE._extract_urls(webpage)
-												[generic] Find embedded dailymotion videos (Fixes #1848)

											
										
										
											11 years ago
+								        if matches:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								            return self.playlist_from_matches(matches, video_id, video_title)
-												[generic] Find embedded dailymotion videos (Fixes #1848)

											
										
										
											11 years ago
-												[generic] Support embedded Dailymotion playlists (fixes #3822)

											
										
										
											10 years ago
+								        # Look for embedded Dailymotion playlist player (#3822)
 								        m = re.search(
 								            r'<iframe[^>]+?src=(["\'])(?P<url>(?:https?:)?//(?:www\.)?dailymotion\.[a-z]{2,3}/widget/jukebox\?.+?)\1', webpage)
 								        if m:
 								            playlists = re.findall(
 								                r'list\[\]=/playlist/([^/]+)/', unescapeHTML(m.group('url')))
 								            if playlists:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								                return self.playlist_from_matches(
 								                    playlists, video_id, video_title, lambda p: '//dailymotion.com/playlist/%s' % p)
-												[generic] Support embedded Dailymotion playlists (fixes #3822)

											
										
										
											10 years ago
-												[dailymail] Add support for embeds

											
										
										
											8 years ago
+								        # Look for DailyMail embeds
 								        dailymail_urls = DailyMailIE._extract_urls(webpage)
 								        if dailymail_urls:
 								            return self.playlist_from_matches(
 								                dailymail_urls, video_id, video_title, ie=DailyMailIE.ie_key())
-												[wistia] Add extractor

											
										
										
											11 years ago
+								        # Look for embedded Wistia player
-												[extractor/generic] Extract wistia embed code into separate method

											
										
										
											8 years ago
+								        wistia_url = WistiaIE._extract_url(webpage)
 								        if wistia_url:
-												[wistia] Add extractor

											
										
										
											11 years ago
+								            return {
 								                '_type': 'url_transparent',
-												[extractor/generic] Extract wistia embed code into separate method

											
										
										
											8 years ago
+								                'url': self._proto_relative_url(wistia_url),
 								                'ie_key': WistiaIE.ie_key(),
-												[wistia] Add extractor

											
										
										
											11 years ago
+								                'uploader': video_uploader,
 								            }
-												PEP8 applied

											
										
										
											10 years ago
-												[extractor/generic] Add support for svt embeds (Closes #5622)

											
										
										
											10 years ago
+								        # Look for SVT player
 								        svt_url = SVTIE._extract_url(webpage)
 								        if svt_url:
 								            return self.url_result(svt_url, 'SVT')
-												[generic] Detect bandcamp pages that use custom domains (closes #1662)

They embed the original url in the 'og:url' property.

											
										
										
											11 years ago
+								        # Look for Bandcamp pages with custom domain
 								        mobj = re.search(r'<meta property="og:url"[^>]*?content="(.*?bandcamp\.com.*?)"', webpage)
 								        if mobj is not None:
 								            burl = unescapeHTML(mobj.group(1))
-												[bandcamp] add support for albums (reported in #1270)

											
										
										
											11 years ago
+								            # Don't set the extractor because it can be a track url or an album
 								            return self.url_result(burl)
-												[generic] Detect bandcamp pages that use custom domains (closes #1662)

They embed the original url in the 'og:url' property.

											
										
										
											11 years ago
-												Add support for embedded vevo player (Fixes #1957)

											
										
										
											11 years ago
+								        # Look for embedded Vevo player
 								        mobj = re.search(
 								            r'<iframe[^>]+?src=(["\'])(?P<url>(?:https?:)?//(?:cache\.)?vevo\.com/.+?)\1', webpage)
 								        if mobj is not None:
 								            return self.url_result(mobj.group('url'))
-												fixed viddler support - needed a Referer header; also added a viddler
generic extractor

											
										
										
											10 years ago
 								        # Look for embedded Viddler player
-												[generic] Improve some regexes

											
										
										
											10 years ago
+								        mobj = re.search(
 								            r'<(?:iframe[^>]+?src|param[^>]+?value)=(["\'])(?P<url>(?:https?:)?//(?:www\.)?viddler\.com/(?:embed|player)/.+?)\1',
 								            webpage)
-												fixed viddler support - needed a Referer header; also added a viddler
generic extractor

											
										
										
											10 years ago
+								        if mobj is not None:
 								            return self.url_result(mobj.group('url'))
-												Add support for embedded vevo player (Fixes #1957)

											
										
										
											11 years ago
-												[generic] Add support for nytimes embeds (Closes #5234)

											
										
										
											10 years ago
+								        # Look for NYTimes player
 								        mobj = re.search(
 								            r'<iframe[^>]+src=(["\'])(?P<url>(?:https?:)?//graphics8\.nytimes\.com/bcvideo/[^/]+/iframe/embed\.html.+?)\1>',
 								            webpage)
 								        if mobj is not None:
 								            return self.url_result(mobj.group('url'))
-												[extractor/generic] Support Libsyn embeds

											
										
										
											10 years ago
+								        # Look for Libsyn player
 								        mobj = re.search(
 								            r'<iframe[^>]+src=(["\'])(?P<url>(?:https?:)?//html5-player\.libsyn\.com/embed/.+?)\1', webpage)
 								        if mobj is not None:
 								            return self.url_result(mobj.group('url'))
-												[generic] Detect ooyala videos (fixes #2013)

											
										
										
											11 years ago
+								        # Look for Ooyala videos
-												[extractor/generic] Expand ooyala regex (Closes #6485)

											
										
										
											10 years ago
+								        mobj = (re.search(r'player\.ooyala\.com/[^"?]+[?#][^"]*?(?:embedCode|ec)=(?P<ec>[^"&]+)', webpage) or
-												[generic/ooyala] Add support for Ooyala embeds on SBN network websites (Fixes #4859)

											
										
										
											10 years ago
+								                re.search(r'OO\.Player\.create\([\'"].*?[\'"],\s*[\'"](?P<ec>.{32})[\'"]', webpage) or
-												[generic] Add support for another ooyala embed pattern (closes #13727)


											
										
										
											8 years ago
+								                re.search(r'OO\.Player\.create\.apply\(\s*OO\.Player\s*,\s*op\(\s*\[\s*[\'"][^\'"]*[\'"]\s*,\s*[\'"](?P<ec>.{32})[\'"]', webpage) or
-												[generic] Support another type of Ooyala embedded video

											
										
										
											10 years ago
+								                re.search(r'SBN\.VideoLinkset\.ooyala\([\'"](?P<ec>.{32})[\'"]\)', webpage) or
 								                re.search(r'data-ooyala-video-id\s*=\s*[\'"](?P<ec>.{32})[\'"]', webpage))
-												[generic] Detect ooyala videos (fixes #2013)

											
										
										
											11 years ago
+								        if mobj is not None:
-												[ooyala] add support for videos with embedToken(#11684)

											
										
										
											8 years ago
+								            embed_token = self._search_regex(
 								                r'embedToken[\'"]?\s*:\s*[\'"]([^\'"]+)',
 								                webpage, 'ooyala embed token', default=None)
 								            return OoyalaIE._build_url_result(smuggle_url(
 								                mobj.group('ec'), {
 								                    'domain': url,
 								                    'embed_token': embed_token,
 								                }))
-												[generic] Detect ooyala videos (fixes #2013)

											
										
										
											11 years ago
-												[generic/ooyala] Add support for Ooyala embeds on SBN network websites (Fixes #4859)

											
										
										
											10 years ago
+								        # Look for multiple Ooyala embeds on SBN network websites
 								        mobj = re.search(r'SBN\.VideoLinkset\.entryGroup\((\[.*?\])', webpage)
 								        if mobj is not None:
 								            embeds = self._parse_json(mobj.group(1), video_id, fatal=False)
 								            if embeds:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								                return self.playlist_from_matches(
 								                    embeds, video_id, video_title,
 								                    getter=lambda v: OoyalaIE._url_for_embed_code(smuggle_url(v['provider_video_id'], {'domain': url})), ie='Ooyala')
-												[generic/ooyala] Add support for Ooyala embeds on SBN network websites (Fixes #4859)

											
										
										
											10 years ago
-												[aparat] Add support (Fixes #2012)

											
										
										
											11 years ago
+								        # Look for Aparat videos
-												[generic] Be more relaxed when looking for aparat embeds (Fixes #2784)

											
										
										
											11 years ago
+								        mobj = re.search(r'<iframe .*?src="(http://www\.aparat\.com/video/[^"]+)"', webpage)
-												[aparat] Add support (Fixes #2012)

											
										
										
											11 years ago
+								        if mobj is not None:
 								            return self.url_result(mobj.group(1), 'Aparat')
-												[mpora] Add support (Fixes #2096)

											
										
										
											11 years ago
+								        # Look for MPORA videos
-												Improve some regexes for embedded players
											
										
										
											11 years ago
+								        mobj = re.search(r'<iframe .*?src="(http://mpora\.(?:com|de)/videos/[^"]+)"', webpage)
-												[mpora] Add support (Fixes #2096)

											
										
										
											11 years ago
+								        if mobj is not None:
 								            return self.url_result(mobj.group(1), 'Mpora')
-												[novamov] Remove superfluous tabs
											
										
										
											11 years ago
-												[generic] Generalize novamov based embeds

											
										
										
											11 years ago
+								        # Look for embedded NovaMov-based player
-												[novamov] Add embedded player support

											
										
										
											11 years ago
+								        mobj = re.search(
-												[generic] Support pagespeed_iframe for NovaMov embeds

											
										
										
											11 years ago
+								            r'''(?x)<(?:pagespeed_)?iframe[^>]+?src=(["\'])
-												[generic] Generalize novamov based embeds

											
										
										
											11 years ago
+								                    (?P<url>http://(?:(?:embed|www)\.)?
 								                        (?:novamov\.com|
 								                           nowvideo\.(?:ch|sx|eu|at|ag|co)|
 								                           videoweed\.(?:es|com)|
 								                           movshare\.(?:net|sx|ag)|
 								                           divxstage\.(?:eu|net|ch|co|at|ag))
 								                        /embed\.php.+?)\1''', webpage)
-												[novamov] Add embedded player support

											
										
										
											11 years ago
+								        if mobj is not None:
-												[generic] Generalize novamov based embeds

											
										
										
											11 years ago
+								            return self.url_result(mobj.group('url'))
-												[generic] Add support for videoweed embeds

											
										
										
											11 years ago
-												[facebook] Add support for embeds

Example URL: http://www.hostblogger.de/blog/archives/6181-Auto-jagt-Betonmischer.html

											
										
										
											11 years ago
+								        # Look for embedded Facebook player
-												[facebook] Add support for plugin video embeds and multiple embeds (closes #13493)

											
										
										
											8 years ago
+								        facebook_urls = FacebookIE._extract_urls(webpage)
 								        if facebook_urls:
 								            return self.playlist_from_matches(facebook_urls, video_id, video_title)
-												[facebook] Add support for embeds

Example URL: http://www.hostblogger.de/blog/archives/6181-Auto-jagt-Betonmischer.html

											
										
										
											11 years ago
-												[vk] Add support for embedded videos (Closes #2473)
											
										
										
											11 years ago
+								        # Look for embedded VK player
 								        mobj = re.search(r'<iframe[^>]+?src=(["\'])(?P<url>https?://vk\.com/video_ext\.php.+?)\1', webpage)
 								        if mobj is not None:
 								            return self.url_result(mobj.group('url'), 'VK')
-												[extractor/generic] Add support for ok embeds (#8619)

											
										
										
											9 years ago
+								        # Look for embedded Odnoklassniki player
 								        mobj = re.search(r'<iframe[^>]+?src=(["\'])(?P<url>https?://(?:odnoklassniki|ok)\.ru/videoembed/.+?)\1', webpage)
 								        if mobj is not None:
 								            return self.url_result(mobj.group('url'), 'Odnoklassniki')
-												[generic] Add support for ivi.ru embedded player

											
										
										
											11 years ago
+								        # Look for embedded ivi player
 								        mobj = re.search(r'<embed[^>]+?src=(["\'])(?P<url>https?://(?:www\.)?ivi\.ru/video/player.+?)\1', webpage)
 								        if mobj is not None:
 								            return self.url_result(mobj.group('url'), 'Ivi')
-												[huffpost] Add support

											
										
										
											11 years ago
+								        # Look for embedded Huffington Post player
 								        mobj = re.search(
-												Improve some regexes for embedded players
											
										
										
											11 years ago
+								            r'<iframe[^>]+?src=(["\'])(?P<url>https?://embed\.live\.huffingtonpost\.com/.+?)\1', webpage)
-												[huffpost] Add support

											
										
										
											11 years ago
+								        if mobj is not None:
 								            return self.url_result(mobj.group('url'), 'HuffPost')
-												Add support for embed.ly

											
										
										
											11 years ago
+								        # Look for embed.ly
 								        mobj = re.search(r'class=["\']embedly-card["\'][^>]href=["\'](?P<url>[^"\']+)', webpage)
 								        if mobj is not None:
 								            return self.url_result(mobj.group('url'))
 								        mobj = re.search(r'class=["\']embedly-embed["\'][^>]src=["\'][^"\']*url=(?P<url>[^&]+)', webpage)
 								        if mobj is not None:
-												[extractor/generic] Use compat_urllib_parse_unquote

											
										
										
											10 years ago
+								            return self.url_result(compat_urllib_parse_unquote(mobj.group('url')))
-												Add support for embed.ly

											
										
										
											11 years ago
-												[generic/funnyordie] Add support for funnyordie embeds (Fixes #2546)

											
										
										
											11 years ago
+								        # Look for funnyordie embed
 								        matches = re.findall(r'<iframe[^>]+?src="(https?://(?:www\.)?funnyordie\.com/embed/[^"]+)"', webpage)
 								        if matches:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								            return self.playlist_from_matches(
 								                matches, video_id, video_title, getter=unescapeHTML, ie='FunnyOrDie')
-												[generic/funnyordie] Add support for funnyordie embeds (Fixes #2546)

											
										
										
											11 years ago
-												[generic] Add support for BBC iPlayer embeds (Closes #4619)

											
										
										
											10 years ago
+								        # Look for BBC iPlayer embed
 								        matches = re.findall(r'setPlaylist\("(https?://www\.bbc\.co\.uk/iplayer/[^/]+/[\da-z]{8})"\)', webpage)
 								        if matches:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								            return self.playlist_from_matches(matches, video_id, video_title, ie='BBCCoUk')
-												[generic] Add support for BBC iPlayer embeds (Closes #4619)

											
										
										
											10 years ago
-												[generic] Add support for embedded rutv player

											
										
										
											11 years ago
+								        # Look for embedded RUTV player
 								        rutv_url = RUTVIE._extract_url(webpage)
 								        if rutv_url:
 								            return self.url_result(rutv_url, 'RUTV')
-												[extractor/generic] Add support for tvc embeds

											
										
										
											10 years ago
+								        # Look for embedded TVC player
-												[extractor/generic] Rename tvc embed url variable

											
										
										
											10 years ago
+								        tvc_url = TVCIE._extract_url(webpage)
 								        if tvc_url:
 								            return self.url_result(tvc_url, 'TVC')
-												[extractor/generic] Add support for tvc embeds

											
										
										
											10 years ago
-												[generic] Add support for sportbox embeds

											
										
										
											10 years ago
+								        # Look for embedded SportBox player
 								        sportbox_urls = SportBoxEmbedIE._extract_urls(webpage)
 								        if sportbox_urls:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								            return self.playlist_from_matches(sportbox_urls, video_id, video_title, ie='SportBoxEmbed')
-												[generic] Add support for sportbox embeds

											
										
										
											10 years ago
-												[generic] Add support for xhamster embeds

											
										
										
											10 years ago
+								        # Look for embedded XHamster player
 								        xhamster_urls = XHamsterEmbedIE._extract_urls(webpage)
 								        if xhamster_urls:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								            return self.playlist_from_matches(xhamster_urls, video_id, video_title, ie='XHamsterEmbed')
-												[generic] Add support for xhamster embeds

											
										
										
											10 years ago
-												[extractor/generic] Add support for tnaflix network embeds (Closes #7505)

											
										
										
											9 years ago
+								        # Look for embedded TNAFlixNetwork player
 								        tnaflix_urls = TNAFlixNetworkEmbedIE._extract_urls(webpage)
 								        if tnaflix_urls:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								            return self.playlist_from_matches(tnaflix_urls, video_id, video_title, ie=TNAFlixNetworkEmbedIE.ie_key())
-												[extractor/generic] Add support for tnaflix network embeds (Closes #7505)

											
										
										
											9 years ago
-												[extractor/generic] Improve support for pornhub embeds (closes #11100)

											
										
										
											8 years ago
+								        # Look for embedded PornHub player
 								        pornhub_urls = PornHubIE._extract_urls(webpage)
 								        if pornhub_urls:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								            return self.playlist_from_matches(pornhub_urls, video_id, video_title, ie=PornHubIE.ie_key())
-												[extractor/generic] Improve support for pornhub embeds (closes #11100)

											
										
										
											8 years ago
-												[extractor/generic] Add support for drtuber embeds (closes #11098)

											
										
										
											8 years ago
+								        # Look for embedded DrTuber player
 								        drtuber_urls = DrTuberIE._extract_urls(webpage)
 								        if drtuber_urls:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								            return self.playlist_from_matches(drtuber_urls, video_id, video_title, ie=DrTuberIE.ie_key())
-												[extractor/generic] Add support for drtuber embeds (closes #11098)

											
										
										
											8 years ago
-												[extractor/generic] Add support for redtube embeds (closes #11099)

											
										
										
											8 years ago
+								        # Look for embedded RedTube player
 								        redtube_urls = RedTubeIE._extract_urls(webpage)
 								        if redtube_urls:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								            return self.playlist_from_matches(redtube_urls, video_id, video_title, ie=RedTubeIE.ie_key())
-												[extractor/generic] Add support for redtube embeds (closes #11099)

											
										
										
											8 years ago
-												[generic] Add support for tube8 embeds

											
										
										
											7 years ago
+								        # Look for embedded Tube8 player
 								        tube8_urls = Tube8IE._extract_urls(webpage)
 								        if tube8_urls:
 								            return self.playlist_from_matches(tube8_urls, video_id, video_title, ie=Tube8IE.ie_key())
-												[extractor/generic] Add support for tvigle embeds

											
										
										
											10 years ago
+								        # Look for embedded Tvigle player
 								        mobj = re.search(
 								            r'<iframe[^>]+?src=(["\'])(?P<url>(?:https?:)?//cloud\.tvigle\.ru/video/.+?)\1', webpage)
 								        if mobj is not None:
 								            return self.url_result(mobj.group('url'), 'Tvigle')
-												[generic] Run TED detection before JW Player detection

Otherwise it overwrites the `mobj` variable.

											
										
										
											11 years ago
+								        # Look for embedded TED player
 								        mobj = re.search(
-												[generic] PEP8

											
										
										
											10 years ago
+								            r'<iframe[^>]+?src=(["\'])(?P<url>https?://embed(?:-ssl)?\.ted\.com/.+?)\1', webpage)
-												[generic] Run TED detection before JW Player detection

Otherwise it overwrites the `mobj` variable.

											
										
										
											11 years ago
+								        if mobj is not None:
 								            return self.url_result(mobj.group('url'), 'TED')
-												[UstreamIE] [generic] Added support for Ustream embed URLs (Fixes #2694)

											
										
										
											11 years ago
+								        # Look for embedded Ustream videos
-												[ustream] Add UstreamIE._extract_url()

Ref: #11547

											
										
										
											8 years ago
+								        ustream_url = UstreamIE._extract_url(webpage)
 								        if ustream_url:
 								            return self.url_result(ustream_url, UstreamIE.ie_key())
-												[UstreamIE] [generic] Added support for Ustream embed URLs (Fixes #2694)

											
										
										
											11 years ago
-												[arte] Add support for embedded videos (Fixes #2620)

											
										
										
											11 years ago
+								        # Look for embedded arte.tv player
 								        mobj = re.search(
-												[arte.tv:embed] Extended support (#2620)

											
										
										
											9 years ago
+								            r'<(?:script|iframe) [^>]*?src="(?P<url>http://www\.arte\.tv/(?:playerv2/embed|arte_vp/index)[^"]+)"',
-												[arte] Add support for embedded videos (Fixes #2620)

											
										
										
											11 years ago
+								            webpage)
 								        if mobj is not None:
 								            return self.url_result(mobj.group('url'), 'ArteTVEmbed')
-												[extractor/generic] Add support for francetv embeds

											
										
										
											10 years ago
+								        # Look for embedded francetv player
 								        mobj = re.search(
 								            r'<iframe[^>]+?src=(["\'])(?P<url>(?:https?://)?embed\.francetv\.fr/\?ue=.+?)\1',
 								            webpage)
 								        if mobj is not None:
 								            return self.url_result(mobj.group('url'))
-												[smotri] Modernize and add support for embedded videos (Closes #2585)

											
										
										
											11 years ago
+								        # Look for embedded smotri.com player
 								        smotri_url = SmotriIE._extract_url(webpage)
 								        if smotri_url:
 								            return self.url_result(smotri_url, 'Smotri')
-												[extractor/generic:myvi] Add support for myvi embeds

											
										
										
											10 years ago
+								        # Look for embedded Myvi.ru player
-												[myvi:embed] Rename to myvi

											
										
										
											10 years ago
+								        myvi_url = MyviIE._extract_url(webpage)
-												[extractor/generic:myvi] Add support for myvi embeds

											
										
										
											10 years ago
+								        if myvi_url:
 								            return self.url_result(myvi_url)
-												Fix typos

Closes #8200.

											
										
										
											9 years ago
+								        # Look for embedded soundcloud player
-												[extractor/generic] Extract all soundcloud embeds (Closes #10179)

											
										
										
											9 years ago
+								        soundcloud_urls = SoundcloudIE._extract_urls(webpage)
 								        if soundcloud_urls:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								            return self.playlist_from_matches(soundcloud_urls, video_id, video_title, getter=unescapeHTML, ie=SoundcloudIE.ie_key())
-												[soundcloud/generic] Add support for playlists

											
										
										
											11 years ago
-												[tunein] Add support for embeds (closes #11579)

											
										
										
											8 years ago
+								        # Look for tunein player
 								        tunein_urls = TuneInBaseIE._extract_urls(webpage)
 								        if tunein_urls:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								            return self.playlist_from_matches(tunein_urls, video_id, video_title)
-												[tunein] Add support for embeds (closes #11579)

											
										
										
											8 years ago
-												[generic] Extract mtvservices embedded videos

											
										
										
											11 years ago
+								        # Look for embedded mtvservices player
-												[extractor/generic] Use _extract_url for mtvservices

											
										
										
											9 years ago
+								        mtvservices_url = MTVServicesEmbeddedIE._extract_url(webpage)
 								        if mtvservices_url:
 								            return self.url_result(mtvservices_url, ie='MTVServicesEmbedded')
-												[generic] Extract mtvservices embedded videos

											
										
										
											11 years ago
-												[yahoo] Add support for embedded videos (Closes #3525)

											
										
										
											11 years ago
+								        # Look for embedded yahoo player
 								        mobj = re.search(
 								            r'<iframe[^>]+?src=(["\'])(?P<url>https?://(?:screen|movies)\.yahoo\.com/.+?\.html\?format=embed)\1',
 								            webpage)
 								        if mobj is not None:
 								            return self.url_result(mobj.group('url'), 'Yahoo')
-												[sbs] Add new extractor (Fixes #3566)

											
										
										
											10 years ago
+								        # Look for embedded sbs.com.au player
 								        mobj = re.search(
-												[generic] Improve SBS detection (Fixes #4899)

											
										
										
											10 years ago
+								            r'''(?x)
 								            (?:
 								                <meta\s+property="og:video"\s+content=|
 								                <iframe[^>]+?src=
 								            )
 								            (["\'])(?P<url>https?://(?:www\.)?sbs\.com\.au/ondemand/video/.+?)\1''',
-												[sbs] Add new extractor (Fixes #3566)

											
										
										
											10 years ago
+								            webpage)
 								        if mobj is not None:
 								            return self.url_result(mobj.group('url'), 'SBS')
-												[cinchcast] Add new extractor (Fixes #4428)

											
										
										
											10 years ago
+								        # Look for embedded Cinchcast player
 								        mobj = re.search(
 								            r'<iframe[^>]+?src=(["\'])(?P<url>https?://player\.cinchcast\.com/.+?)\1',
 								            webpage)
 								        if mobj is not None:
 								            return self.url_result(mobj.group('url'), 'Cinchcast')
-												[mlb] Add support for embedded videos (Closes #3653)

											
										
										
											10 years ago
+								        mobj = re.search(
-												[generic] Improve MLB iframe regex

											
										
										
											10 years ago
+								            r'<iframe[^>]+?src=(["\'])(?P<url>https?://m(?:lb)?\.mlb\.com/shared/video/embed/embed\.html\?.+?)\1',
-												[mlb] Add support for embedded videos (Closes #3653)

											
										
										
											10 years ago
+								            webpage)
-												[generic] Detect more MLB videos (fixes #5443)

											
										
										
											10 years ago
+								        if not mobj:
 								            mobj = re.search(
 								                r'data-video-link=["\'](?P<url>http://m.mlb.com/video/[^"\']+)',
 								                webpage)
-												[mlb] Add support for embedded videos (Closes #3653)

											
										
										
											10 years ago
+								        if mobj is not None:
 								            return self.url_result(mobj.group('url'), 'MLB')
-												[condenast] Add support for embedded videos (Closes #3929)

											
										
										
											10 years ago
+								        mobj = re.search(
-												[extractor/generic] Add support for condenast script embeds (Closes #6885, closes #6991)

											
										
										
											9 years ago
+								            r'<(?:iframe|script)[^>]+?src=(["\'])(?P<url>%s)\1' % CondeNastIE.EMBED_URL,
-												[condenast] Add support for embedded videos (Closes #3929)

											
										
										
											10 years ago
+								            webpage)
 								        if mobj is not None:
 								            return self.url_result(self._proto_relative_url(mobj.group('url'), scheme='http:'), 'CondeNast')
-												[generic] Add support for livestream embeds (Fixes #4185)

											
										
										
											10 years ago
+								        mobj = re.search(
-												[generic] Improve Livestream detection (closes #2234)

											
										
										
											9 years ago
+								            r'<iframe[^>]+src="(?P<url>https?://(?:new\.)?livestream\.com/[^"]+/player[^"]+)"',
-												[generic] Add support for livestream embeds (Fixes #4185)

											
										
										
											10 years ago
+								            webpage)
 								        if mobj is not None:
 								            return self.url_result(mobj.group('url'), 'Livestream')
-												[generic] Add support for Zapiks embeds (#5014)

											
										
										
											10 years ago
+								        # Look for Zapiks embed
 								        mobj = re.search(
 								            r'<iframe[^>]+src="(?P<url>https?://(?:www\.)?zapiks\.fr/index\.php\?.+?)"', webpage)
 								        if mobj is not None:
 								            return self.url_result(mobj.group('url'), 'Zapiks')
-												[generic] Support dynamic Kaltura embeds (#5016) (#5073)

											
										
										
											10 years ago
+								        # Look for Kaltura embeds
-												[extractor/generic] Use _extract_url for kaltura embeds (Closes #9922)

											
										
										
											9 years ago
+								        kaltura_url = KalturaIE._extract_url(webpage)
 								        if kaltura_url:
 								            return self.url_result(smuggle_url(kaltura_url, {'source_url': url}), KalturaIE.ie_key())
-												[generic] Support dynamic Kaltura embeds (#5016) (#5073)

											
										
										
											10 years ago
-												[eagleplatform] Add support for referrer protected videos (closes #13557)

											
										
										
											8 years ago
+								        # Look for EaglePlatform embeds
-												[eagleplatform] Improve embed detection and extract in separate routine (Closes #9926)

											
										
										
											9 years ago
+								        eagleplatform_url = EaglePlatformIE._extract_url(webpage)
 								        if eagleplatform_url:
-												[eagleplatform] Add support for referrer protected videos (closes #13557)

											
										
										
											8 years ago
+								            return self.url_result(smuggle_url(eagleplatform_url, {'referrer': url}), EaglePlatformIE.ie_key())
-												[eagleplatform] Add support for embeds

											
										
										
											10 years ago
-												[eagleplatform] Add support for referrer protected videos (closes #13557)

											
										
										
											8 years ago
+								        # Look for ClipYou (uses EaglePlatform) embeds
-												[eagleplatform] Add support for ClipYou embeds

											
										
										
											10 years ago
+								        mobj = re.search(
 								            r'<iframe[^>]+src="https?://(?P<host>media\.clipyou\.ru)/index/player\?.*\brecord_id=(?P<id>\d+).*"', webpage)
 								        if mobj is not None:
 								            return self.url_result('eagleplatform:%(host)s:%(id)s' % mobj.groupdict(), 'EaglePlatform')
-												[pladform] Add support for embeds

											
										
										
											10 years ago
+								        # Look for Pladform embeds
-												[extractor/generic] Use _extract_url for pladform

											
										
										
											9 years ago
+								        pladform_url = PladformIE._extract_url(webpage)
 								        if pladform_url:
 								            return self.url_result(pladform_url)
-												[pladform] Add support for embeds

											
										
										
											10 years ago
-												[extractor/generic] Add support for videomore embeds

											
										
										
											9 years ago
+								        # Look for Videomore embeds
 								        videomore_url = VideomoreIE._extract_url(webpage)
 								        if videomore_url:
 								            return self.url_result(videomore_url)
-												[extractor/generic] Add support for webcaster.pro embeds

											
										
										
											8 years ago
+								        # Look for Webcaster embeds
 								        webcaster_url = WebcasterFeedIE._extract_url(self, webpage)
 								        if webcaster_url:
 								            return self.url_result(webcaster_url, ie=WebcasterFeedIE.ie_key())
-												[generic] Add support for playwire embeds (Closes #5430)

											
										
										
											10 years ago
+								        # Look for Playwire embeds
 								        mobj = re.search(
 								            r'<script[^>]+data-config=(["\'])(?P<url>(?:https?:)?//config\.playwire\.com/.+?)\1', webpage)
 								        if mobj is not None:
 								            return self.url_result(mobj.group('url'))
-												[generic] Add support for 5min embeds (#5310)

											
										
										
											10 years ago
+								        # Look for 5min embeds
 								        mobj = re.search(
 								            r'<meta[^>]+property="og:video"[^>]+content="https?://embed\.5min\.com/(?P<id>[0-9]+)/?', webpage)
 								        if mobj is not None:
 								            return self.url_result('5min:%s' % mobj.group('id'), 'FiveMin')
-												[generic] Add support for Crooks and Liars embeds

											
										
										
											10 years ago
+								        # Look for Crooks and Liars embeds
 								        mobj = re.search(
 								            r'<(?:iframe[^>]+src|param[^>]+value)=(["\'])(?P<url>(?:https?:)?//embed\.crooksandliars\.com/(?:embed|v)/.+?)\1', webpage)
 								        if mobj is not None:
 								            return self.url_result(mobj.group('url'))
-												[NBC/ThePlatform/Generic] Add a generic detector for NBCSportsVPlayer and enhance error detection in ThePlatformIE

											
										
										
											10 years ago
+								        # Look for NBC Sports VPlayer embeds
 								        nbc_sports_url = NBCSportsVPlayerIE._extract_url(webpage)
 								        if nbc_sports_url:
 								            return self.url_result(nbc_sports_url, 'NBCSportsVPlayer')
-												[generic] Detect NBC News embeds

											
										
										
											9 years ago
+								        # Look for NBC News embeds
 								        nbc_news_embed_url = re.search(
 								            r'<iframe[^>]+src=(["\'])(?P<url>(?:https?:)?//www\.nbcnews\.com/widget/video-embed/[^"\']+)\1', webpage)
 								        if nbc_news_embed_url:
 								            return self.url_result(nbc_news_embed_url.group('url'), 'NBCNews')
-												add google drive embeds
											
										
										
											10 years ago
+								        # Look for Google Drive embeds
-												[googledrive] Modernize

											
										
										
											9 years ago
+								        google_drive_url = GoogleDriveIE._extract_url(webpage)
-												add google drive embeds
											
										
										
											10 years ago
+								        if google_drive_url:
 								            return self.url_result(google_drive_url, 'GoogleDrive')
-												[udn] Add new extractor

											
										
										
											10 years ago
+								        # Look for UDN embeds
 								        mobj = re.search(
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								            r'<iframe[^>]+src="(?:https?:)?(?P<url>%s)"' % UDNEmbedIE._PROTOCOL_RELATIVE_VALID_URL, webpage)
-												[udn] Add new extractor

											
										
										
											10 years ago
+								        if mobj is not None:
 								            return self.url_result(
-												[utils] Remove url_infer_protocol

											
										
										
											10 years ago
+								                compat_urlparse.urljoin(url, mobj.group('url')), 'UDNEmbed')
-												[udn] Add new extractor

											
										
										
											10 years ago
-												[CSpan] Add detection for Senate ISVP. Closes #5302

											
										
										
											10 years ago
+								        # Look for Senate ISVP iframe
 								        senate_isvp_url = SenateISVPIE._search_iframe_url(webpage)
 								        if senate_isvp_url:
-												[generic] Fix typo

											
										
										
											10 years ago
+								            return self.url_result(senate_isvp_url, 'SenateISVP')
-												[CSpan] Add detection for Senate ISVP. Closes #5302

											
										
										
											10 years ago
-												[extractor/generic] Add support for OnionStudios embeds (Closes #5841)

											
										
										
											10 years ago
+								        # Look for OnionStudios embeds
 								        onionstudios_url = OnionStudiosIE._extract_url(webpage)
 								        if onionstudios_url:
 								            return self.url_result(onionstudios_url)
-												[viewlift] replace SnagFilms extractors

- add support for other sites that use the same logic
- improve format extraction and sorting

											
										
										
											9 years ago
+								        # Look for ViewLift embeds
 								        viewlift_url = ViewLiftEmbedIE._extract_url(webpage)
 								        if viewlift_url:
 								            return self.url_result(viewlift_url)
-												[extractor/generic] Add support for snagfilms embeds

											
										
										
											10 years ago
-												[makertv] improve extraction

											
										
										
											9 years ago
+								        # Look for JWPlatform embeds
-												[jwplatform] Add support for multiple embeds (closes #15192)

											
										
										
											7 years ago
+								        jwplatform_urls = JWPlatformIE._extract_urls(webpage)
 								        if jwplatform_urls:
 								            return self.playlist_from_matches(jwplatform_urls, video_id, video_title, ie=JWPlatformIE.ie_key())
-												[makertv] improve extraction

											
										
										
											9 years ago
-												[ultimedia] Rename to digiteka

											
										
										
											9 years ago
+								        # Look for Digiteka embeds
 								        digiteka_url = DigitekaIE._extract_url(webpage)
 								        if digiteka_url:
 								            return self.url_result(self._proto_relative_url(digiteka_url), DigitekaIE.ie_key())
-												[jukebox] remove extractor and handle it using generic extractor

											
										
										
											9 years ago
-												[extractor/generic] Add support for arkena embeds

											
										
										
											9 years ago
+								        # Look for Arkena embeds
 								        arkena_url = ArkenaIE._extract_url(webpage)
 								        if arkena_url:
 								            return self.url_result(arkena_url, ArkenaIE.ie_key())
-												[piksel] Add new extractor (closes #11246)

											
										
										
											8 years ago
+								        # Look for Piksel embeds
 								        piksel_url = PikselIE._extract_url(webpage)
 								        if piksel_url:
 								            return self.url_result(piksel_url, PikselIE.ie_key())
-												[generic] Add support for Limelight API

											
										
										
											9 years ago
+								        # Look for Limelight embeds
-												[limelight] Improve embeds extraction (closes #12761)
* Move extraction code to extractor
* Add extraction for LimelightEmbeddedPlayerFlash embeds
* Extract multiple video

											
										
										
											8 years ago
+								        limelight_urls = LimelightBaseIE._extract_urls(webpage, url)
 								        if limelight_urls:
 								            return self.playlist_result(
 								                limelight_urls, video_id, video_title, video_description)
-												[anvato] Improve extraction (closes #12913)
* Promote to regular shortcut based extractor
* Add mcp to access key mapping table
* Add support for embeds extraction
* Add support for anvato embeds in generic extractor

											
										
										
											8 years ago
+								        # Look for Anvato embeds
 								        anvato_urls = AnvatoIE._extract_urls(self, webpage, video_id)
 								        if anvato_urls:
 								            return self.playlist_result(
 								                anvato_urls, video_id, video_title, video_description)
-												[generic/adobetv] Support AdobeTVVideo embeds (#6039)

											
										
										
											10 years ago
+								        # Look for AdobeTVVideo embeds
 								        mobj = re.search(
 								            r'<iframe[^>]+src=[\'"]((?:https?:)?//video\.tv\.adobe\.com/v/\d+[^"]+)[\'"]',
 								            webpage)
 								        if mobj is not None:
 								            return self.url_result(
 								                self._proto_relative_url(unescapeHTML(mobj.group(1))),
 								                'AdobeTVVideo')
-												[generic] Support Vine embeds (#8817)

											
										
										
											9 years ago
+								        # Look for Vine embeds
 								        mobj = re.search(
 								            r'<iframe[^>]+src=[\'"]((?:https?:)?//(?:www\.)?vine\.co/v/[^/]+/embed/(?:simple|postcard))',
 								            webpage)
 								        if mobj is not None:
 								            return self.url_result(
 								                self._proto_relative_url(unescapeHTML(mobj.group(1))), 'Vine')
-												[vodplatform] Add new extractor

											
										
										
											9 years ago
+								        # Look for VODPlatform embeds
 								        mobj = re.search(
-												[generic,vodplatform] improve embed regex

											
										
										
											8 years ago
+								            r'<iframe[^>]+src=(["\'])(?P<url>(?:https?:)?//(?:www\.)?vod-platform\.net/[eE]mbed/.+?)\1',
-												[vodplatform] Add new extractor

											
										
										
											9 years ago
+								            webpage)
 								        if mobj is not None:
 								            return self.url_result(
-												[generic,vodplatform] improve embed regex

											
										
										
											8 years ago
+								                self._proto_relative_url(unescapeHTML(mobj.group('url'))), 'VODPlatform')
-												[vodplatform] Add new extractor

											
										
										
											9 years ago
-												[mangomolo] add support for Mangomolo embeds

											
										
										
											8 years ago
+								        # Look for Mangomolo embeds
 								        mobj = re.search(
-												[mangomolo] fix domain regex

											
										
										
											8 years ago
+								            r'''(?x)<iframe[^>]+src=(["\'])(?P<url>(?:https?:)?//(?:www\.)?admin\.mangomolo\.com/analytics/index\.php/customers/embed/
-												[mangomolo] add support for Mangomolo embeds

											
										
										
											8 years ago
+								                (?:
 								                    video\?.*?\bid=(?P<video_id>\d+)|
 								                    index\?.*?\bchannelid=(?P<channel_id>(?:[A-Za-z0-9+/=]|%2B|%2F|%3D)+)
 								                ).+?)\1''', webpage)
 								        if mobj is not None:
 								            info = {
 								                '_type': 'url_transparent',
 								                'url': self._proto_relative_url(unescapeHTML(mobj.group('url'))),
 								                'title': video_title,
 								                'description': video_description,
 								                'thumbnail': video_thumbnail,
 								                'uploader': video_uploader,
 								            }
 								            video_id = mobj.group('video_id')
 								            if video_id:
 								                info.update({
 								                    'ie_key': 'MangomoloVideo',
 								                    'id': video_id,
 								                })
 								            else:
 								                info.update({
 								                    'ie_key': 'MangomoloLive',
 								                    'id': mobj.group('channel_id'),
 								                })
 								            return info
-												[generic] Extract Instagram embeds (#8817)

											
										
										
											9 years ago
+								        # Look for Instagram embeds
 								        instagram_embed_url = InstagramIE._extract_embed_url(webpage)
 								        if instagram_embed_url is not None:
-												[extractor/generic] Improve instagram embeds (Closes #9213)

											
										
										
											9 years ago
+								            return self.url_result(
 								                self._proto_relative_url(instagram_embed_url), InstagramIE.ie_key())
-												[generic] Extract Instagram embeds (#8817)

											
										
										
											9 years ago
-												[generic] Add support for LiveLeak embeds

											
										
										
											9 years ago
+								        # Look for LiveLeak embeds
-												[liveleak] Support another liveleak embedding pattern (closes #13336)

											
										
										
											7 years ago
+								        liveleak_urls = LiveLeakIE._extract_urls(webpage)
 								        if liveleak_urls:
 								            return self.playlist_from_matches(liveleak_urls, video_id, video_title)
-												[generic] Add support for LiveLeak embeds

											
										
										
											9 years ago
-												[extractor/generic:3qsdn] Add support for embeds

											
										
										
											9 years ago
+								        # Look for 3Q SDN embeds
 								        threeqsdn_url = ThreeQSDNIE._extract_url(webpage)
 								        if threeqsdn_url:
-												[extractor/generic] Improve 3qsdn embeds support (Closes #9453)

											
										
										
											9 years ago
+								            return {
 								                '_type': 'url_transparent',
 								                'ie_key': ThreeQSDNIE.ie_key(),
 								                'url': self._proto_relative_url(threeqsdn_url),
 								                'title': video_title,
 								                'description': video_description,
 								                'thumbnail': video_thumbnail,
 								                'uploader': video_uploader,
 								            }
-												[extractor/generic:3qsdn] Add support for embeds

											
										
										
											9 years ago
-												[vbox7:generic] Add support for vbox7 embeds

											
										
										
											8 years ago
+								        # Look for VBOX7 embeds
 								        vbox7_url = Vbox7IE._extract_url(webpage)
 								        if vbox7_url:
 								            return self.url_result(vbox7_url, Vbox7IE.ie_key())
-												[DBTV:generic] Add support for embeds

											
										
										
											8 years ago
+								        # Look for DBTV embeds
 								        dbtv_urls = DBTVIE._extract_urls(webpage)
 								        if dbtv_urls:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								            return self.playlist_from_matches(dbtv_urls, video_id, video_title, ie=DBTVIE.ie_key())
-												[DBTV:generic] Add support for embeds

											
										
										
											8 years ago
-												[videa] Add support for videa embeds

											
										
										
											8 years ago
+								        # Look for Videa embeds
 								        videa_urls = VideaIE._extract_urls(webpage)
 								        if videa_urls:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								            return self.playlist_from_matches(videa_urls, video_id, video_title, ie=VideaIE.ie_key())
-												[videa] Add support for videa embeds

											
										
										
											8 years ago
-												[extractor/generic] Add support for 20 minuten embeds (closes #11683, closes #11751)

											
										
										
											8 years ago
+								        # Look for 20 minuten embeds
 								        twentymin_urls = TwentyMinutenIE._extract_urls(webpage)
 								        if twentymin_urls:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								            return self.playlist_from_matches(
 								                twentymin_urls, video_id, video_title, ie=TwentyMinutenIE.ie_key())
-												[extractor/generic] Add support for 20 minuten embeds (closes #11683, closes #11751)

											
										
										
											8 years ago
-												[extractor/generic] Add support for openload embeds (closes #11536, closes #11812)

											
										
										
											8 years ago
+								        # Look for Openload embeds
 								        openload_urls = OpenloadIE._extract_urls(webpage)
 								        if openload_urls:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								            return self.playlist_from_matches(
 								                openload_urls, video_id, video_title, ie=OpenloadIE.ie_key())
-												[extractor/generic] Add support for openload embeds (closes #11536, closes #11812)

											
										
										
											8 years ago
-												[videopress] Add extractor

											
										
										
											8 years ago
+								        # Look for VideoPress embeds
 								        videopress_urls = VideoPressIE._extract_urls(webpage)
 								        if videopress_urls:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								            return self.playlist_from_matches(
 								                videopress_urls, video_id, video_title, ie=VideoPressIE.ie_key())
-												[videopress] Add extractor

											
										
										
											8 years ago
-												[generic] Add support for rutube embeds

											
										
										
											8 years ago
+								        # Look for Rutube embeds
 								        rutube_urls = RutubeIE._extract_urls(webpage)
 								        if rutube_urls:
-												[BostonGlobe] New. Nonstandard version of Brightcove.

Has a "data-brightcove-video-id" instead of a "data-video-id," otherwise
pretty much just Brightcove. Except the Globe isn't all Brightcove
videos, so fallback to Generic, too.

Also, abstract playlist_from_matches() from generic.py to common.py, and use
it here.

History of these changes can be found in
51170427d4b1143572a498dedaee61863a5b2c5b.

											
										
										
											8 years ago
+								            return self.playlist_from_matches(
-												Fix bugs caused by typos


											
										
										
											8 years ago
+								                rutube_urls, video_id, video_title, ie=RutubeIE.ie_key())
-												[videopress] Add extractor

											
										
										
											8 years ago
-												[washingtonpost] Add support for embeds (closes #12699)

											
										
										
											8 years ago
+								        # Look for WashingtonPost embeds
 								        wapo_urls = WashingtonPostIE._extract_urls(webpage)
 								        if wapo_urls:
 								            return self.playlist_from_matches(
 								                wapo_urls, video_id, video_title, ie=WashingtonPostIE.ie_key())
-												[extractor/generic] Add support for mediaset embeds

											
										
										
											8 years ago
+								        # Look for Mediaset embeds
-												[mediaset] Improve embed support (closes #17668)

											
										
										
											6 years ago
+								        mediaset_urls = MediasetIE._extract_urls(self, webpage)
-												[extractor/generic] Add support for mediaset embeds

											
										
										
											8 years ago
+								        if mediaset_urls:
 								            return self.playlist_from_matches(
 								                mediaset_urls, video_id, video_title, ie=MediasetIE.ie_key())
-												[joj] Rewrite and add support for generic embeds (closes #13268)

											
										
										
											8 years ago
+								        # Look for JOJ.sk embeds
 								        joj_urls = JojIE._extract_urls(webpage)
 								        if joj_urls:
 								            return self.playlist_from_matches(
 								                joj_urls, video_id, video_title, ie=JojIE.ie_key())
-												[megaphone] Add extractor

											
										
										
											8 years ago
+								        # Look for megaphone.fm embeds
 								        mpfn_urls = MegaphoneIE._extract_urls(webpage)
 								        if mpfn_urls:
 								            return self.playlist_from_matches(
 								                mpfn_urls, video_id, video_title, ie=MegaphoneIE.ie_key())
-												[generic] Replace vzaar embed test

											
										
										
											7 years ago
+								        # Look for vzaar embeds
 								        vzaar_urls = VzaarIE._extract_urls(webpage)
 								        if vzaar_urls:
 								            return self.playlist_from_matches(
 								                vzaar_urls, video_id, video_title, ie=VzaarIE.ie_key())
-												[generic] Add support for channel9 embeds (closes #14469)

											
										
										
											7 years ago
+								        channel9_urls = Channel9IE._extract_urls(webpage)
 								        if channel9_urls:
 								            return self.playlist_from_matches(
 								                channel9_urls, video_id, video_title, ie=Channel9IE.ie_key())
-												[vshare] Fix extraction (closes #14473)


											
										
										
											7 years ago
+								        vshare_urls = VShareIE._extract_urls(webpage)
 								        if vshare_urls:
 								            return self.playlist_from_matches(
 								                vshare_urls, video_id, video_title, ie=VShareIE.ie_key())
-												[mediasite] Add extractor, subsume sandia and collegerama extractors

											
										
										
											8 years ago
+								        # Look for Mediasite embeds
-												[mediasite] Improve extraction and code style, add support for DASH (closes #11185, closes #14343, refs #5428)

											
										
										
											7 years ago
+								        mediasite_urls = MediasiteIE._extract_urls(webpage)
 								        if mediasite_urls:
 								            entries = [
 								                self.url_result(smuggle_url(
 								                    compat_urlparse.urljoin(url, mediasite_url),
 								                    {'UrlReferrer': url}), ie=MediasiteIE.ie_key())
 								                for mediasite_url in mediasite_urls]
 								            return self.playlist_result(entries, video_id, video_title)
-												[mediasite] Add extractor, subsume sandia and collegerama extractors

											
										
										
											8 years ago
-												[springboardplatform] Add extractor

											
										
										
											7 years ago
+								        springboardplatform_urls = SpringboardPlatformIE._extract_urls(webpage)
 								        if springboardplatform_urls:
 								            return self.playlist_from_matches(
 								                springboardplatform_urls, video_id, video_title,
 								                ie=SpringboardPlatformIE.ie_key())
-												[yapfiles] Add extractor (closes #15726, refs #11085)

											
										
										
											7 years ago
+								        yapfiles_urls = YapFilesIE._extract_urls(webpage)
 								        if yapfiles_urls:
 								            return self.playlist_from_matches(
 								                yapfiles_urls, video_id, video_title, ie=YapFilesIE.ie_key())
-												[vice] Fix extraction and rework extractors (closes #11101, closes #13019, closes #13622, closes #13778)

											
										
										
											7 years ago
+								        vice_urls = ViceIE._extract_urls(webpage)
 								        if vice_urls:
 								            return self.playlist_from_matches(
 								                vice_urls, video_id, video_title, ie=ViceIE.ie_key())
-												[generic] Add support for xfileshare embeds (closes #15879)

											
										
										
											7 years ago
+								        xfileshare_urls = XFileShareIE._extract_urls(webpage)
 								        if xfileshare_urls:
 								            return self.playlist_from_matches(
 								                xfileshare_urls, video_id, video_title, ie=XFileShareIE.ie_key())
-												[cloudflarestream] Add support for cloudflare streams (closes #16375)

											
										
										
											7 years ago
+								        cloudflarestream_urls = CloudflareStreamIE._extract_urls(webpage)
 								        if cloudflarestream_urls:
 								            return self.playlist_from_matches(
 								                cloudflarestream_urls, video_id, video_title, ie=CloudflareStreamIE.ie_key())
-												[peertube] Improve generic support (closes #16733)

											
										
										
											7 years ago
+								        peertube_urls = PeerTubeIE._extract_urls(webpage, url)
-												[peertube] Add support for generic embeds

											
										
										
											7 years ago
+								        if peertube_urls:
 								            return self.playlist_from_matches(
 								                peertube_urls, video_id, video_title, ie=PeerTubeIE.ie_key())
-												[indavideo] Add support for generic embeds (closes #11989)

											
										
										
											7 years ago
+								        indavideo_urls = IndavideoEmbedIE._extract_urls(webpage)
 								        if indavideo_urls:
 								            return self.playlist_from_matches(
 								                indavideo_urls, video_id, video_title, ie=IndavideoEmbedIE.ie_key())
-												[apa] Add extractor (closes #15041, closes #15672)

											
										
										
											7 years ago
+								        apa_urls = APAIE._extract_urls(webpage)
 								        if apa_urls:
 								            return self.playlist_from_matches(
 								                apa_urls, video_id, video_title, ie=APAIE.ie_key())
-												[foxnews] Add support for iframe embeds (closes #15810, closes #16711)

											
										
										
											7 years ago
+								        foxnews_urls = FoxNewsIE._extract_urls(webpage)
 								        if foxnews_urls:
 								            return self.playlist_from_matches(
 								                foxnews_urls, video_id, video_title, ie=FoxNewsIE.ie_key())
-												[generic] PEP 8 (#17455)

											
										
										
											6 years ago
+								        sharevideos_urls = [sharevideos_mobj.group('url') for sharevideos_mobj in re.finditer(
-												[generic] Restrict share-videos.se embeds regex to filter bogus URLs (#16115)

											
										
										
											7 years ago
+								            r'<iframe[^>]+?\bsrc\s*=\s*(["\'])(?P<url>(?:https?:)?//embed\.share-videos\.se/auto/embed/\d+\?.*?\buid=\d+.*?)\1',
 								            webpage)]
 								        if sharevideos_urls:
 								            return self.playlist_from_matches(
 								                sharevideos_urls, video_id, video_title)
-												[viqeo] Add extractor (closes #17066)

											
										
										
											7 years ago
+								        viqeo_urls = ViqeoIE._extract_urls(webpage)
 								        if viqeo_urls:
 								            return self.playlist_from_matches(
 								                viqeo_urls, video_id, video_title, ie=ViqeoIE.ie_key())
-												[generic] Add support for expressen embeds

											
										
										
											6 years ago
 								        expressen_urls = ExpressenIE._extract_urls(webpage)
 								        if expressen_urls:
 								            return self.playlist_from_matches(
 								                expressen_urls, video_id, video_title, ie=ExpressenIE.ie_key())
-												[viqeo] Add extractor (closes #17066)

											
										
										
											7 years ago
-												[utils] Fix xattr error handling

											
										
										
											8 years ago
+								        # Look for HTML5 media
 								        entries = self._parse_html5_media_entries(url, webpage, video_id, m3u8_id='hls')
 								        if entries:
-												[generic] Fix support for multiple HTML5 videos on one page (closes #14080)


											
										
										
											7 years ago
+								            if len(entries) == 1:
 								                entries[0].update({
-												[utils] Fix xattr error handling

											
										
										
											8 years ago
+								                    'id': video_id,
 								                    'title': video_title,
 								                })
-												[generic] Fix support for multiple HTML5 videos on one page (closes #14080)


											
										
										
											7 years ago
+								            else:
 								                for num, entry in enumerate(entries, start=1):
 								                    entry.update({
 								                        'id': '%s-%s' % (video_id, num),
 								                        'title': '%s (%d)' % (video_title, num),
 								                    })
 								            for entry in entries:
-												[utils] Fix xattr error handling

											
										
										
											8 years ago
+								                self._sort_formats(entry['formats'])
-												[generic] Fix support for multiple HTML5 videos on one page (closes #14080)


											
										
										
											7 years ago
+								            return self.playlist_result(entries, video_id, video_title)
-												[utils] Fix xattr error handling

											
										
										
											8 years ago
-												_find_jwplayer_data() returns dict or None

This simplifies code for callers of `_find_jwplayer_data()` which no longer have
to run `_parse_json()` on the return value.

It also makes sure that `_find_jwplayer_data()` returns either a `dict` or
`None` and nothing else.

											
										
										
											8 years ago
+								        jwplayer_data = self._find_jwplayer_data(
 								            webpage, video_id, transform_source=js_to_json)
 								        if jwplayer_data:
-												[generic] Skip unsuccessful jwplayer extraction (closes #16735)

											
										
										
											7 years ago
+								            try:
 								                info = self._parse_jwplayer_data(
 								                    jwplayer_data, video_id, require_title=False, base_url=url)
 								                return merge_dicts(info, info_dict)
 								            except ExtractorError:
 								                # See https://github.com/rg3/youtube-dl/pull/16735
 								                pass
-												[generic] Try parsing JWPlayer embedded videos (closes #12030)

											
										
										
											8 years ago
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
+								        # Video.js embed
 								        mobj = re.search(
-												[generic] Add support for single format Video.js embeds (closes #14371)

											
										
										
											7 years ago
+								            r'(?s)\bvideojs\s*\(.+?\.src\s*\(\s*((?:\[.+?\]|{.+?}))\s*\)\s*;',
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
+								            webpage)
 								        if mobj is not None:
 								            sources = self._parse_json(
 								                mobj.group(1), video_id, transform_source=js_to_json,
 								                fatal=False) or []
-												[generic] Add support for single format Video.js embeds (closes #14371)

											
										
										
											7 years ago
+								            if not isinstance(sources, list):
 								                sources = [sources]
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
+								            formats = []
 								            for source in sources:
-												[generic] Allow relative src for videojs embeds (closes #17324)

											
										
										
											6 years ago
+								                src = source.get('src')
 								                if not src or not isinstance(src, compat_str):
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
+								                    continue
 								                src = compat_urlparse.urljoin(url, src)
 								                src_type = source.get('type')
 								                if isinstance(src_type, compat_str):
 								                    src_type = src_type.lower()
 								                ext = determine_ext(src).lower()
 								                if src_type == 'video/youtube':
 								                    return self.url_result(src, YoutubeIE.ie_key())
 								                if src_type == 'application/dash+xml' or ext == 'mpd':
 								                    formats.extend(self._extract_mpd_formats(
 								                        src, video_id, mpd_id='dash', fatal=False))
 								                elif src_type == 'application/x-mpegurl' or ext == 'm3u8':
 								                    formats.extend(self._extract_m3u8_formats(
 								                        src, video_id, 'mp4', entry_protocol='m3u8_native',
 								                        m3u8_id='hls', fatal=False))
 								                else:
 								                    formats.append({
 								                        'url': src,
 								                        'ext': (mimetype2ext(src_type) or
 								                                ext if ext in KNOWN_EXTENSIONS else 'mp4'),
 								                    })
 								            if formats:
 								                self._sort_formats(formats)
 								                info_dict['formats'] = formats
 								                return info_dict
-												[extractor/generic] Extract from LD-JSON last of all
Previous sources may contain several formats, e.g. http://tamasha.com/v/PgGZ

											
										
										
											7 years ago
+								        # Looking for http://schema.org/VideoObject
 								        json_ld = self._search_json_ld(
 								            webpage, video_id, default={}, expected_type='VideoObject')
 								        if json_ld.get('url'):
 								            return merge_dicts(json_ld, info_dict)
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											10 years ago
+								        def check_video(vurl):
-												[generic] Add support for jwPlayer YouTube videos

This makes nationalarchives.gov.uk work (Fixes #4907, fixes #4876)

											
										
										
											10 years ago
+								            if YoutubeIE.suitable(vurl):
 								                return True
-												[extractor/generic] Improve rtmp support (closes #11993)

											
										
										
											8 years ago
+								            if RtmpIE.suitable(vurl):
 								                return True
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											10 years ago
+								            vpath = compat_urlparse.urlparse(vurl).path
 								            vext = determine_ext(vpath)
-												[generic] exclude urls with xml ext from valid video urls(closes #10768)(closes #11654)

											
										
										
											8 years ago
+								            return '.' in vpath and vext not in ('swf', 'png', 'jpg', 'srt', 'sbv', 'sub', 'vtt', 'ttml', 'js', 'xml')
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											10 years ago
 								        def filter_video(urls):
 								            """Return, as a list, the entries of urls accepted by check_video."""
 								            return [candidate for candidate in urls if check_video(candidate)]
-												Move GenericIE into its own file

											
										
										
											12 years ago
+								        # Start with something easy: JW Player in SWFObject
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											10 years ago
+								        found = filter_video(re.findall(r'flashvars: [\'"](?:.*&)?file=(http[^\'"&]*)', webpage))
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								        if not found:
-												[generic] Support gorillavid.in

Previously, we were a little bit over-eager and got a random swf file.
Fixes #2084.

											
										
										
											11 years ago
+								            # Look for gorilla-vid style embedding
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											10 years ago
+								            found = filter_video(re.findall(r'''(?sx)
-												[generic] Improve jwplayer detection (Fixes #2731)

											
										
										
											11 years ago
+								                (?:
 								                    jw_plugins|
 								                    JWPlayerOptions|
 								                    jwplayer\s*\(\s*["'][^'"]+["']\s*\)\s*\.setup
 								                )
-												[generic] Add support for jwPlayer YouTube videos

This makes nationalarchives.gov.uk work (Fixes #4907, fixes #4876)

											
										
										
											10 years ago
+								                .*?
 								                ['"]?file['"]?\s*:\s*["\'](.*?)["\']''', webpage))
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								        if not found:
-												Move GenericIE into its own file

											
										
										
											12 years ago
+								            # Broaden the search a little bit
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											10 years ago
+								            found = filter_video(re.findall(r'[^A-Za-z0-9]?(?:file|source)=(http[^\'"&]*)', webpage))
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								        if not found:
 								            # Broaden the findall a little bit: JWPlayer JS loader
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											10 years ago
+								            found = filter_video(re.findall(
-												[generic] Expand jwplayer support

											
										
										
											10 years ago
+								                r'[^A-Za-z0-9]?(?:file|video_url)["\']?:\s*["\'](http(?![^\'"]+\.[0-9]+[\'"])[^\'"]+)["\']', webpage))
-												[generic] Automatic detection of flow player and age_limit (Fixes #3576)

											
										
										
											10 years ago
+								        if not found:
 								            # Flow player
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											10 years ago
+								            found = filter_video(re.findall(r'''(?xs)
-												[generic] Automatic detection of flow player and age_limit (Fixes #3576)

											
										
										
											10 years ago
+								                flowplayer\("[^"]+",\s*
 								                    \{[^}]+?\}\s*,
-												The opening curly brace `{` is a regex reserved [control character](http://stackoverflow.com/a/400316/1106367), so it needs to be escaped.

											
										
										
											10 years ago
+								                    \s*\{[^}]+? ["']?clip["']?\s*:\s*\{\s*
-												[generic] Automatic detection of flow player and age_limit (Fixes #3576)

											
										
										
											10 years ago
+								                        ["']?url["']?\s*:\s*["']([^"']+)["']
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											10 years ago
+								            ''', webpage))
-												[generic] Add support for Cinerama player (Fixes #4752)

											
										
										
											10 years ago
+								        if not found:
 								            # Cinerama player
 								            found = re.findall(
 								                r"cinerama\.embedPlayer\(\s*\'[^']+\',\s*'([^']+)'", webpage)
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								        if not found:
-												Move GenericIE into its own file

											
										
										
											12 years ago
+								            # Try to find twitter cards info
-												[extractor/generic] Change twitter:player embeds priority to lowest (Closes #10090)

											
										
										
											9 years ago
+								            # twitter:player:stream should be checked before twitter:player since
 								            # it is expected to contain a raw stream (see
 								            # https://dev.twitter.com/cards/types/player#On_twitter.com_via_desktop_browser)
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											10 years ago
+								            found = filter_video(re.findall(
 								                r'<meta (?:property|name)="twitter:player:stream" (?:content|value)="(.+?)"', webpage))
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								        if not found:
-												Move GenericIE into its own file

											
										
										
											12 years ago
+								            # We look for Open Graph info:
 								            # We have to match any number of spaces between elements; some sites try to align them (e.g. statigr.am)
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								            m_video_type = re.findall(r'<meta.*?property="og:video:type".*?content="video/(.*?)"', webpage)
-												Move GenericIE into its own file

											
										
										
											12 years ago
+								            # We only look in og:video if the MIME type is a video, don't try if it's a Flash player:
 								            if m_video_type is not None:
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											10 years ago
+								                found = filter_video(re.findall(r'<meta.*?property="og:video".*?content="(.*?)"', webpage))
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								        if not found:
-												[generic] Generalize redirect regex

											
										
										
											10 years ago
+								            REDIRECT_REGEX = r'[0-9]{,2};\s*(?:URL|url)=\'?([^\'"]+)'
-												[generic] Fix redirect

											
										
										
											11 years ago
+								            found = re.search(
-												[generic] Add support for <meta redirect>

Fixes #413

											
										
										
											11 years ago
+								                r'(?i)<meta\s+(?=(?:[a-z-]+="[^"]+"\s+)*http-equiv="refresh")'
-												[generic] Generalize redirect regex

											
										
										
											10 years ago
+								                r'(?:[a-z-]+="[^"]+"\s+)*?content="%s' % REDIRECT_REGEX,
-												[generic] Add support for <meta redirect>

Fixes #413

											
										
										
											11 years ago
+								                webpage)
-												[generic] Follow redirects specified by `Refresh` HTTP header

											
										
										
											10 years ago
+								            if not found:
 								                # Look also in Refresh HTTP header
 								                refresh_header = head_response.headers.get('Refresh')
 								                if refresh_header:
-												[extractor/generic] Fix following redirect in Refresh HTTP header on python 2

											
										
										
											9 years ago
+								                    # In python 2 response HTTP headers are bytestrings
 								                    if sys.version_info < (3, 0) and isinstance(refresh_header, str):
 								                        refresh_header = refresh_header.decode('iso-8859-1')
-												[generic] Generalize redirect regex

											
										
										
											10 years ago
+								                    found = re.search(REDIRECT_REGEX, refresh_header)
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								            if found:
-												[generic] Unescape HTML escape sequences in redirect urls (fixes #6311)

											
										
										
											10 years ago
+								                new_url = compat_urlparse.urljoin(url, unescapeHTML(found.group(1)))
-												[generic] Do not follow redirects to the same URL

											
										
										
											8 years ago
+								                if new_url != url:
 								                    self.report_following_redirect(new_url)
 								                    return {
 								                        '_type': 'url',
 								                        'url': new_url,
 								                    }
 								                else:
 								                    found = None
-												[extractor/generic] Change twitter:player embeds priority to lowest (Closes #10090)

											
										
										
											9 years ago
 								        if not found:
 								            # twitter:player is a https URL to iframe player that may or may not
 								            # be supported by youtube-dl thus this is checked the very last (see
 								            # https://dev.twitter.com/cards/types/player#On_twitter.com_via_desktop_browser)
 								            embed_url = self._html_search_meta('twitter:player', webpage, default=None)
-												[generic] Fix infinite recursion for twitter:player URLs (closes #14339)

											
										
										
											7 years ago
+								            if embed_url and embed_url != url:
-												[extractor/generic] Change twitter:player embeds priority to lowest (Closes #10090)

											
										
										
											9 years ago
+								                return self.url_result(embed_url)
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								        if not found:
-												Add documentation about supported sites (Fixes #4503)

											
										
										
											10 years ago
+								            raise UnsupportedError(url)
-												Move GenericIE into its own file

											
										
										
											12 years ago
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								        entries = []
-												[genric] Eliminate duplicated video URLs (closes #6562)

											
										
										
											9 years ago
+								        for video_url in orderedSet(found):
-												[generic] Unescape the video URL

Fixes #9279

											
										
										
											9 years ago
+								            video_url = unescapeHTML(video_url)
-												[generic] Unescape URLs from JWPlayer (#7582)

											
										
										
											9 years ago
+								            video_url = video_url.replace('\\/', '/')
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								            video_url = compat_urlparse.urljoin(url, video_url)
-												[extractor/generic] Use compat_urllib_parse_unquote

											
										
										
											10 years ago
+								            video_id = compat_urllib_parse_unquote(os.path.basename(video_url))
-												Move GenericIE into its own file

											
										
										
											12 years ago
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								            # Sometimes, jwplayer extraction will result in a YouTube URL
 								            if YoutubeIE.suitable(video_url):
 								                entries.append(self.url_result(video_url, 'Youtube'))
 								                continue
-												Move GenericIE into its own file

											
										
										
											12 years ago
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								            # here's a fun little line of code for you:
 								            video_id = os.path.splitext(video_id)[0]
-												[youtube] Support jwplayer with YouTube URLs (Closes #2075)

											
										
										
											11 years ago
-												[generic] Refactor

											
										
										
											9 years ago
+								            entry_info_dict = {
 								                'id': video_id,
 								                'uploader': video_uploader,
 								                'title': video_title,
 								                'age_limit': age_limit,
 								            }
-												[extractor/generic] Add test for #11993 and more metadata for rtmp

											
										
										
											8 years ago
+								            if RtmpIE.suitable(video_url):
 								                entry_info_dict.update({
 								                    '_type': 'url_transparent',
 								                    'ie_key': RtmpIE.ie_key(),
 								                    'url': video_url,
 								                })
 								                entries.append(entry_info_dict)
 								                continue
-												[extractor/generic] Add support for xspf playlists

											
										
										
											10 years ago
+								            ext = determine_ext(video_url)
 								            if ext == 'smil':
-												[generic] Refactor

											
										
										
											9 years ago
+								                entry_info_dict['formats'] = self._extract_smil_formats(video_url, video_id)
-												[extractor/generic] Add support for xspf playlists

											
										
										
											10 years ago
+								            elif ext == 'xspf':
 								                return self.playlist_result(self._extract_xspf_playlist(video_url, video_id), video_id)
-												[generic] Extract M3U8 formats (closes #7582)

											
										
										
											9 years ago
+								            elif ext == 'm3u8':
 								                entry_info_dict['formats'] = self._extract_m3u8_formats(video_url, video_id, ext='mp4')
-												[extractor/generic] Detect DASH manifests in found URLs and extract mpd formats

											
										
										
											9 years ago
+								            elif ext == 'mpd':
 								                entry_info_dict['formats'] = self._extract_mpd_formats(video_url, video_id)
-												[extractor/generic] Extract f4m formats from final URLs

											
										
										
											9 years ago
+								            elif ext == 'f4m':
 								                entry_info_dict['formats'] = self._extract_f4m_formats(video_url, video_id)
-												[extractor/generic] Skip URLs we came from when delegating ISM extraction

											
										
										
											8 years ago
+								            elif re.search(r'(?i)\.(?:ism|smil)/manifest', video_url) and video_url != url:
-												[extractor/generic] Improve ISM extraction

											
										
										
											8 years ago
+								                # Just matching .ism/manifest is not enough to be reliably sure
 								                # whether it's actually an ISM manifest or some other streaming
 								                # manifest since there are various streaming URL formats
 								                # possible (see [1]) as well as some other shenanigans like
 								                # .smil/manifest URLs that actually serve an ISM (see [2]) and
 								                # so on.
 								                # Thus the most reasonable way to solve this is to delegate
 								                # to generic extractor in order to look into the contents of
 								                # the manifest itself.
 								                # 1. https://azure.microsoft.com/en-us/documentation/articles/media-services-deliver-content-overview/#streaming-url-formats
 								                # 2. https://svs.itworkscdn.net/lbcivod/smil:itwfcdn/lbci/170976.smil/Manifest
 								                entry_info_dict = self.url_result(
 								                    smuggle_url(video_url, {'to_generic': True}),
 								                    GenericIE.ie_key())
-												[generic] Extract videos from SMIL manifests (closes #5145 and fixes #5135)

											
										
										
											10 years ago
+								            else:
-												[generic] Refactor

											
										
										
											9 years ago
+								                entry_info_dict['url'] = video_url
-												Remove _sort_formats from _extract_*_formats methods

Now _sort_formats should be called explicitly.
_sort_formats has been added to all the necessary places in code.

Closes #8051

											
										
										
											9 years ago
+								            if entry_info_dict.get('formats'):
 								                self._sort_formats(entry_info_dict['formats'])
-												[generic] Refactor

											
										
										
											9 years ago
+								            entries.append(entry_info_dict)
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
 								        if len(entries) == 1:
-												[generic] Fix wrong entries index

											
										
										
											11 years ago
+								            return entries[0]
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								        else:
 								            for num, e in enumerate(entries, start=1):
-												[generic] Don't set the 'title' if it's not defined in the entry (closes #5061)

Some of them may be an 'url' result, which in general don't have the 'title' field.

											
										
										
											10 years ago
+								                # 'url' results don't have a title
 								                if e.get('title') is not None:
 								                    e['title'] = '%s (%d)' % (e['title'], num)
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								            return {
 								                '_type': 'playlist',
 								                'entries': entries,
 								            }