3 from __future__ 
import unicode_literals
 
   9 from .common 
import InfoExtractor
 
  10 from .youtube 
import YoutubeIE
 
  11 from ..compat 
import ( 
  12     compat_etree_fromstring
, 
  14     compat_urllib_parse_unquote
, 
  16     compat_xml_parse_error
, 
  37 from .commonprotocols 
import RtmpIE
 
  38 from .brightcove 
import ( 
  46 from .nbc 
import NBCSportsVPlayerIE
 
  47 from .ooyala 
import OoyalaIE
 
  48 from .rutv 
import RUTVIE
 
  49 from .tvc 
import TVCIE
 
  50 from .sportbox 
import SportBoxIE
 
  51 from .smotri 
import SmotriIE
 
  52 from .myvi 
import MyviIE
 
  53 from .condenast 
import CondeNastIE
 
  54 from .udn 
import UDNEmbedIE
 
  55 from .senateisvp 
import SenateISVPIE
 
  56 from .svt 
import SVTIE
 
  57 from .pornhub 
import PornHubIE
 
  58 from .xhamster 
import XHamsterEmbedIE
 
  59 from .tnaflix 
import TNAFlixNetworkEmbedIE
 
  60 from .drtuber 
import DrTuberIE
 
  61 from .redtube 
import RedTubeIE
 
  62 from .tube8 
import Tube8IE
 
  63 from .vimeo 
import VimeoIE
 
  64 from .dailymotion 
import DailymotionIE
 
  65 from .dailymail 
import DailyMailIE
 
  66 from .onionstudios 
import OnionStudiosIE
 
  67 from .viewlift 
import ViewLiftEmbedIE
 
  68 from .mtv 
import MTVServicesEmbeddedIE
 
  69 from .pladform 
import PladformIE
 
  70 from .videomore 
import VideomoreIE
 
  71 from .webcaster 
import WebcasterFeedIE
 
  72 from .googledrive 
import GoogleDriveIE
 
  73 from .jwplatform 
import JWPlatformIE
 
  74 from .digiteka 
import DigitekaIE
 
  75 from .arkena 
import ArkenaIE
 
  76 from .instagram 
import InstagramIE
 
  77 from .liveleak 
import LiveLeakIE
 
  78 from .threeqsdn 
import ThreeQSDNIE
 
  79 from .theplatform 
import ThePlatformIE
 
  80 from .vessel 
import VesselIE
 
  81 from .kaltura 
import KalturaIE
 
  82 from .eagleplatform 
import EaglePlatformIE
 
  83 from .facebook 
import FacebookIE
 
  84 from .soundcloud 
import SoundcloudIE
 
  85 from .tunein 
import TuneInBaseIE
 
  86 from .vbox7 
import Vbox7IE
 
  87 from .dbtv 
import DBTVIE
 
  88 from .piksel 
import PikselIE
 
  89 from .videa 
import VideaIE
 
  90 from .twentymin 
import TwentyMinutenIE
 
  91 from .ustream 
import UstreamIE
 
  92 from .openload 
import ( 
  96 from .videopress 
import VideoPressIE
 
  97 from .rutube 
import RutubeIE
 
  98 from .limelight 
import LimelightBaseIE
 
  99 from .anvato 
import AnvatoIE
 
 100 from .washingtonpost 
import WashingtonPostIE
 
 101 from .wistia 
import WistiaIE
 
 102 from .mediaset 
import MediasetIE
 
 103 from .joj 
import JojIE
 
 104 from .megaphone 
import MegaphoneIE
 
 105 from .vzaar 
import VzaarIE
 
 106 from .channel9 
import Channel9IE
 
 107 from .vshare 
import VShareIE
 
 108 from .mediasite 
import MediasiteIE
 
 109 from .springboardplatform 
import SpringboardPlatformIE
 
 110 from .yapfiles 
import YapFilesIE
 
 111 from .vice 
import ViceIE
 
 112 from .xfileshare 
import XFileShareIE
 
 113 from .cloudflarestream 
import CloudflareStreamIE
 
 114 from .peertube 
import PeerTubeIE
 
 115 from .teachable 
import TeachableIE
 
 116 from .indavideo 
import IndavideoEmbedIE
 
 117 from .apa 
import APAIE
 
 118 from .foxnews 
import FoxNewsIE
 
 119 from .viqeo 
import ViqeoIE
 
 120 from .expressen 
import ExpressenIE
 
 121 from .zype 
import ZypeIE
 
 124 class GenericIE(InfoExtractor
): 
 125     IE_DESC 
= 'Generic downloader that works on some sites' 
 129         # Direct link to a video 
 131             'url': 'http://media.w3.org/2010/05/sintel/trailer.mp4', 
 132             'md5': '67d406c2bcb6af27fa886f31aa934bbe', 
 137                 'upload_date': '20100513', 
 140         # Direct link to media delivered compressed (until Accept-Encoding is *) 
 142             'url': 'http://calimero.tk/muzik/FictionJunction-Parallel_Hearts.flac', 
 143             'md5': '128c42e68b13950268b648275386fc74', 
 145                 'id': 'FictionJunction-Parallel_Hearts', 
 147                 'title': 'FictionJunction-Parallel_Hearts', 
 148                 'upload_date': '20140522', 
 150             'expected_warnings': [ 
 151                 'URL could be a direct video link, returning it as such.' 
 153             'skip': 'URL invalid', 
 155         # Direct download with broken HEAD 
 157             'url': 'http://ai-radio.org:8000/radio.opus', 
 164                 'skip_download': True,  # infinite live stream 
 166             'expected_warnings': [ 
 167                 r
'501.*Not Implemented', 
 171         # Direct link with incorrect MIME type 
 173             'url': 'http://ftp.nluug.nl/video/nluug/2014-11-20_nj14/zaal-2/5_Lennart_Poettering_-_Systemd.webm', 
 174             'md5': '4ccbebe5f36706d85221f204d7eb5913', 
 176                 'url': 'http://ftp.nluug.nl/video/nluug/2014-11-20_nj14/zaal-2/5_Lennart_Poettering_-_Systemd.webm', 
 177                 'id': '5_Lennart_Poettering_-_Systemd', 
 179                 'title': '5_Lennart_Poettering_-_Systemd', 
 180                 'upload_date': '20141120', 
 182             'expected_warnings': [ 
 183                 'URL could be a direct video link, returning it as such.' 
 188             'url': 'http://phihag.de/2014/youtube-dl/rss2.xml', 
 190                 'id': 'http://phihag.de/2014/youtube-dl/rss2.xml', 
 191                 'title': 'Zero Punctuation', 
 192                 'description': 're:.*groundbreaking video review series.*' 
 194             'playlist_mincount': 11, 
 196         # RSS feed with enclosure 
 198             'url': 'http://podcastfeeds.nbcnews.com/audio/podcast/MSNBC-MADDOW-NETCAST-M4V.xml', 
 200                 'id': 'pdv_maddow_netcast_m4v-02-27-2015-201624', 
 202                 'upload_date': '20150228', 
 203                 'title': 'pdv_maddow_netcast_m4v-02-27-2015-201624', 
 206         # RSS feed with enclosures and unsupported link URLs 
 208             'url': 'http://www.hellointernet.fm/podcast?format=rss', 
 210                 'id': 'http://www.hellointernet.fm/podcast?format=rss', 
 211                 'description': 'CGP Grey and Brady Haran talk about YouTube, life, work, whatever.', 
 212                 'title': 'Hello Internet', 
 214             'playlist_mincount': 100, 
 216         # SMIL from http://videolectures.net/promogram_igor_mekjavic_eng 
 218             'url': 'http://videolectures.net/promogram_igor_mekjavic_eng/video/1/smil.xml', 
 222                 'title': 'Automatics, robotics and biocybernetics', 
 223                 'description': 'md5:815fc1deb6b3a2bff99de2d5325be482', 
 224                 'upload_date': '20130627', 
 225                 'formats': 'mincount:16', 
 226                 'subtitles': 'mincount:1', 
 229                 'force_generic_extractor': True, 
 230                 'skip_download': True, 
 233         # SMIL from http://www1.wdr.de/mediathek/video/livestream/index.html 
 235             'url': 'http://metafilegenerator.de/WDR/WDR_FS/hds/hds.smil', 
 240                 'formats': 'mincount:1', 
 243                 'skip_download': True, 
 246         # SMIL from https://www.restudy.dk/video/play/id/1637 
 248             'url': 'https://www.restudy.dk/awsmedia/SmilDirectory/video_1637.xml', 
 252                 'title': 'video_1637', 
 253                 'formats': 'mincount:3', 
 256                 'skip_download': True, 
 259         # SMIL from http://adventure.howstuffworks.com/5266-cool-jobs-iditarod-musher-video.htm 
 261             'url': 'http://services.media.howstuffworks.com/videos/450221/smil-service.smil', 
 263                 'id': 'smil-service', 
 265                 'title': 'smil-service', 
 266                 'formats': 'mincount:1', 
 269                 'skip_download': True, 
 272         # SMIL from http://new.livestream.com/CoheedandCambria/WebsterHall/videos/4719370 
 274             'url': 'http://api.new.livestream.com/accounts/1570303/events/1585861/videos/4719370.smil', 
 278                 'title': '571de1fd-47bc-48db-abf9-238872a58d1f', 
 279                 'formats': 'mincount:3', 
 282                 'skip_download': True, 
 285         # XSPF playlist from http://www.telegraaf.nl/tv/nieuws/binnenland/24353229/__Tikibad_ontruimd_wegens_brand__.html 
 287             'url': 'http://www.telegraaf.nl/xml/playlist/2015/8/7/mZlp2ctYIUEB.xspf', 
 289                 'id': 'mZlp2ctYIUEB', 
 291                 'title': 'Tikibad ontruimd wegens brand', 
 292                 'description': 'md5:05ca046ff47b931f9b04855015e163a4', 
 293                 'thumbnail': r
're:^https?://.*\.jpg$', 
 297                 'skip_download': True, 
 300         # MPD from http://dash-mse-test.appspot.com/media.html 
 302             'url': 'http://yt-dash-mse-test.commondatastorage.googleapis.com/media/car-20120827-manifest.mpd', 
 303             'md5': '4b57baab2e30d6eb3a6a09f0ba57ef53', 
 305                 'id': 'car-20120827-manifest', 
 307                 'title': 'car-20120827-manifest', 
 308                 'formats': 'mincount:9', 
 309                 'upload_date': '20130904', 
 312                 'format': 'bestvideo', 
 315         # m3u8 served with Content-Type: audio/x-mpegURL; charset=utf-8 
 317             'url': 'http://once.unicornmedia.com/now/master/playlist/bb0b18ba-64f5-4b1b-a29f-0ac252f06b68/77a785f3-5188-4806-b788-0893a61634ed/93677179-2d99-4ef4-9e17-fe70d49abfbf/content.m3u8', 
 322                 'formats': 'mincount:8', 
 326                 'skip_download': True, 
 328             'skip': 'video gone', 
 330         # m3u8 served with Content-Type: text/plain 
 332             'url': 'http://www.nacentapps.com/m3u8/index.m3u8', 
 337                 'upload_date': '20140720', 
 338                 'formats': 'mincount:11', 
 342                 'skip_download': True, 
 344             'skip': 'video gone', 
 348             'url': 'http://www.google.com/url?sa=t&rct=j&q=&esrc=s&source=web&cd=1&cad=rja&ved=0CCUQtwIwAA&url=http%3A%2F%2Fwww.youtube.com%2Fwatch%3Fv%3DcmQHVoWB5FY&ei=F-sNU-LLCaXk4QT52ICQBQ&usg=AFQjCNEw4hL29zgOohLXvpJ-Bdh2bils1Q&bvm=bv.61965928,d.bGE', 
 352                 'upload_date': '20130224', 
 353                 'uploader_id': 'TheVerge', 
 354                 'description': r
're:^Chris Ziegler takes a look at the\.*', 
 355                 'uploader': 'The Verge', 
 356                 'title': 'First Firefox OS phones side-by-side', 
 359                 'skip_download': False, 
 363             # redirect in Refresh HTTP header 
 364             'url': 'https://www.facebook.com/l.php?u=https%3A%2F%2Fwww.youtube.com%2Fwatch%3Fv%3DpO8h3EaFRdo&h=TAQHsoToz&enc=AZN16h-b6o4Zq9pZkCCdOLNKMN96BbGMNtcFwHSaazus4JHT_MFYkAA-WARTX2kvsCIdlAIyHZjl6d33ILIJU7Jzwk_K3mcenAXoAzBNoZDI_Q7EXGDJnIhrGkLXo_LJ_pAa2Jzbx17UHMd3jAs--6j2zaeto5w9RTn8T_1kKg3fdC5WPX9Dbb18vzH7YFX0eSJmoa6SP114rvlkw6pkS1-T&s=1', 
 368                 'title': 'Tripeo Boiler Room x Dekmantel Festival DJ Set', 
 369                 'description': 'md5:6294cc1af09c4049e0652b51a2df10d5', 
 370                 'upload_date': '20150917', 
 371                 'uploader_id': 'brtvofficial', 
 372                 'uploader': 'Boiler Room', 
 375                 'skip_download': False, 
 379             'url': 'http://www.hodiho.fr/2013/02/regis-plante-sa-jeep.html', 
 380             'md5': '85b90ccc9d73b4acd9138d3af4c27f89', 
 382                 'id': '13601338388002', 
 384                 'uploader': 'www.hodiho.fr', 
 385                 'title': 'R\u00e9gis plante sa Jeep', 
 388         # bandcamp page with custom domain 
 390             'add_ie': ['Bandcamp'], 
 391             'url': 'http://bronyrock.com/track/the-pony-mash', 
 395                 'title': 'The Pony Mash', 
 396                 'uploader': 'M_Pallante', 
 398             'skip': 'There is a limit of 200 free downloads / month for the test song', 
 401             # embedded brightcove video 
 402             # it also tests brightcove videos that need to set the 'Referer' 
 403             # in the http requests 
 404             'add_ie': ['BrightcoveLegacy'], 
 405             'url': 'http://www.bfmtv.com/video/bfmbusiness/cours-bourse/cours-bourse-l-analyse-technique-154522/', 
 407                 'id': '2765128793001', 
 409                 'title': 'Le cours de bourse : lāanalyse technique', 
 410                 'description': 'md5:7e9ad046e968cb2d1114004aba466fd9', 
 411                 'uploader': 'BFM BUSINESS', 
 414                 'skip_download': True, 
 418             # embedded with itemprop embedURL and video id spelled as `idVideo` 
 419             'add_id': ['BrightcoveLegacy'], 
 420             'url': 'http://bfmbusiness.bfmtv.com/mediaplayer/chroniques/olivier-delamarche/', 
 422                 'id': '5255628253001', 
 424                 'title': 'md5:37c519b1128915607601e75a87995fc0', 
 425                 'description': 'md5:37f7f888b434bb8f8cc8dbd4f7a4cf26', 
 426                 'uploader': 'BFM BUSINESS', 
 427                 'uploader_id': '876450612001', 
 428                 'timestamp': 1482255315, 
 429                 'upload_date': '20161220', 
 432                 'skip_download': True, 
 436             # https://github.com/ytdl-org/youtube-dl/issues/2253 
 437             'url': 'http://bcove.me/i6nfkrc3', 
 438             'md5': '0ba9446db037002366bab3b3eb30c88c', 
 440                 'id': '3101154703001', 
 442                 'title': 'Still no power', 
 443                 'uploader': 'thestar.com', 
 444                 'description': 'Mississauga resident David Farmer is still out of power as a result of the ice storm a month ago. To keep the house warm, Farmer cuts wood from his property for a wood burning stove downstairs.', 
 446             'add_ie': ['BrightcoveLegacy'], 
 447             'skip': 'video gone', 
 450             'url': 'http://www.championat.com/video/football/v/87/87499.html', 
 451             'md5': 'fb973ecf6e4a78a67453647444222983', 
 453                 'id': '3414141473001', 
 455                 'title': 'ŠŠøŠ“ео. УГаление ŠŠ·Š°Š³Š¾ŠµŠ²Š° (Š¦Š”ŠŠ)', 
 456                 'description': 'ŠŠ½Š»Š°Š¹Š½-ŃŃŠ°Š½ŃŠ»ŃŃŠøŃ маŃŃŠ° Š¦Š”ŠŠ - "ŠŠ¾Š»Š³Š°"', 
 457                 'uploader': 'Championat', 
 461             # https://github.com/ytdl-org/youtube-dl/issues/3541 
 462             'add_ie': ['BrightcoveLegacy'], 
 463             'url': 'http://www.kijk.nl/sbs6/leermijvrouwenkennen/videos/jqMiXKAYan2S/aflevering-1', 
 465                 'id': '3866516442001', 
 467                 'title': 'Leer mij vrouwen kennen: Aflevering 1', 
 468                 'description': 'Leer mij vrouwen kennen: Aflevering 1', 
 469                 'uploader': 'SBS Broadcasting', 
 471             'skip': 'Restricted to Netherlands', 
 473                 'skip_download': True,  # m3u8 download 
 477             # Brightcove video in <iframe> 
 478             'url': 'http://www.un.org/chinese/News/story.asp?NewsID=27724', 
 479             'md5': '36d74ef5e37c8b4a2ce92880d208b968', 
 481                 'id': '5360463607001', 
 483                 'title': 'åå©äŗå¤±ęåæē«„åØåŗå¢äøę¼å±ćåæč·³ć  å¼åč·å¾ę£åøøē«„幓ēę“»', 
 484                 'description': 'čåå½åæē«„åŗéä¼äøäøååéåŗå大使ćä½ę²å®¶ęå¾·Ā·čæŖęå°¼ļ¼Zade Diraniļ¼åØ3ę15ę„åå©äŗå²ēŖēå7åØå¹“ēŗŖåæµę„ä¹é
ååøäŗäøŗåå©äŗč°±åēęę²ćåæč·³ćļ¼HEARTBEATļ¼ļ¼äøŗåå°å
幓å²ēŖå½±åēåå©äŗåæē«„ååŗå¼ŗēååļ¼å¼åäøēååŗå
±ååŖåļ¼ä½æåå©äŗåæē«„éę°č·å¾äŗ«ęę£åøøē«„幓ēę“»ēęå©ć', 
 485                 'uploader': 'United Nations', 
 486                 'uploader_id': '1362235914001', 
 487                 'timestamp': 1489593889, 
 488                 'upload_date': '20170315', 
 490             'add_ie': ['BrightcoveLegacy'], 
 493             # Brightcove with alternative playerID key 
 494             'url': 'http://www.nature.com/nmeth/journal/v9/n7/fig_tab/nmeth.2062_SV1.html', 
 496                 'id': 'nmeth.2062_SV1', 
 497                 'title': 'Simultaneous multiview imaging of the Drosophila syncytial blastoderm : Quantitative high-speed imaging of entire developing embryos with simultaneous multiview light-sheet microscopy : Nature Methods : Nature Research', 
 501                     'id': '2228375078001', 
 503                     'title': 'nmeth.2062-sv1', 
 504                     'description': 'nmeth.2062-sv1', 
 505                     'timestamp': 1363357591, 
 506                     'upload_date': '20130315', 
 507                     'uploader': 'Nature Publishing Group', 
 508                     'uploader_id': '1964492299001', 
 513             # Brightcove with UUID in videoPlayer 
 514             'url': 'http://www8.hp.com/cn/zh/home.html', 
 516                 'id': '5255815316001', 
 518                 'title': 'Sprocket Video - China', 
 519                 'description': 'Sprocket Video - China', 
 520                 'uploader': 'HP-Video Gallery', 
 521                 'timestamp': 1482263210, 
 522                 'upload_date': '20161220', 
 523                 'uploader_id': '1107601872001', 
 526                 'skip_download': True,  # m3u8 download 
 528             'skip': 'video rotates...weekly?', 
 531             # Brightcove:new type [2]. 
 532             'url': 'http://www.delawaresportszone.com/video-st-thomas-more-earns-first-trip-to-basketball-semis', 
 533             'md5': '2b35148fcf48da41c9fb4591650784f3', 
 535                 'id': '5348741021001', 
 537                 'upload_date': '20170306', 
 538                 'uploader_id': '4191638492001', 
 539                 'timestamp': 1488769918, 
 540                 'title': 'VIDEO:  St. Thomas More earns first trip to basketball semis', 
 545             # Alternative brightcove <video> attributes 
 546             'url': 'http://www.programme-tv.net/videos/extraits/81095-guillaume-canet-evoque-les-rumeurs-d-infidelite-de-marion-cotillard-avec-brad-pitt-dans-vivement-dimanche/', 
 548                 'id': '81095-guillaume-canet-evoque-les-rumeurs-d-infidelite-de-marion-cotillard-avec-brad-pitt-dans-vivement-dimanche', 
 549                 'title': "Guillaume Canet eĢvoque les rumeurs d'infideĢliteĢ de Marion Cotillard avec Brad Pitt dans Vivement Dimanche, Extraits : toutes les vidĆ©os avec TĆ©lĆ©-Loisirs", 
 552                 'md5': '732d22ba3d33f2f3fc253c39f8f36523', 
 554                     'id': '5311302538001', 
 556                     'title': "Guillaume Canet eĢvoque les rumeurs d'infideĢliteĢ de Marion Cotillard avec Brad Pitt dans Vivement Dimanche", 
 557                     'description': "Guillaume Canet eĢvoque les rumeurs d'infideĢliteĢ de Marion Cotillard avec Brad Pitt dans Vivement Dimanche (France 2, 5 fĆ©vrier 2017)", 
 558                     'timestamp': 1486321708, 
 559                     'upload_date': '20170205', 
 560                     'uploader_id': '800000640001', 
 562                 'only_matching': True, 
 566             # Brightcove with UUID in videoPlayer 
 567             'url': 'http://www8.hp.com/cn/zh/home.html', 
 569                 'id': '5255815316001', 
 571                 'title': 'Sprocket Video - China', 
 572                 'description': 'Sprocket Video - China', 
 573                 'uploader': 'HP-Video Gallery', 
 574                 'timestamp': 1482263210, 
 575                 'upload_date': '20161220', 
 576                 'uploader_id': '1107601872001', 
 579                 'skip_download': True,  # m3u8 download 
 584             'url': 'http://www.rollingstone.com/music/videos/norwegian-dj-cashmere-cat-goes-spartan-on-with-me-premiere-20131219', 
 585             'md5': '166dd577b433b4d4ebfee10b0824d8ff', 
 587                 'id': 'BwY2RxaTrTkslxOfcan0UCf0YqyvWysJ', 
 589                 'title': '2cc213299525360.mov',  # that's what we get 
 592             'add_ie': ['Ooyala'], 
 595             # ooyala video embedded with http://player.ooyala.com/iframe.js 
 596             'url': 'http://www.macrumors.com/2015/07/24/steve-jobs-the-man-in-the-machine-first-trailer/', 
 598                 'id': 'p0MGJndjoG5SOKqO_hZJuZFPB-Tr5VgB', 
 600                 'title': '"Steve Jobs: Man in the Machine" trailer', 
 601                 'description': 'The first trailer for the Alex Gibney documentary "Steve Jobs: Man in the Machine."', 
 605                 'skip_download': True, 
 607             'skip': 'movie expired', 
 609         # ooyala video embedded with http://player.ooyala.com/static/v4/production/latest/core.min.js 
 611             'url': 'http://wnep.com/2017/07/22/steampunk-fest-comes-to-honesdale/', 
 613                 'id': 'lwYWYxYzE6V5uJMjNGyKtwwiw9ZJD7t2', 
 615                 'title': 'Steampunk Fest Comes to Honesdale', 
 619                 'skip_download': True, 
 624             'url': 'http://www.tested.com/science/weird/460206-tested-grinding-coffee-2000-frames-second/', 
 628                 'title': 'Tested: Grinding Coffee at 2000 Frames Per Second', 
 629                 'upload_date': '20140225', 
 630                 'description': 'md5:06a40fbf30b220468f1e0957c0f558ff', 
 631                 'uploader': 'Tested', 
 632                 'uploader_id': 'testedcom', 
 634             # No need to test YoutubeIE here 
 636                 'skip_download': True, 
 641             'url': 'http://www.theguardian.com/world/2014/mar/11/obama-zach-galifianakis-between-two-ferns', 
 645                 'title': 'Between Two Ferns with Zach Galifianakis: President Barack Obama', 
 646                 'description': 'Episode 18: President Barack Obama sits down with Zach Galifianakis for his most memorable interview yet.', 
 648             # HEAD requests lead to endless 301, while GET is OK 
 649             'expected_warnings': ['301'], 
 653             'url': 'http://www.rg.ru/2014/03/15/reg-dfo/anklav-anons.html', 
 657                 'title': 'ŠŃ
оŃŃŠŗŠ¾Šµ Š¼Š¾ŃŠµ ŃŃŠ°Š»Š¾ ŃŠµŠ»ŠøŠŗŠ¾Š¼ ŃŠ¾ŃŃŠøŠ¹Ńким', 
 658                 'description': 'md5:5ed62483b14663e2a95ebbe115eb8f43', 
 662                 'skip_download': True, 
 667             'url': 'http://sch1298sz.mskobr.ru/dou_edu/karamel_ki/filial_galleries/video/iframe_src_http_tvc_ru_video_iframe_id_55304_isplay_false_acc_video_id_channel_brand_id_11_show_episodes_episode_id_32307_frameb/', 
 671                 'title': 'ŠŠ¾ŃŠŗŠ¾Š»ŃŠ½Š¾Šµ Š²Š¾ŃŠæŠøŃŠ°Š½ŠøŠµ', 
 676             'url': 'http://www.vestifinance.ru/articles/25753', 
 679                 'title': 'ŠŃŃŠ¼Ńе ŃŃŠ°Š½ŃŠ»ŃŃŠøŠø Ń Š¤Š¾ŃŃŠ¼Š°-вŃŃŃŠ°Š²ŠŗŠø "ŠŠ¾Ńзаказ-2013"', 
 684                     'title': 'ŠŠ¾Ńзаказ. ŠŠµŠ½Ń 3', 
 690                     'title': 'ŠŠ¾Ńзаказ. ŠŠµŠ½Ń 2', 
 696                     'title': 'ŠŠ¾Ńзаказ. ŠŠµŠ½Ń 1', 
 702                 'skip_download': True, 
 707             'url': 'http://www.kinomyvi.tv/news/detail/Pervij-dublirovannij-trejler--Uzhastikov-_nOw1', 
 709                 'id': 'f4dafcad-ff21-423d-89b5-146cfd89fa1e', 
 711                 'title': 'УжаŃŃŠøŠŗŠø, ŃŃŃŃŠŗŠøŠ¹ ŃŃŠµŠ¹Š»ŠµŃ (2015)', 
 712                 'thumbnail': r
're:^https?://.*\.jpg$', 
 718             'url': 'http://www.numisc.com/forum/showthread.php?11696-FM15-which-pumiscer-was-this-%28-vid-%29-%28-alfa-as-fuck-srx-%29&s=711f5db534502e22260dec8c5e2d66d8', 
 721                 'title': '[NSFL] [FM15] which pumiscer was this ( vid ) ( alfa as fuck srx )', 
 723             'playlist_mincount': 7, 
 724             # This forum does not allow <iframe> syntaxes anymore 
 725             # Now HTML tags are displayed as-is 
 726             'skip': 'No videos on this page', 
 730             'url': 'http://en.support.wordpress.com/videos/ted-talks/', 
 731             'md5': '65fdff94098e4a607385a60c5177c638', 
 735                 'title': 'Hidden miracles of the natural world', 
 736                 'uploader': 'Louie Schwartzberg', 
 737                 'description': 'md5:8145d19d320ff3e52f28401f4c4283b9', 
 740         # nowvideo embed hidden behind percent encoding 
 742             'url': 'http://www.waoanime.tv/the-super-dimension-fortress-macross-episode-1/', 
 743             'md5': '2baf4ddd70f697d94b1c18cf796d5107', 
 745                 'id': '06e53103ca9aa', 
 747                 'title': 'Macross Episode 001  Watch Macross Episode 001 onl', 
 748                 'description': 'No description', 
 753             'url': 'http://www.tv-replay.fr/redirection/20-03-14/x-enius-arte-10753389.html', 
 754             'md5': '7653032cbb25bf6c80d80f217055fa43', 
 756                 'id': '048195-004_PLUS7-F', 
 759                 'description': 'md5:d5fdf32ef6613cdbfd516ae658abf168', 
 760                 'upload_date': '20140320', 
 763                 'skip_download': 'Requires rtmpdump' 
 765             'skip': 'video gone', 
 769             'url': 'http://www.tsprod.com/replay-du-concert-alcaline-de-calogero', 
 773                 'title': 'Alcaline, le concert avec Calogero', 
 774                 'description': 'md5:61f08036dcc8f47e9cfc33aed08ffaff', 
 775                 'upload_date': '20150226', 
 776                 'timestamp': 1424989860, 
 781                 'skip_download': True, 
 783             'expected_warnings': [ 
 789             'url': 'http://www.wired.com/2014/04/honda-asimo/', 
 790             'md5': 'ba0dfe966fa007657bd1443ee672db0f', 
 792                 'id': '53501be369702d3275860000', 
 794                 'title': 'Hondaās  New Asimo Robot Is More Human Than Ever', 
 799             'url': 'http://www.spi0n.com/zap-spi0n-com-n216/', 
 800             'md5': '441aeeb82eb72c422c7f14ec533999cd', 
 802                 'id': 'k2mm4bCdJ6CQ2i7c8o2', 
 804                 'title': 'Le Zap de Spi0n n°216 - Zapping du Web', 
 805                 'description': 'md5:faf028e48a461b8b7fad38f1e104b119', 
 807                 'uploader_id': 'xgditw', 
 808                 'upload_date': '20140425', 
 809                 'timestamp': 1398441542, 
 811             'add_ie': ['Dailymotion'], 
 815             'url': 'http://www.bumm.sk/krimi/2017/07/05/biztonsagi-kamera-buktatta-le-az-agg-ferfit-utlegelo-apolot', 
 819                 'title': 'Care worker punches elderly dementia patient in head 11 times', 
 820                 'description': 'md5:3a743dee84e57e48ec68bf67113199a5', 
 822             'add_ie': ['DailyMail'], 
 824                 'skip_download': True, 
 829             'url': 'http://www.badzine.de/ansicht/datum/2014/06/09/so-funktioniert-die-neue-englische-badminton-liga.html', 
 833                 'title': 'The NBL Auction 2014', 
 834                 'uploader': 'BADMINTON England', 
 835                 'uploader_id': 'BADMINTONEvents', 
 836                 'upload_date': '20140603', 
 837                 'description': 'md5:9ef128a69f1e262a700ed83edb163a73', 
 839             'add_ie': ['Youtube'], 
 841                 'skip_download': True, 
 846             'url': 'http://www.vulture.com/2016/06/new-key-peele-sketches-released.html', 
 847             'md5': 'ca1aef97695ef2c1d6973256a57e5252', 
 849                 'id': '769f7ec0-0692-4d62-9b45-0d88074bffc1', 
 851                 'title': 'Key and Peele|October 10, 2012|2|203|Liam Neesons - Uncensored', 
 852                 'description': 'Two valets share their love for movie star Liam Neesons.', 
 853                 'timestamp': 1349922600, 
 854                 'upload_date': '20121011', 
 857         # YouTube embed via <data-embed-url=""> 
 859             'url': 'https://play.google.com/store/apps/details?id=com.gameloft.android.ANMP.GloftA8HM', 
 863                 'title': 'Asphalt 8: Airborne - Update - Welcome to Dubai!', 
 864                 'uploader': 'Gameloft', 
 865                 'uploader_id': 'gameloft', 
 866                 'upload_date': '20140828', 
 867                 'description': 'md5:c80da9ed3d83ae6d1876c834de03e1c4', 
 870                 'skip_download': True, 
 873         # YouTube <object> embed 
 875             'url': 'http://www.improbable.com/2017/04/03/untrained-modern-youths-and-ancient-masters-in-selfie-portraits/', 
 876             'md5': '516718101ec834f74318df76259fb3cc', 
 880                 'title': 'Feynman: Mirrors FUN TO IMAGINE 6', 
 881                 'upload_date': '20080526', 
 882                 'description': 'md5:0ffc78ea3f01b2e2c247d5f8d1d3c18d', 
 883                 'uploader': 'Christopher Sykes', 
 884                 'uploader_id': 'ChristopherJSykes', 
 886             'add_ie': ['Youtube'], 
 890             'url': 'http://www.ll.mit.edu/workshops/education/videocourses/antennas/lecture1/video/', 
 892                 'md5': '0c5e352edabf715d762b0ad4e6d9ee67', 
 894                     'id': 'Fenn-AA_PA_Radar_Course_Lecture_1c_Final', 
 895                     'title': 'Fenn-AA_PA_Radar_Course_Lecture_1c_Final - video1', 
 900                 'md5': '10e4bb3aaca9fd630e273ff92d9f3c63', 
 902                     'id': 'Fenn-AA_PA_Radar_Course_Lecture_1c_Final_PIP', 
 903                     'title': 'Fenn-AA_PA_Radar_Course_Lecture_1c_Final - pip', 
 909                 'title': 'Fenn-AA_PA_Radar_Course_Lecture_1c_Final', 
 914             'url': 'http://www.handjobhub.com/video/busty-blonde-siri-tit-fuck-while-wank-6313.html', 
 915             'md5': '9d65602bf31c6e20014319c7d07fba27', 
 917                 'id': '5123ea6d5e5a7', 
 920                 'uploader': 'www.handjobhub.com', 
 921                 'title': 'Busty Blonde Siri Tit Fuck While Wank at HandjobHub.com', 
 924         # Multiple brightcove videos 
 925         # https://github.com/ytdl-org/youtube-dl/issues/2283 
 927             'url': 'http://www.newyorker.com/online/blogs/newsdesk/2014/01/always-never-nuclear-command-and-control.html', 
 929                 'id': 'always-never', 
 930                 'title': 'Always / Never - The New Yorker', 
 934                 'extract_flat': False, 
 935                 'skip_download': True, 
 940             'url': 'http://umpire-empire.com/index.php/topic/58125-laz-decides-no-thats-low/', 
 941             'md5': '96f09a37e44da40dd083e12d9a683327', 
 945                 'title': 'Ump changes call to ball', 
 946                 'description': 'md5:71c11215384298a172a6dcb4c2e20685', 
 948                 'timestamp': 1401537900, 
 949                 'upload_date': '20140531', 
 950                 'thumbnail': r
're:^https?://.*\.jpg$', 
 955             'url': 'http://study.com/academy/lesson/north-american-exploration-failed-colonies-of-spain-france-england.html#lesson', 
 956             'md5': '1953f3a698ab51cfc948ed3992a0b7ff', 
 960                 'title': 'paywall_north-american-exploration-failed-colonies-of-spain-france-england', 
 961                 'description': 'a Paywall Videos video from Remilon', 
 963                 'uploader': 'study.com', 
 964                 'timestamp': 1459678540, 
 965                 'upload_date': '20160403', 
 966                 'filesize': 24687186, 
 970             'url': 'http://thoughtworks.wistia.com/medias/uxjb0lwrcz', 
 971             'md5': 'baf49c2baa8a7de5f3fc145a8506dcd4', 
 975                 'title': 'Conversation about Hexagonal Rails Part 1', 
 976                 'description': 'a Martin Fowler video from ThoughtWorks', 
 978                 'uploader': 'thoughtworks.wistia.com', 
 979                 'timestamp': 1401832161, 
 980                 'upload_date': '20140603', 
 983         # Wistia standard embed (async) 
 985             'url': 'https://www.getdrip.com/university/brennan-dunn-drip-workshop/', 
 989                 'title': 'Drip Brennan Dunn Workshop', 
 990                 'description': 'a JV Webinars video from getdrip-1', 
 992                 'timestamp': 1463607249, 
 993                 'upload_date': '20160518', 
 996                 'skip_download': True, 
1001             'url': 'http://nakedsecurity.sophos.com/2014/10/29/sscc-171-are-you-sure-that-1234-is-a-bad-password-podcast/', 
1005                 'description': 'md5:ff867d6b555488ad3c52572bb33d432c', 
1006                 'uploader': 'Sophos Security', 
1007                 'title': 'Chet Chat 171 - Oct 29, 2014', 
1008                 'upload_date': '20141029', 
1011         # Soundcloud multiple embeds 
1013             'url': 'http://www.guitarplayer.com/lessons/1014/legato-workout-one-hour-to-more-fluid-performance---tab/52809', 
1016                 'title': 'Guitar Essentials: Legato WorkoutāOne-Hour to Fluid Performance  | TAB + AUDIO', 
1018             'playlist_mincount': 7, 
1020         # TuneIn station embed 
1022             'url': 'http://radiocnrv.com/promouvoir-radio-cnrv/', 
1027                 'location': 'Paris, France', 
1032                 'skip_download': True, 
1037             'url': 'http://www.esa.int/Our_Activities/Space_Science/Rosetta/Philae_comet_touch-down_webcast', 
1041                 'upload_date': '20141112', 
1042                 'title': 'Rosetta #CometLanding webcast HL 10', 
1045         # Another Livestream embed, without 'new.' in URL 
1047             'url': 'https://www.freespeech.org/', 
1051                 'title': 're:^FSTV [0-9]{4}-[0-9]{2}-[0-9]{2} [0-9]{2}:[0-9]{2}$', 
1055                 'skip_download': True, 
1060             'url': 'https://skiplagged.com/', 
1063                 'title': 'Skiplagged: The smart way to find cheap flights', 
1065             'playlist_mincount': 1, 
1066             'add_ie': ['Youtube'], 
1070             'url': 'http://undergroundwellness.com/podcasts/306-5-steps-to-permanent-gut-healing/', 
1074                 'upload_date': '20141126', 
1075                 'title': 'Jack Tips: 5 Steps to Permanent Gut Healing', 
1080             'url': 'http://www.abc.net.au/7.30/content/2015/s4164797.htm', 
1082                 'id': '730m_DandD_1901_512k', 
1084                 'uploader': 'www.abc.net.au', 
1085                 'title': 'Game of Thrones with dice - Dungeons and Dragons fantasy role-playing game gets new life - 19/01/2015', 
1088         # embedded viddler video 
1090             'url': 'http://deadspin.com/i-cant-stop-watching-john-wall-chop-the-nuggets-with-th-1681801597', 
1094                 'uploader': 'deadspin', 
1095                 'title': 'WALL-TO-GORTAT', 
1096                 'timestamp': 1422285291, 
1097                 'upload_date': '20150126', 
1099             'add_ie': ['Viddler'], 
1103             'url': 'http://thedailyshow.cc.com/podcast/episodetwelve', 
1107                 'title': "The Daily Show Podcast without Jon Stewart - Episode 12: Bassem Youssef: Egypt's Jon Stewart", 
1108                 'description': 'md5:601cb790edd05908957dae8aaa866465', 
1109                 'upload_date': '20150220', 
1111             'skip': 'All The Daily Show URLs now redirect to http://www.cc.com/shows/', 
1115             'url': 'http://media.nationalarchives.gov.uk/index.php/webinar-using-discovery-national-archives-online-catalogue/', 
1117                 'id': 'Mrj4DVp2zeA', 
1119                 'upload_date': '20150212', 
1120                 'uploader': 'The National Archives UK', 
1121                 'description': 'md5:8078af856dca76edc42910b61273dbbf', 
1122                 'uploader_id': 'NationalArchives08', 
1123                 'title': 'Webinar: Using Discovery, The National Archivesā online catalogue', 
1128             'url': 'http://www.suffolk.edu/sjc/live.php', 
1132                 'title': 'Massachusetts Supreme Judicial Court Oral Arguments', 
1133                 'uploader': 'www.suffolk.edu', 
1136                 'skip_download': True, 
1138             'skip': 'Only has video a few mornings per month, see http://www.suffolk.edu/sjc/', 
1142             'url': 'http://www.indiedb.com/games/king-machine/videos', 
1146                 'title': 'king machine trailer 1', 
1147                 'description': 'Browse King Machine videos & audio for sweet media. Your eyes will thank you.', 
1148                 'thumbnail': r
're:^https?://.*\.jpg$', 
1152             # JWPlayer config passed as variable 
1153             'url': 'http://www.txxx.com/videos/3326530/ariele/', 
1157                 'title': 'ARIELE | Tube Cup', 
1158                 'uploader': 'www.txxx.com', 
1162                 'skip_download': True, 
1167             'url': 'https://www.mediaite.com/tv/dem-senator-claims-gary-cohn-faked-a-bad-connection-during-trump-call-to-get-him-off-the-phone/', 
1168             'md5': 'ca00a040364b5b439230e7ebfd02c4e9', 
1172                 'upload_date': '20171122', 
1173                 'timestamp': 1511366290, 
1174                 'title': 'Dem Senator Claims Gary Cohn Faked a Bad Connection During Trump Call to Get Him Off the Phone', 
1176             'add_ie': [JWPlatformIE
.ie_key()], 
1179             # Video.js embed, multiple formats 
1180             'url': 'http://ortcam.com/solidworks-ŃŃŠ¾Šŗ-6-наŃŃŃŠ¾Š¹ŠŗŠ°-ŃŠµŃŃŠµŠ¶Š°_33f9b7351.html', 
1182                 'id': 'yygqldloqIk', 
1184                 'title': 'SolidWorks. Š£ŃŠ¾Šŗ 6 ŠŠ°ŃŃŃŠ¾Š¹ŠŗŠ° ŃŠµŃŃŠµŠ¶Š°', 
1185                 'description': 'md5:baf95267792646afdbf030e4d06b2ab3', 
1186                 'upload_date': '20130314', 
1187                 'uploader': 'PROŃŃŠ¾Šµ3D', 
1188                 'uploader_id': 'PROstoe3D', 
1191                 'skip_download': True, 
1195             # Video.js embed, single format 
1196             'url': 'https://www.vooplayer.com/v3/watch/watch.php?v=NzgwNTg=', 
1200                 'title': 'Step 1 -  Good Foundation', 
1201                 'description': 'md5:d1e7ff33a29fc3eb1673d6c270d344f4', 
1204                 'skip_download': True, 
1209             'url': 'http://www.rtlnieuws.nl/nieuws/buitenland/aanslagen-kopenhagen', 
1210             'playlist_mincount': 5, 
1212                 'id': 'aanslagen-kopenhagen', 
1213                 'title': 'Aanslagen Kopenhagen', 
1218             'url': 'http://www.skipass.com/news/116090-bon-appetit-s5ep3-baqueira-mi-cor.html', 
1222                 'title': 'EP3S5 - Bon AppƩtit - Baqueira Mi Corazon !', 
1225         # Kaltura embed (different embed code) 
1227             'url': 'http://www.premierchristianradio.com/Shows/Saturday/Unbelievable/Conference-Videos/Os-Guinness-Is-It-Fools-Talk-Unbelievable-Conference-2014', 
1231                 'upload_date': '20150127', 
1232                 'uploader_id': 'PremierMedia', 
1234                 'title': 'Os Guinness // Is It Fools Talk? // Unbelievable? Conference 2014', 
1237         # Kaltura embed with single quotes 
1239             'url': 'http://fod.infobase.com/p_ViewPlaylist.aspx?AssignmentID=NUN8ZY', 
1244                 'timestamp': 1355743100, 
1245                 'upload_date': '20121217', 
1246                 'uploader_id': 'cplapp@learn360.com', 
1248             'add_ie': ['Kaltura'], 
1251             # Kaltura embedded via quoted entry_id 
1252             'url': 'https://www.oreilly.com/ideas/my-cloud-makes-pretty-pictures', 
1256                 'title': '06_matthew_brender_raj_dutt', 
1257                 'timestamp': 1466638791, 
1258                 'upload_date': '20160622', 
1260             'add_ie': ['Kaltura'], 
1261             'expected_warnings': [ 
1262                 'Could not send HEAD request' 
1265                 'skip_download': True, 
1269             # Kaltura embedded, some fileExt broken (#11480) 
1270             'url': 'http://www.cornell.edu/video/nima-arkani-hamed-standard-models-of-particle-physics', 
1274                 'title': 'Our "Standard Models" of particle physics and cosmology', 
1275                 'description': 'md5:67ea74807b8c4fea92a6f38d6d323861', 
1276                 'timestamp': 1321158993, 
1277                 'upload_date': '20111113', 
1278                 'uploader_id': 'kps1', 
1280             'add_ie': ['Kaltura'], 
1283             # Kaltura iframe embed 
1284             'url': 'http://www.gsd.harvard.edu/event/i-m-pei-a-centennial-celebration/', 
1285             'md5': 'ae5ace8eb09dc1a35d03b579a9c2cc44', 
1289                 'title': 'I. M. Pei: A Centennial Celebration', 
1290                 'description': 'md5:1db8f40c69edc46ca180ba30c567f37c', 
1291                 'upload_date': '20170403', 
1292                 'uploader_id': 'batchUser', 
1293                 'timestamp': 1491232186, 
1295             'add_ie': ['Kaltura'], 
1298             # Kaltura iframe embed, more sophisticated 
1299             'url': 'http://www.cns.nyu.edu/~eero/math-tools/Videos/lecture-05sep2017.html', 
1303                 'title': 'lecture-05sep2017', 
1304                 'description': 'md5:40f347d91fd4ba047e511c5321064b49', 
1305                 'upload_date': '20170913', 
1306                 'uploader_id': 'eps2', 
1307                 'timestamp': 1505340777, 
1310                 'skip_download': True, 
1312             'add_ie': ['Kaltura'], 
1315             # meta twitter:player 
1316             'url': 'http://thechive.com/2017/12/08/all-i-want-for-christmas-is-more-twerk/', 
1320                 'title': 'Main Twerk (Video)', 
1321                 'upload_date': '20171208', 
1322                 'uploader_id': 'sebastian.salinas@thechive.com', 
1323                 'timestamp': 1512713057, 
1326                 'skip_download': True, 
1328             'add_ie': ['Kaltura'], 
1330         # referrer protected EaglePlatform embed 
1332             'url': 'https://tvrain.ru/lite/teleshow/kak_vse_nachinalos/namin-418921/', 
1336                 'title': 'Š”ŃŠ°Ń ŠŠ°Š¼ŠøŠ½: Ā«ŠŃ наŃŃŃŠøŠ»Šø ГевŃŃŠ²ŠµŠ½Š½Š¾ŃŃŃ ŠŃемлŃĀ»', 
1337                 'thumbnail': r
're:^https?://.*\.jpg$', 
1342                 'skip_download': True, 
1345         # ClipYou (EaglePlatform) embed (custom URL) 
1347             'url': 'http://muz-tv.ru/play/7129/', 
1348             # Not checking MD5 as sometimes the direct HTTP link results in 404 and HLS is used 
1352                 'title': "'O Sole Mio", 
1353                 'thumbnail': r
're:^https?://.*\.jpg$', 
1358                 'skip_download': True, 
1360             'skip': 'This video is unavailable.', 
1364             'url': 'http://muz-tv.ru/kinozal/view/7400/', 
1368                 'title': 'Š¢Š°Š¹Š½Ń ŠæŠµŃŠµŠ²Š°Š»Š° ŠŃŃŠ»Š¾Š²Š° ⢠1 ŃŠµŃŠøŃ 2 ŃŠ°ŃŃŃ', 
1369                 'description': 'ŠŠ¾ŠŗŃŠ¼ŠµŠ½ŃŠ°Š»ŃŠ½ŃŠ¹ ŃŠµŃиал-ŃŠ°ŃŃŠ»ŠµŠ“ование оГной ŠøŠ· ŃŠ°Š¼ŃŃ
 жŃŃŠŗŠøŃ
 ŃŠ°Š¹Š½ ЄЄ века', 
1370                 'thumbnail': r
're:^https?://.*\.jpg$', 
1374             'skip': 'HTTP Error 404: Not Found', 
1378             'url': 'http://www.cinemablend.com/new/First-Joe-Dirt-2-Trailer-Teaser-Stupid-Greatness-70874.html', 
1382                 'title': 'Joe Dirt 2 Beautiful Loser Teaser Trailer', 
1383                 'thumbnail': r
're:^https?://.*\.png$', 
1389             'url': 'http://techcrunch.com/video/facebook-creates-on-this-day-crunch-report/518726732/', 
1390             'md5': '4c6f127a30736b59b3e2c19234ee2bf7', 
1394                 'title': 'Facebook Creates "On This Day" | Crunch Report', 
1395                 'description': 'Amazon updates Fire TV line, Tesla\'s Model X spotted in the wild', 
1396                 'timestamp': 1427237531, 
1397                 'uploader': 'Crunch Report', 
1398                 'upload_date': '20150324', 
1402                 'skip_download': True, 
1405         # Crooks and Liars embed 
1407             'url': 'http://crooksandliars.com/2015/04/fox-friends-says-protecting-atheists', 
1411                 'title': "Fox & Friends Says Protecting Atheists From Discrimination Is Anti-Christian!", 
1412                 'description': 'md5:e1a46ad1650e3a5ec7196d432799127f', 
1413                 'timestamp': 1428207000, 
1414                 'upload_date': '20150405', 
1415                 'uploader': 'Heather', 
1418         # Crooks and Liars external embed 
1420             'url': 'http://theothermccain.com/2010/02/02/video-proves-that-bill-kristol-has-been-watching-glenn-beck/comment-page-1/', 
1422                 'id': 'MTE3MjUtMzQ2MzA', 
1424                 'title': 'md5:5e3662a81a4014d24c250d76d41a08d5', 
1425                 'description': 'md5:9b8e9542d6c3c5de42d6451b7d780cec', 
1426                 'timestamp': 1265032391, 
1427                 'upload_date': '20100201', 
1428                 'uploader': 'Heather', 
1431         # NBC Sports vplayer embed 
1433             'url': 'http://www.riderfans.com/forum/showthread.php?121827-Freeman&s=e98fa1ea6dc08e886b1678d35212494a', 
1435                 'id': 'ln7x1qSThw4k', 
1437                 'title': "PFT Live: New leader in the 'new-look' defense", 
1438                 'description': 'md5:65a19b4bbfb3b0c0c5768bed1dfad74e', 
1439                 'uploader': 'NBCU-SPORTS', 
1440                 'upload_date': '20140107', 
1441                 'timestamp': 1389118457, 
1443             'skip': 'Invalid Page URL', 
1447             'url': 'http://www.vulture.com/2016/06/letterman-couldnt-care-less-about-late-night.html', 
1448             'md5': '1aa589c675898ae6d37a17913cf68d66', 
1450                 'id': 'x_dtl_oa_LettermanliftPR_160608', 
1452                 'title': 'David Letterman: A Preview', 
1453                 'description': 'A preview of Tom Brokaw\'s interview with David Letterman as part of the On Assignment series powered by Dateline. Airs Sunday June 12 at 7/6c.', 
1454                 'upload_date': '20160609', 
1455                 'timestamp': 1465431544, 
1456                 'uploader': 'NBCU-NEWS', 
1461             'url': 'https://video.udn.com/news/300346', 
1462             'md5': 'fd2060e988c326991037b9aff9df21a6', 
1466                 'title': 'äøäøäøē·åø«č®ę§ å
Øę ”åø«ēåęŗ', 
1467                 'thumbnail': r
're:^https?://.*\.jpg$', 
1471                 'skip_download': True, 
1473             'expected_warnings': ['Failed to parse JSON Expecting value'], 
1475         # Brightcove URL in single quotes 
1477             'url': 'http://www.sportsnet.ca/baseball/mlb/sn-presents-russell-martin-world-citizen/', 
1478             'md5': '4ae374f1f8b91c889c4b9203c8c752af', 
1480                 'id': '4255764656001', 
1482                 'title': 'SN Presents: Russell Martin, World Citizen', 
1483                 'description': 'To understand why he was the Toronto Blue Jaysā top off-season priority is to appreciate his background and upbringing in Montreal, where he first developed his baseball skills. Written and narrated by Stephen Brunt.', 
1484                 'uploader': 'Rogers Sportsnet', 
1485                 'uploader_id': '1704050871', 
1486                 'upload_date': '20150525', 
1487                 'timestamp': 1432570283, 
1490         # OnionStudios embed 
1492             'url': 'http://www.clickhole.com/video/dont-understand-bitcoin-man-will-mumble-explanatio-2537', 
1496                 'title': 'Donāt Understand Bitcoin? This Man Will Mumble An Explanation At You', 
1497                 'thumbnail': r
're:^https?://.*\.jpe?g$', 
1498                 'uploader': 'ClickHole', 
1499                 'uploader_id': 'clickhole', 
1504             'url': 'http://whilewewatch.blogspot.ru/2012/06/whilewewatch-whilewewatch-gripping.html', 
1506                 'id': '74849a00-85a9-11e1-9660-123139220831', 
1508                 'title': '#whilewewatch', 
1511         # AdobeTVVideo embed 
1513             'url': 'https://helpx.adobe.com/acrobat/how-to/new-experience-acrobat-dc.html?set=acrobat--get-started--essential-beginners', 
1514             'md5': '43662b577c018ad707a63766462b1e87', 
1518                 'title': 'New experience with Acrobat DC', 
1519                 'description': 'New experience with Acrobat DC', 
1520                 'duration': 248.667, 
1523         # BrightcoveInPageEmbed embed 
1525             'url': 'http://www.geekandsundry.com/tabletop-bonus-wils-final-thoughts-on-dread/', 
1527                 'id': '4238694884001', 
1529                 'title': 'Tabletop: Dread, Last Thoughts', 
1530                 'description': 'Tabletop: Dread, Last Thoughts', 
1534         # Brightcove embed, with no valid 'renditions' but valid 'IOSRenditions' 
1535         # This video can't be played in browsers if Flash disabled and UA set to iPhone, which is actually a false alarm 
1537             'url': 'https://dl.dropboxusercontent.com/u/29092637/interview.html', 
1539                 'id': '4785848093001', 
1541                 'title': 'The Cardinal Pell Interview', 
1542                 'description': 'Sky News Contributor Andrew Bolt interviews George Pell in Rome, following the Cardinal\'s evidence before the Royal Commission into Child Abuse. ', 
1543                 'uploader': 'GlobeCast Australia - GlobeStream', 
1544                 'uploader_id': '2733773828001', 
1545                 'upload_date': '20160304', 
1546                 'timestamp': 1457083087, 
1550                 'skip_download': True, 
1554             # Brightcove embed with whitespace around attribute names 
1555             'url': 'http://www.stack.com/video/3167554373001/learn-to-hit-open-three-pointers-with-damian-lillard-s-baseline-drift-drill', 
1557                 'id': '3167554373001', 
1559                 'title': "Learn to Hit Open Three-Pointers With Damian Lillard's Baseline Drift Drill", 
1560                 'description': 'md5:57bacb0e0f29349de4972bfda3191713', 
1561                 'uploader_id': '1079349493', 
1562                 'upload_date': '20140207', 
1563                 'timestamp': 1391810548, 
1566                 'skip_download': True, 
1569         # Another form of arte.tv embed 
1571             'url': 'http://www.tv-replay.fr/redirection/09-04-16/arte-reportage-arte-11508975.html', 
1572             'md5': '850bfe45417ddf221288c88a0cffe2e2', 
1574                 'id': '030273-562_PLUS7-F', 
1576                 'title': 'ARTE Reportage - Nulle part, en France', 
1577                 'description': 'md5:e3a0e8868ed7303ed509b9e3af2b870d', 
1578                 'upload_date': '20160409', 
1583             'url': 'http://www.wykop.pl/link/3088787/', 
1584             'md5': '7619da8c820e835bef21a1efa2a0fc71', 
1586                 'id': '874_1459135191', 
1588                 'title': 'Man shows poor quality of new apartment building', 
1589                 'description': 'The wall is like a sand pile.', 
1590                 'uploader': 'Lake8737', 
1592             'add_ie': [LiveLeakIE
.ie_key()], 
1594         # Another LiveLeak embed pattern (#13336) 
1596             'url': 'https://milo.yiannopoulos.net/2017/06/concealed-carry-robbery/', 
1598                 'id': '2eb_1496309988', 
1600                 'title': 'Thief robs place where everyone was armed', 
1601                 'description': 'md5:694d73ee79e535953cf2488562288eee', 
1602                 'uploader': 'brazilwtf', 
1604             'add_ie': [LiveLeakIE
.ie_key()], 
1606         # Duplicated embedded video URLs 
1608             'url': 'http://www.hudl.com/athlete/2538180/highlights/149298443', 
1610                 'id': '149298443_480_16c25b74_2', 
1612                 'title': 'vs. Blue Orange Spring Game', 
1613                 'uploader': 'www.hudl.com', 
1616         # twitter:player:stream embed 
1618             'url': 'http://www.rtl.be/info/video/589263.aspx?CategoryID=288', 
1622                 'title': 'Une nouvelle espèce de dinosaure découverte en Argentine', 
1623                 'uploader': 'www.rtl.be', 
1627                 'skip_download': True, 
1630         # twitter:player embed 
1632             'url': 'http://www.theatlantic.com/video/index/484130/what-do-black-holes-sound-like/', 
1633             'md5': 'a3e0df96369831de324f0778e126653c', 
1635                 'id': '4909620399001', 
1637                 'title': 'What Do Black Holes Sound Like?', 
1638                 'description': 'what do black holes sound like', 
1639                 'upload_date': '20160524', 
1640                 'uploader_id': '29913724001', 
1641                 'timestamp': 1464107587, 
1642                 'uploader': 'TheAtlantic', 
1644             'add_ie': ['BrightcoveLegacy'], 
1646         # Facebook <iframe> embed 
1648             'url': 'https://www.hostblogger.de/blog/archives/6181-Auto-jagt-Betonmischer.html', 
1649             'md5': 'fbcde74f534176ecb015849146dd3aee', 
1651                 'id': '599637780109885', 
1653                 'title': 'Facebook video #599637780109885', 
1656         # Facebook <iframe> embed, plugin video 
1658             'url': 'http://5pillarsuk.com/2017/06/07/tariq-ramadan-disagrees-with-pr-exercise-by-imams-refusing-funeral-prayers-for-london-attackers/', 
1660                 'id': '1754168231264132', 
1662                 'title': 'About the Imams and Religious leaders refusing to perform funeral prayers for...', 
1663                 'uploader': 'Tariq Ramadan (official)', 
1664                 'timestamp': 1496758379, 
1665                 'upload_date': '20170606', 
1668                 'skip_download': True, 
1671         # Facebook API embed 
1673             'url': 'http://www.lothype.com/blue-stars-2016-preview-standstill-full-show/', 
1674             'md5': 'a47372ee61b39a7b90287094d447d94e', 
1676                 'id': '10153467542406923', 
1678                 'title': 'Facebook video #10153467542406923', 
1681         # Wordpress "YouTube Video Importer" plugin 
1683             'url': 'http://www.lothype.com/blue-devils-drumline-stanford-lot-2016/', 
1684             'md5': 'd16797741b560b485194eddda8121b48', 
1686                 'id': 'HNTXWDXV9Is', 
1688                 'title': 'Blue Devils Drumline Stanford lot 2016', 
1689                 'upload_date': '20160627', 
1690                 'uploader_id': 'GENOCIDE8GENERAL10', 
1691                 'uploader': 'cylus cyrus', 
1695             # video stored on custom kaltura server 
1696             'url': 'http://www.expansion.com/multimedia/videos.html?media=EQcM30NHIPv', 
1697             'md5': '537617d06e64dfed891fa1593c4b30cc', 
1701                 'title': 'Elecciones britƔnicas: 5 lecciones para Rajoy', 
1702                 'description': 'md5:435a89d68b9760b92ce67ed227055f16', 
1703                 'uploader_id': 'videos.expansion@el-mundo.net', 
1704                 'upload_date': '20150429', 
1705                 'timestamp': 1430303472, 
1707             'add_ie': ['Kaltura'], 
1710             # Non-standard Vimeo embed 
1711             'url': 'https://openclassrooms.com/courses/understanding-the-web', 
1712             'md5': '64d86f1c7d369afd9a78b38cbb88d80a', 
1716                 'title': 'Understanding the web - Teaser', 
1717                 'description': 'This is "Understanding the web - Teaser" by openclassrooms on Vimeo, the home for high quality videos and the people who love them.', 
1718                 'upload_date': '20151214', 
1719                 'uploader': 'OpenClassrooms', 
1720                 'uploader_id': 'openclassrooms', 
1722             'add_ie': ['Vimeo'], 
1725             # generic vimeo embed that requires original URL passed as Referer 
1726             'url': 'http://racing4everyone.eu/2016/07/30/formula-1-2016-round12-germany/', 
1727             'only_matching': True, 
1730             'url': 'https://support.arkena.com/display/PLAY/Ways+to+embed+your+video', 
1731             'md5': 'b96f2f71b359a8ecd05ce4e1daa72365', 
1733                 'id': 'b41dda37-d8e7-4d3f-b1b5-9a9db578bdfe', 
1735                 'title': 'Big Buck Bunny', 
1736                 'description': 'Royalty free test video', 
1737                 'timestamp': 1432816365, 
1738                 'upload_date': '20150528', 
1742                 'skip_download': True, 
1744             'add_ie': [ArkenaIE
.ie_key()], 
1747             'url': 'http://nova.bg/news/view/2016/08/16/156543/%D0%BD%D0%B0-%D0%BA%D0%BE%D1%81%D1%8A%D0%BC-%D0%BE%D1%82-%D0%B2%D0%B7%D1%80%D0%B8%D0%B2-%D0%BE%D1%82%D1%86%D0%B5%D0%BF%D0%B8%D1%85%D0%B0-%D1%86%D1%8F%D0%BB-%D0%BA%D0%B2%D0%B0%D1%80%D1%82%D0%B0%D0%BB-%D0%B7%D0%B0%D1%80%D0%B0%D0%B4%D0%B8-%D0%B8%D0%B7%D1%82%D0%B8%D1%87%D0%B0%D0%BD%D0%B5-%D0%BD%D0%B0-%D0%B3%D0%B0%D0%B7-%D0%B2-%D0%BF%D0%BB%D0%BE%D0%B2%D0%B4%D0%B8%D0%B2/', 
1751                 'title': 'ŠŠ ŠŠŠ”ŠŖŠ ŠŠ¢ ŠŠŠ ŠŠ: ŠŠ·ŃŠøŃŠ°Š½Šµ на газ на бензиноŃŃŠ°Š½ŃŠøŃ Š² ŠŠ»Š¾Š²Š“ив', 
1754                 'skip_download': True, 
1756             'add_ie': [Vbox7IE
.ie_key()], 
1760             'url': 'http://www.dagbladet.no/2016/02/23/nyheter/nordlys/ski/troms/ver/43254897/', 
1763                 'title': 'Etter ett Ƅrs planlegging, klaffet endelig alt: - Jeg mƄtte ta en liten dans', 
1765             'playlist_mincount': 3, 
1769             'url': 'http://forum.dvdtalk.com/movie-talk/623756-deleted-magic-star-wars-ot-deleted-alt-scenes-docu-style.html', 
1771                 'id': '623756-deleted-magic-star-wars-ot-deleted-alt-scenes-docu-style', 
1772                 'title': 'Deleted Magic - Star Wars: OT Deleted / Alt. Scenes Docu. Style - DVD Talk Forum', 
1774             'playlist_mincount': 2, 
1778             'url': 'http://www.20min.ch/schweiz/news/story/So-kommen-Sie-bei-Eis-und-Schnee-sicher-an-27032552', 
1782                 'title': 'So kommen Sie bei Eis und Schnee sicher an', 
1783                 'description': 'md5:117c212f64b25e3d95747e5276863f7d', 
1786                 'skip_download': True, 
1788             'add_ie': [TwentyMinutenIE
.ie_key()], 
1792             'url': 'https://en.support.wordpress.com/videopress/', 
1796                 'title': 'IMG_5786', 
1797                 'timestamp': 1435711927, 
1798                 'upload_date': '20150701', 
1801                 'skip_download': True, 
1803             'add_ie': [VideoPressIE
.ie_key()], 
1807             'url': 'http://magazzino.friday.ru/videos/vipuski/kazan-2', 
1809                 'id': '9b3d5bee0a8740bf70dfd29d3ea43541', 
1811                 'title': 'ŠŠ°Š³Š°Š·Š·ŠøŠ½Š¾: ŠŠ°Š·Š°Š½Ń 2', 
1812                 'description': 'md5:99bccdfac2269f0e8fdbc4bbc9db184a', 
1813                 'uploader': 'ŠŠ°Š³Š°Š·Š·ŠøŠ½Š¾', 
1814                 'upload_date': '20170228', 
1815                 'uploader_id': '996642', 
1818                 'skip_download': True, 
1820             'add_ie': [RutubeIE
.ie_key()], 
1823             # ThePlatform embedded with whitespaces in URLs 
1824             'url': 'http://www.golfchannel.com/topics/shows/golftalkcentral.htm', 
1825             'only_matching': True, 
1828             # Senate ISVP iframe https 
1829             'url': 'https://www.hsgac.senate.gov/hearings/canadas-fast-track-refugee-plan-unanswered-questions-and-implications-for-us-national-security', 
1830             'md5': 'fb8c70b0b515e5037981a2492099aab8', 
1832                 'id': 'govtaff020316', 
1834                 'title': 'Integrated Senate Video Player', 
1836             'add_ie': [SenateISVPIE
.ie_key()], 
1839             # Limelight embeds (1 channel embed + 4 media embeds) 
1840             'url': 'http://www.sedona.com/FacilitatorTraining2017', 
1842                 'id': 'FacilitatorTraining2017', 
1843                 'title': 'Facilitator Training 2017', 
1845             'playlist_mincount': 5, 
1848             # Limelight embed (LimelightPlayerUtil.embed) 
1849             'url': 'https://tv5.ca/videos?v=xuu8qowr291ri', 
1851                 'id': '95d035dc5c8a401588e9c0e6bd1e9c92', 
1853                 'title': '07448641', 
1854                 'timestamp': 1499890639, 
1855                 'upload_date': '20170712', 
1858                 'skip_download': True, 
1860             'add_ie': ['LimelightMedia'], 
1863             'url': 'http://kron4.com/2017/04/28/standoff-with-walnut-creek-murder-suspect-ends-with-arrest/', 
1865                 'id': 'standoff-with-walnut-creek-murder-suspect-ends-with-arrest', 
1866                 'title': 'Standoff with Walnut Creek murder suspect ends', 
1867                 'description': 'md5:3ccc48a60fc9441eeccfc9c469ebf788', 
1869             'playlist_mincount': 4, 
1872             # WashingtonPost embed 
1873             'url': 'http://www.vanityfair.com/hollywood/2017/04/donald-trump-tv-pitches', 
1875                 'id': '8caf6e88-d0ec-11e5-90d3-34c2c42653ac', 
1877                 'title': "No one has seen the drama series based on Trump's life \u2014 until now", 
1878                 'description': 'Donald Trump wanted a weekly TV drama based on his life. It never aired. But The Washington Post recently obtained a scene from the pilot script ā and enlisted actors.', 
1879                 'timestamp': 1455216756, 
1880                 'uploader': 'The Washington Post', 
1881                 'upload_date': '20160211', 
1883             'add_ie': [WashingtonPostIE
.ie_key()], 
1887             'url': 'http://www.tgcom24.mediaset.it/politica/serracchiani-voglio-vivere-in-una-societa-aperta-reazioni-sproporzionate-_3071354-201702a.shtml', 
1891                 'title': 'Serracchiani: "Voglio vivere in una societĆ  aperta, con tutela del patto di fiducia"', 
1894                 'skip_download': True, 
1896             'add_ie': [MediasetIE
.ie_key()], 
1900             'url': 'https://www.noviny.sk/slovensko/238543-slovenskom-sa-prehnala-vlna-silnych-burok', 
1902                 'id': '238543-slovenskom-sa-prehnala-vlna-silnych-burok', 
1903                 'title': 'Slovenskom sa prehnala vlna silných búrok', 
1905             'playlist_mincount': 5, 
1906             'add_ie': [JojIE
.ie_key()], 
1909             # AMP embed (see https://www.ampproject.org/docs/reference/components/amp-video) 
1910             'url': 'https://tvrain.ru/amp/418921/', 
1911             'md5': 'cc00413936695987e8de148b67d14f1d', 
1915                 'title': 'Š”ŃŠ°Ń ŠŠ°Š¼ŠøŠ½: Ā«ŠŃ наŃŃŃŠøŠ»Šø ГевŃŃŠ²ŠµŠ½Š½Š¾ŃŃŃ ŠŃемлŃĀ»', 
1920             'url': 'http://help.vzaar.com/article/165-embedding-video', 
1921             'md5': '7e3919d9d2620b89e3e00bec7fe8c9d4', 
1925                 'title': 'Building A Business Online: Principal Chairs Q & A', 
1929             # multiple HTML5 videos on one page 
1930             'url': 'https://www.paragon-software.com/home/rk-free/keyscenarios.html', 
1932                 'id': 'keyscenarios', 
1933                 'title': 'Rescue Kit 14 Free Edition - Getting started', 
1935             'playlist_count': 4, 
1939             'url': 'https://youtube-dl-demo.neocities.org/vshare.html', 
1940             'md5': '17b39f55b5497ae8b59f5fbce8e35886', 
1943                 'title': 'vl14062007715967', 
1948             'url': 'http://www.heidelberg-laureate-forum.org/blog/video/lecture-friday-september-23-2016-sir-c-antony-r-hoare/', 
1949             'md5': 'aecd089f55b1cb5a59032cb049d3a356', 
1951                 'id': '90227f51a80c4d8f86c345a7fa62bd9a1d', 
1953                 'title': 'Lecture: Friday, September 23, 2016 - Sir Tony Hoare', 
1954                 'description': 'md5:5a51db84a62def7b7054df2ade403c6c', 
1955                 'timestamp': 1474354800, 
1956                 'upload_date': '20160920', 
1960             'url': 'http://www.kidzworld.com/article/30935-trolls-the-beat-goes-on-interview-skylar-astin-and-amanda-leighton', 
1964                 'title': 'Official Trailer | TROLLS: THE BEAT GOES ON!', 
1965                 'description': 'md5:eb5f23826a027ba95277d105f248b825', 
1966                 'timestamp': 1516100691, 
1967                 'upload_date': '20180116', 
1970                 'skip_download': True, 
1972             'add_ie': [SpringboardPlatformIE
.ie_key()], 
1975             'url': 'https://www.youtube.com/shared?ci=1nEzmT-M4fU', 
1977                 'id': 'uPDB5I9wfp8', 
1979                 'title': 'Pocoyo: 90 minutos de episódios completos Português para crianças - PARTE 3', 
1980                 'description': 'md5:d9e4d9346a2dfff4c7dc4c8cec0f546d', 
1981                 'upload_date': '20160219', 
1982                 'uploader': 'Pocoyo - PortuguĆŖs (BR)', 
1983                 'uploader_id': 'PocoyoBrazil', 
1985             'add_ie': [YoutubeIE
.ie_key()], 
1987                 'skip_download': True, 
1991             'url': 'https://www.yapfiles.ru/show/1872528/690b05d3054d2dbe1e69523aa21bb3b1.mp4.html', 
1993                 'id': 'vMDE4NzI1Mjgt690b', 
1995                 'title': 'ŠŠ¾ŃŃŃŠ°', 
1997             'add_ie': [YapFilesIE
.ie_key()], 
1999                 'skip_download': True, 
2003             # CloudflareStream embed 
2004             'url': 'https://www.cloudflare.com/products/cloudflare-stream/', 
2006                 'id': '31c9291ab41fac05471db4e73aa11717', 
2008                 'title': '31c9291ab41fac05471db4e73aa11717', 
2010             'add_ie': [CloudflareStreamIE
.ie_key()], 
2012                 'skip_download': True, 
2017             'url': 'https://joinpeertube.org/fr/home/', 
2020                 'title': 'Reprenez le contrƓle de vos vidƩos ! #JoinPeertube', 
2022             'playlist_count': 2, 
2026             'url': 'https://streetkitchen.hu/receptek/igy_kell_otthon_hamburgert_sutni/', 
2030                 'title': 'Ćgy kell otthon hamburgert sütni', 
2031                 'description': 'md5:f5a730ecf900a5c852e1e00540bbb0f7', 
2032                 'timestamp': 1426330212, 
2033                 'upload_date': '20150314', 
2034                 'uploader': 'StreetKitchen', 
2035                 'uploader_id': '546363', 
2037             'add_ie': [IndavideoEmbedIE
.ie_key()], 
2039                 'skip_download': True, 
2043             # APA embed via JWPlatform embed 
2044             'url': 'http://www.vol.at/blue-man-group/5593454', 
2048                 'title': '"Blau ist mysteriƶs": Die Blue Man Group im Interview', 
2049                 'description': 'md5:d41d8cd98f00b204e9800998ecf8427e', 
2050                 'thumbnail': r
're:^https?://.*\.jpg$', 
2052                 'timestamp': 1519211149, 
2053                 'upload_date': '20180221', 
2056                 'skip_download': True, 
2060             'url': 'http://share-videos.se/auto/video/83645793?uid=13', 
2061             'md5': 'b68d276de422ab07ee1d49388103f457', 
2064                 'title': 'Lock up and get excited', 
2067             'skip': 'TODO: fix nested playlists processing in tests', 
2071             'url': 'https://viqeo.tv/', 
2074                 'title': 'All-new video platform', 
2076             'playlist_count': 6, 
2080             'url': 'https://www.cookscountry.com/episode/554-smoky-barbecue-favorites', 
2082                 'id': '5b400b834b32992a310622b9', 
2084                 'title': 'Smoky Barbecue Favorites', 
2085                 'thumbnail': r
're:^https?://.*\.jpe?g', 
2087             'add_ie': [ZypeIE
.ie_key()], 
2089                 'skip_download': True, 
2094             'url': 'https://video.sibnet.ru/shell.php?videoid=3422904', 
2098                 'title': 'ŠŠ¾ŃŃŠ°Š²ŃŠøŠŗ пиŃŃŃ ŃŠæŃŠ¾ŃŠøŠ» ŃŠ°Š·ŃŠµŃŠµŠ½ŠøŃ ŃŃŠ³ŃаŃŃ Š½Š° ŃŠ¾ŃŃŠµŠæŠøŠ°Š½Š¾', 
2099                 'description': 'md5:89209cdc587dab1e4a090453dbaa2cb1', 
2100                 'thumbnail': r
're:^https?://.*\.jpg$', 
2103                 'skip_download': True, 
2105             'expected_warnings': ['Failed to download MPD manifest'], 
2108             # DailyMotion embed with DM.player 
2109             'url': 'https://www.beinsports.com/us/copa-del-rey/video/the-locker-room-valencia-beat-barca-in-copa/1203804', 
2111                 'id': 'k6aKkGHd9FJs4mtJN39', 
2113                 'title': 'The Locker Room: Valencia Beat Barca In Copa del Rey Final', 
2114                 'description': 'This video is private.', 
2115                 'uploader_id': 'x1jf30l', 
2116                 'uploader': 'beIN SPORTS USA', 
2117                 'upload_date': '20190528', 
2118                 'timestamp': 1559062971, 
2121                 'skip_download': True, 
2125         #     # TODO: find another test 
2126         #     # http://schema.org/VideoObject 
2127         #     'url': 'https://flipagram.com/f/nyvTSJMKId', 
2128         #     'md5': '888dcf08b7ea671381f00fab74692755', 
2130         #         'id': 'nyvTSJMKId', 
2132         #         'title': 'Flipagram by sjuria101 featuring Midnight Memories by One Direction', 
2133         #         'description': '#love for cats.', 
2134         #         'timestamp': 1461244995, 
2135         #         'upload_date': '20160421', 
2138         #         'force_generic_extractor': True, 
2143     def report_following_redirect(self
, new_url
): 
2144         """Report information extraction.""" 
2145         self
._downloader
.to_screen('[redirect] Following redirect to %s' % new_url
) 
2147     def _extract_rss(self
, url
, video_id
, doc
): 
2148         playlist_title 
= doc
.find('./channel/title').text
 
2149         playlist_desc_el 
= doc
.find('./channel/description') 
2150         playlist_desc 
= None if playlist_desc_el 
is None else playlist_desc_el
.text
 
2153         for it 
in doc
.findall('./channel/item'): 
2155             enclosure_nodes 
= it
.findall('./enclosure') 
2156             for e 
in enclosure_nodes
: 
2157                 next_url 
= e
.attrib
.get('url') 
2162                 next_url 
= xpath_text(it
, 'link', fatal
=False) 
2168                 '_type': 'url_transparent', 
2170                 'title': it
.find('title').text
, 
2174             '_type': 'playlist', 
2176             'title': playlist_title
, 
2177             'description': playlist_desc
, 
2181     def _extract_camtasia(self
, url
, video_id
, webpage
): 
2182         """ Returns None if no camtasia video can be found. """ 
2184         camtasia_cfg 
= self
._search
_regex
( 
2185             r
'fo\.addVariable\(\s*"csConfigFile",\s*"([^"]+)"\s*\);', 
2186             webpage
, 'camtasia configuration file', default
=None) 
2187         if camtasia_cfg 
is None: 
2190         title 
= self
._html
_search
_meta
('DC.title', webpage
, fatal
=True) 
2192         camtasia_url 
= compat_urlparse
.urljoin(url
, camtasia_cfg
) 
2193         camtasia_cfg 
= self
._download
_xml
( 
2194             camtasia_url
, video_id
, 
2195             note
='Downloading camtasia configuration', 
2196             errnote
='Failed to download camtasia configuration') 
2197         fileset_node 
= camtasia_cfg
.find('./playlist/array/fileset') 
2200         for n 
in fileset_node
.getchildren(): 
2201             url_n 
= n
.find('./uri') 
2206                 'id': os
.path
.splitext(url_n
.text
.rpartition('/')[2])[0], 
2207                 'title': '%s - %s' % (title
, n
.tag
), 
2208                 'url': compat_urlparse
.urljoin(url
, url_n
.text
), 
2209                 'duration': float_or_none(n
.find('./duration').text
), 
2213             '_type': 'playlist', 
2218     def _real_extract(self
, url
): 
2219         if url
.startswith('//'): 
2220             return self
.url_result(self
.http_scheme() + url
) 
2222         parsed_url 
= compat_urlparse
.urlparse(url
) 
2223         if not parsed_url
.scheme
: 
2224             default_search 
= self
._downloader
.params
.get('default_search') 
2225             if default_search 
is None: 
2226                 default_search 
= 'fixup_error' 
2228             if default_search 
in ('auto', 'auto_warning', 'fixup_error'): 
2230                     self
._downloader
.report_warning('The url doesn\'t specify the protocol, trying with http') 
2231                     return self
.url_result('http://' + url
) 
2232                 elif default_search 
!= 'fixup_error': 
2233                     if default_search 
== 'auto_warning': 
2234                         if re
.match(r
'^(?:url|URL)$', url
): 
2235                             raise ExtractorError( 
2236                                 'Invalid URL:  %r . Call youtube-dl like this:  youtube-dl -v "https://www.youtube.com/watch?v=BaW_jenozKc"  ' % url
, 
2239                             self
._downloader
.report_warning( 
2240                                 'Falling back to youtube search for  %s . Set --default-search "auto" to suppress this warning.' % url
) 
2241                     return self
.url_result('ytsearch:' + url
) 
2243             if default_search 
in ('error', 'fixup_error'): 
2244                 raise ExtractorError( 
2245                     '%r is not a valid URL. ' 
2246                     'Set --default-search "ytsearch" (or run  youtube-dl "ytsearch:%s" ) to search YouTube' 
2247                     % (url
, url
), expected
=True) 
2249                 if ':' not in default_search
: 
2250                     default_search 
+= ':' 
2251                 return self
.url_result(default_search 
+ url
) 
2253         url
, smuggled_data 
= unsmuggle_url(url
) 
2254         force_videoid 
= None 
2255         is_intentional 
= smuggled_data 
and smuggled_data
.get('to_generic') 
2256         if smuggled_data 
and 'force_videoid' in smuggled_data
: 
2257             force_videoid 
= smuggled_data
['force_videoid'] 
2258             video_id 
= force_videoid
 
2260             video_id 
= self
._generic
_id
(url
) 
2262         self
.to_screen('%s: Requesting header' % video_id
) 
2264         head_req 
= HEADRequest(url
) 
2265         head_response 
= self
._request
_webpage
( 
2267             note
=False, errnote
='Could not send HEAD request to %s' % url
, 
2270         if head_response 
is not False: 
2271             # Check for redirect 
2272             new_url 
= compat_str(head_response
.geturl()) 
2274                 self
.report_following_redirect(new_url
) 
2276                     new_url 
= smuggle_url( 
2277                         new_url
, {'force_videoid': force_videoid
}) 
2278                 return self
.url_result(new_url
) 
2280         full_response 
= None 
2281         if head_response 
is False: 
2282             request 
= sanitized_Request(url
) 
2283             request
.add_header('Accept-Encoding', '*') 
2284             full_response 
= self
._request
_webpage
(request
, video_id
) 
2285             head_response 
= full_response
 
2289             'title': self
._generic
_title
(url
), 
2290             'upload_date': unified_strdate(head_response
.headers
.get('Last-Modified')) 
2293         # Check for direct link to a video 
2294         content_type 
= head_response
.headers
.get('Content-Type', '').lower() 
2295         m 
= re
.match(r
'^(?P<type>audio|video|application(?=/(?:ogg$|(?:vnd\.apple\.|x-)?mpegurl)))/(?P<format_id>[^;\s]+)', content_type
) 
2297             format_id 
= compat_str(m
.group('format_id')) 
2298             if format_id
.endswith('mpegurl'): 
2299                 formats 
= self
._extract
_m
3u8_formats
(url
, video_id
, 'mp4') 
2300             elif format_id 
== 'f4m': 
2301                 formats 
= self
._extract
_f
4m
_formats
(url
, video_id
) 
2304                     'format_id': format_id
, 
2306                     'vcodec': 'none' if m
.group('type') == 'audio' else None 
2308                 info_dict
['direct'] = True 
2309             self
._sort
_formats
(formats
) 
2310             info_dict
['formats'] = formats
 
2313         if not self
._downloader
.params
.get('test', False) and not is_intentional
: 
2314             force 
= self
._downloader
.params
.get('force_generic_extractor', False) 
2315             self
._downloader
.report_warning( 
2316                 '%s on generic information extractor.' % ('Forcing' if force 
else 'Falling back')) 
2318         if not full_response
: 
2319             request 
= sanitized_Request(url
) 
2320             # Some webservers may serve compressed content of rather big size (e.g. gzipped flac) 
2321             # making it impossible to download only chunk of the file (yet we need only 512kB to 
2322             # test whether it's HTML or not). According to youtube-dl default Accept-Encoding 
2323             # that will always result in downloading the whole file that is not desirable. 
2324             # Therefore for extraction pass we have to override Accept-Encoding to any in order 
2325             # to accept raw bytes and being able to download only a chunk. 
2326             # It may probably better to solve this by checking Content-Type for application/octet-stream 
2327             # after HEAD request finishes, but not sure if we can rely on this. 
2328             request
.add_header('Accept-Encoding', '*') 
2329             full_response 
= self
._request
_webpage
(request
, video_id
) 
2331         first_bytes 
= full_response
.read(512) 
2333         # Is it an M3U playlist? 
2334         if first_bytes
.startswith(b
'#EXTM3U'): 
2335             info_dict
['formats'] = self
._extract
_m
3u8_formats
(url
, video_id
, 'mp4') 
2336             self
._sort
_formats
(info_dict
['formats']) 
2339         # Maybe it's a direct link to a video? 
2340         # Be careful not to download the whole thing! 
2341         if not is_html(first_bytes
): 
2342             self
._downloader
.report_warning( 
2343                 'URL could be a direct video link, returning it as such.') 
2350         webpage 
= self
._webpage
_read
_content
( 
2351             full_response
, url
, video_id
, prefix
=first_bytes
) 
2353         self
.report_extraction(video_id
) 
2355         # Is it an RSS feed, a SMIL file, an XSPF playlist or a MPD manifest? 
2357             doc 
= compat_etree_fromstring(webpage
.encode('utf-8')) 
2358             if doc
.tag 
== 'rss': 
2359                 return self
._extract
_rss
(url
, video_id
, doc
) 
2360             elif doc
.tag 
== 'SmoothStreamingMedia': 
2361                 info_dict
['formats'] = self
._parse
_ism
_formats
(doc
, url
) 
2362                 self
._sort
_formats
(info_dict
['formats']) 
2364             elif re
.match(r
'^(?:{[^}]+})?smil$', doc
.tag
): 
2365                 smil 
= self
._parse
_smil
(doc
, url
, video_id
) 
2366                 self
._sort
_formats
(smil
['formats']) 
2368             elif doc
.tag 
== '{http://xspf.org/ns/0/}playlist': 
2369                 return self
.playlist_result( 
2371                         doc
, video_id
, xspf_url
=url
, 
2372                         xspf_base_url
=compat_str(full_response
.geturl())), 
2374             elif re
.match(r
'(?i)^(?:{[^}]+})?MPD$', doc
.tag
): 
2375                 info_dict
['formats'] = self
._parse
_mpd
_formats
( 
2377                     mpd_base_url
=compat_str(full_response
.geturl()).rpartition('/')[0], 
2379                 self
._sort
_formats
(info_dict
['formats']) 
2381             elif re
.match(r
'^{http://ns\.adobe\.com/f4m/[12]\.0}manifest$', doc
.tag
): 
2382                 info_dict
['formats'] = self
._parse
_f
4m
_formats
(doc
, url
, video_id
) 
2383                 self
._sort
_formats
(info_dict
['formats']) 
2385         except compat_xml_parse_error
: 
2388         # Is it a Camtasia project? 
2389         camtasia_res 
= self
._extract
_camtasia
(url
, video_id
, webpage
) 
2390         if camtasia_res 
is not None: 
2393         # Sometimes embedded video player is hidden behind percent encoding 
2394         # (e.g. https://github.com/ytdl-org/youtube-dl/issues/2448) 
2395         # Unescaping the whole page allows to handle those cases in a generic way 
2396         webpage 
= compat_urllib_parse_unquote(webpage
) 
2398         # it's tempting to parse this further, but you would 
2399         # have to take into account all the variations like 
2400         #   Video Title - Site Name 
2401         #   Site Name | Video Title 
2402         #   Video Title - Tagline | Site Name 
2403         # and so on and so forth; it's just not practical 
2404         video_title 
= self
._og
_search
_title
( 
2405             webpage
, default
=None) or self
._html
_search
_regex
( 
2406             r
'(?s)<title>(.*?)</title>', webpage
, 'video title', 
2409         # Try to detect age limit automatically 
2410         age_limit 
= self
._rta
_search
(webpage
) 
2411         # And then there are the jokers who advertise that they use RTA, 
2412         # but actually don't. 
2413         AGE_LIMIT_MARKERS 
= [ 
2414             r
'Proudly Labeled <a href="http://www\.rtalabel\.org/" title="Restricted to Adults">RTA</a>', 
2416         if any(re
.search(marker
, webpage
) for marker 
in AGE_LIMIT_MARKERS
): 
2419         # video uploader is domain name 
2420         video_uploader 
= self
._search
_regex
( 
2421             r
'^(?:https?://)?([^/]*)/.*', url
, 'video uploader') 
2423         video_description 
= self
._og
_search
_description
(webpage
, default
=None) 
2424         video_thumbnail 
= self
._og
_search
_thumbnail
(webpage
, default
=None) 
2427             'title': video_title
, 
2428             'description': video_description
, 
2429             'thumbnail': video_thumbnail
, 
2430             'age_limit': age_limit
, 
2433         # Look for Brightcove Legacy Studio embeds 
2434         bc_urls 
= BrightcoveLegacyIE
._extract
_brightcove
_urls
(webpage
) 
2438                 'url': smuggle_url(bc_url
, {'Referer': url
}), 
2439                 'ie_key': 'BrightcoveLegacy' 
2440             } for bc_url 
in bc_urls
] 
2443                 '_type': 'playlist', 
2444                 'title': video_title
, 
2449         # Look for Brightcove New Studio embeds 
2450         bc_urls 
= BrightcoveNewIE
._extract
_urls
(self
, webpage
) 
2452             return self
.playlist_from_matches( 
2453                 bc_urls
, video_id
, video_title
, 
2454                 getter
=lambda x
: smuggle_url(x
, {'referrer': url
}), 
2457         # Look for Nexx embeds 
2458         nexx_urls 
= NexxIE
._extract
_urls
(webpage
) 
2460             return self
.playlist_from_matches(nexx_urls
, video_id
, video_title
, ie
=NexxIE
.ie_key()) 
2462         # Look for Nexx iFrame embeds 
2463         nexx_embed_urls 
= NexxEmbedIE
._extract
_urls
(webpage
) 
2465             return self
.playlist_from_matches(nexx_embed_urls
, video_id
, video_title
, ie
=NexxEmbedIE
.ie_key()) 
2467         # Look for ThePlatform embeds 
2468         tp_urls 
= ThePlatformIE
._extract
_urls
(webpage
) 
2470             return self
.playlist_from_matches(tp_urls
, video_id
, video_title
, ie
='ThePlatform') 
2472         # Look for Vessel embeds 
2473         vessel_urls 
= VesselIE
._extract
_urls
(webpage
) 
2475             return self
.playlist_from_matches(vessel_urls
, video_id
, video_title
, ie
=VesselIE
.ie_key()) 
2477         # Look for embedded rtl.nl player 
2478         matches 
= re
.findall( 
2479             r
'<iframe[^>]+?src="((?:https?:)?//(?:(?:www|static)\.)?rtl\.nl/(?:system/videoplayer/[^"]+(?:video_)?)?embed[^"]+)"', 
2482             return self
.playlist_from_matches(matches
, video_id
, video_title
, ie
='RtlNl') 
2484         vimeo_urls 
= VimeoIE
._extract
_urls
(url
, webpage
) 
2486             return self
.playlist_from_matches(vimeo_urls
, video_id
, video_title
, ie
=VimeoIE
.ie_key()) 
2488         vid_me_embed_url 
= self
._search
_regex
( 
2489             r
'src=[\'"](https?://vid\.me/[^\'"]+)[\'"]', 
2490             webpage, 'vid.me embed', default=None) 
2491         if vid_me_embed_url is not None: 
2492             return self.url_result(vid_me_embed_url, 'Vidme') 
2494         # Look for YouTube embeds 
2495         youtube_urls = YoutubeIE._extract_urls(webpage) 
2497             return self.playlist_from_matches( 
2498                 youtube_urls, video_id, video_title, ie=YoutubeIE.ie_key()) 
2500         matches = DailymotionIE._extract_urls(webpage) 
2502             return self.playlist_from_matches(matches, video_id, video_title) 
2504         # Look for embedded Dailymotion playlist player (#3822) 
2506             r'<iframe[^>]+?src=(["\'])(?P
<url
>(?
:https?
:)?
//(?
:www\
.)?dailymotion\
.[a
-z
]{2,3}/widget
/jukebox
\?.+?
)\
1', webpage) 
2508             playlists = re.findall( 
2509                 r'list\
[\
]=/playlist
/([^
/]+)/', unescapeHTML(m.group('url
'))) 
2511                 return self.playlist_from_matches( 
2512                     playlists, video_id, video_title, lambda p: '//dailymotion
.com
/playlist
/%s' % p) 
2514         # Look for DailyMail embeds 
2515         dailymail_urls = DailyMailIE._extract_urls(webpage) 
2517             return self.playlist_from_matches( 
2518                 dailymail_urls, video_id, video_title, ie=DailyMailIE.ie_key()) 
2520         # Look for embedded Wistia player 
2521         wistia_url = WistiaIE._extract_url(webpage) 
2524                 '_type
': 'url_transparent
', 
2525                 'url
': self._proto_relative_url(wistia_url), 
2526                 'ie_key
': WistiaIE.ie_key(), 
2527                 'uploader
': video_uploader, 
2530         # Look for SVT player 
2531         svt_url = SVTIE._extract_url(webpage) 
2533             return self.url_result(svt_url, 'SVT
') 
2535         # Look for Bandcamp pages with custom domain 
2536         mobj = re.search(r'<meta 
property="og:url"[^
>]*?content
="(.*?bandcamp\.com.*?)"', webpage) 
2537         if mobj is not None: 
2538             burl = unescapeHTML(mobj.group(1)) 
2539             # Don't 
set the extractor because it can be a track url 
or an album
 
2540             return self
.url_result(burl
) 
2542         # Look for embedded Vevo player 
2544             r
'<iframe[^>]+?src=(["\'])(?P
<url
>(?
:https?
:)?
//(?
:cache\
.)?vevo\
.com
/.+?
)\
1', webpage) 
2545         if mobj is not None: 
2546             return self.url_result(mobj.group('url
')) 
2548         # Look for embedded Viddler player 
2550             r'<(?
:iframe
[^
>]+?src|param
[^
>]+?value
)=(["\'])(?P<url>(?:https?:)?//(?:www\.)?viddler\.com/(?:embed|player)/.+?)\1', 
2552         if mobj is not None: 
2553             return self.url_result(mobj.group('url')) 
2555         # Look for NYTimes player 
2557             r'<iframe[^>]+src=(["\'])(?P
<url
>(?
:https?
:)?
//graphics8\
.nytimes\
.com
/bcvideo
/[^
/]+/iframe
/embed\
.html
.+?
)\
1>', 
2559         if mobj is not None: 
2560             return self.url_result(mobj.group('url
')) 
2562         # Look for Libsyn player 
2564             r'<iframe
[^
>]+src
=(["\'])(?P<url>(?:https?:)?//html5-player\.libsyn\.com/embed/.+?)\1', webpage) 
2565         if mobj is not None: 
2566             return self.url_result(mobj.group('url')) 
2568         # Look for Ooyala videos 
2569         mobj = (re.search(r'player\.ooyala\.com/[^"?
]+[?
#][^"]*?(?:embedCode|ec)=(?P<ec>[^"&]+)', webpage) 
2570                 or re
.search(r
'OO\.Player\.create\([\'"].*?[\'"],\s
*[\'"](?P<ec>.{32})[\'"]', webpage) 
2571                 or re.search(r'OO\
.Player\
.create\
.apply\
(\s
*OO\
.Player\s
*,\s
*op\
(\s
*\
[\s
*[\'"][^\'"]*[\'"]\s*,\s*[\'"](?P
<ec
>.{32}
)[\'"]', webpage) 
2572                 or re.search(r'SBN\.VideoLinkset\.ooyala\([\'"](?P
<ec
>.{32}
)[\'"]\)', webpage) 
2573                 or re.search(r'data-ooyala-video-id\s*=\s*[\'"](?P
<ec
>.{32}
)[\'"]', webpage)) 
2574         if mobj is not None: 
2575             embed_token = self._search_regex( 
2576                 r'embedToken[\'"]?\s
*:\s
*[\'"]([^\'"]+)', 
2577                 webpage, 'ooyala embed token
', default=None) 
2578             return OoyalaIE._build_url_result(smuggle_url( 
2581                     'embed_token
': embed_token, 
2584         # Look for multiple Ooyala embeds on SBN network websites 
2585         mobj = re.search(r'SBN\
.VideoLinkset\
.entryGroup\
((\
[.*?\
])', webpage) 
2586         if mobj is not None: 
2587             embeds = self._parse_json(mobj.group(1), video_id, fatal=False) 
2589                 return self.playlist_from_matches( 
2590                     embeds, video_id, video_title, 
2591                     getter=lambda v: OoyalaIE._url_for_embed_code(smuggle_url(v['provider_video_id
'], {'domain
': url})), ie='Ooyala
') 
2593         # Look for Aparat videos 
2594         mobj = re.search(r'<iframe 
.*?src
="(http://www\.aparat\.com/video/[^"]+)"', webpage) 
2595         if mobj is not None: 
2596             return self.url_result(mobj.group(1), 'Aparat') 
2598         # Look for MPORA videos 
2599         mobj = re.search(r'<iframe .*?src="(http
://mpora\
.(?
:com|de
)/videos
/[^
"]+)"', webpage) 
2600         if mobj is not None: 
2601             return self.url_result(mobj.group(1), 'Mpora
') 
2603         # Look for embedded Facebook player 
2604         facebook_urls = FacebookIE._extract_urls(webpage) 
2606             return self.playlist_from_matches(facebook_urls, video_id, video_title) 
2608         # Look for embedded VK player 
2609         mobj = re.search(r'<iframe
[^
>]+?src
=(["\'])(?P<url>https?://vk\.com/video_ext\.php.+?)\1', webpage) 
2610         if mobj is not None: 
2611             return self.url_result(mobj.group('url'), 'VK') 
2613         # Look for embedded Odnoklassniki player 
2614         mobj = re.search(r'<iframe[^>]+?src=(["\'])(?P
<url
>https?
://(?
:odnoklassniki|ok
)\
.ru
/videoembed
/.+?
)\
1', webpage) 
2615         if mobj is not None: 
2616             return self.url_result(mobj.group('url
'), 'Odnoklassniki
') 
2618         # Look for embedded ivi player 
2619         mobj = re.search(r'<embed
[^
>]+?src
=(["\'])(?P<url>https?://(?:www\.)?ivi\.ru/video/player.+?)\1', webpage) 
2620         if mobj is not None: 
2621             return self.url_result(mobj.group('url'), 'Ivi') 
2623         # Look for embedded Huffington Post player 
2625             r'<iframe[^>]+?src=(["\'])(?P
<url
>https?
://embed\
.live\
.huffingtonpost\
.com
/.+?
)\
1', webpage) 
2626         if mobj is not None: 
2627             return self.url_result(mobj.group('url
'), 'HuffPost
') 
2630         mobj = re.search(r'class=["\']embedly-card["\'][^
>]href
=["\'](?P<url>[^"\']+)', webpage) 
2631         if mobj is not None: 
2632             return self.url_result(mobj.group('url
')) 
2633         mobj = re.search(r'class=["\']embedly-embed["\'][^
>]src
=["\'][^"\']*url
=(?P
<url
>[^
&]+)', webpage) 
2634         if mobj is not None: 
2635             return self.url_result(compat_urllib_parse_unquote(mobj.group('url
'))) 
2637         # Look for funnyordie embed 
2638         matches = re.findall(r'<iframe
[^
>]+?src
="(https?://(?:www\.)?funnyordie\.com/embed/[^"]+)"', webpage) 
2640             return self.playlist_from_matches( 
2641                 matches, video_id, video_title, getter=unescapeHTML, ie='FunnyOrDie') 
2643         # Look for BBC iPlayer embed 
2644         matches = re.findall(r'setPlaylist\("(https?
://www\
.bbc\
.co\
.uk
/iplayer
/[^
/]+/[\da
-z
]{8}
)"\)', webpage) 
2646             return self.playlist_from_matches(matches, video_id, video_title, ie='BBCCoUk') 
2648         # Look for embedded RUTV player 
2649         rutv_url = RUTVIE._extract_url(webpage) 
2651             return self.url_result(rutv_url, 'RUTV') 
2653         # Look for embedded TVC player 
2654         tvc_url = TVCIE._extract_url(webpage) 
2656             return self.url_result(tvc_url, 'TVC') 
2658         # Look for embedded SportBox player 
2659         sportbox_urls = SportBoxIE._extract_urls(webpage) 
2661             return self.playlist_from_matches(sportbox_urls, video_id, video_title, ie=SportBoxIE.ie_key()) 
2663         # Look for embedded XHamster player 
2664         xhamster_urls = XHamsterEmbedIE._extract_urls(webpage) 
2666             return self.playlist_from_matches(xhamster_urls, video_id, video_title, ie='XHamsterEmbed') 
2668         # Look for embedded TNAFlixNetwork player 
2669         tnaflix_urls = TNAFlixNetworkEmbedIE._extract_urls(webpage) 
2671             return self.playlist_from_matches(tnaflix_urls, video_id, video_title, ie=TNAFlixNetworkEmbedIE.ie_key()) 
2673         # Look for embedded PornHub player 
2674         pornhub_urls = PornHubIE._extract_urls(webpage) 
2676             return self.playlist_from_matches(pornhub_urls, video_id, video_title, ie=PornHubIE.ie_key()) 
2678         # Look for embedded DrTuber player 
2679         drtuber_urls = DrTuberIE._extract_urls(webpage) 
2681             return self.playlist_from_matches(drtuber_urls, video_id, video_title, ie=DrTuberIE.ie_key()) 
2683         # Look for embedded RedTube player 
2684         redtube_urls = RedTubeIE._extract_urls(webpage) 
2686             return self.playlist_from_matches(redtube_urls, video_id, video_title, ie=RedTubeIE.ie_key()) 
2688         # Look for embedded Tube8 player 
2689         tube8_urls = Tube8IE._extract_urls(webpage) 
2691             return self.playlist_from_matches(tube8_urls, video_id, video_title, ie=Tube8IE.ie_key()) 
2693         # Look for embedded Tvigle player 
2695             r'<iframe[^>]+?src=(["\'])(?P
<url
>(?
:https?
:)?
//cloud\
.tvigle\
.ru
/video
/.+?
)\
1', webpage) 
2696         if mobj is not None: 
2697             return self.url_result(mobj.group('url
'), 'Tvigle
') 
2699         # Look for embedded TED player 
2701             r'<iframe
[^
>]+?src
=(["\'])(?P<url>https?://embed(?:-ssl)?\.ted\.com/.+?)\1', webpage) 
2702         if mobj is not None: 
2703             return self.url_result(mobj.group('url'), 'TED') 
2705         # Look for embedded Ustream videos 
2706         ustream_url = UstreamIE._extract_url(webpage) 
2708             return self.url_result(ustream_url, UstreamIE.ie_key()) 
2710         # Look for embedded arte.tv player 
2712             r'<(?:script|iframe) [^>]*?src="(?P
<url
>http
://www\
.arte\
.tv
/(?
:playerv2
/embed|arte_vp
/index
)[^
"]+)"', 
2714         if mobj is not None: 
2715             return self.url_result(mobj.group('url
'), 'ArteTVEmbed
') 
2717         # Look for embedded francetv player 
2719             r'<iframe
[^
>]+?src
=(["\'])(?P<url>(?:https?://)?embed\.francetv\.fr/\?ue=.+?)\1', 
2721         if mobj is not None: 
2722             return self.url_result(mobj.group('url')) 
2724         # Look for embedded smotri.com player 
2725         smotri_url = SmotriIE._extract_url(webpage) 
2727             return self.url_result(smotri_url, 'Smotri') 
2729         # Look for embedded Myvi.ru player 
2730         myvi_url = MyviIE._extract_url(webpage) 
2732             return self.url_result(myvi_url) 
2734         # Look for embedded soundcloud player 
2735         soundcloud_urls = SoundcloudIE._extract_urls(webpage) 
2737             return self.playlist_from_matches(soundcloud_urls, video_id, video_title, getter=unescapeHTML, ie=SoundcloudIE.ie_key()) 
2739         # Look for tunein player 
2740         tunein_urls = TuneInBaseIE._extract_urls(webpage) 
2742             return self.playlist_from_matches(tunein_urls, video_id, video_title) 
2744         # Look for embedded mtvservices player 
2745         mtvservices_url = MTVServicesEmbeddedIE._extract_url(webpage) 
2747             return self.url_result(mtvservices_url, ie='MTVServicesEmbedded') 
2749         # Look for embedded yahoo player 
2751             r'<iframe[^>]+?src=(["\'])(?P
<url
>https?
://(?
:screen|movies
)\
.yahoo\
.com
/.+?\
.html
\?format
=embed
)\
1', 
2753         if mobj is not None: 
2754             return self.url_result(mobj.group('url
'), 'Yahoo
') 
2756         # Look for embedded sbs.com.au player 
2760                 <meta\s+property="og:video"\s+content=| 
2763             (["\'])(?P<url>https?://(?:www\.)?sbs\.com\.au/ondemand/video/.+?)\1''', 
2765         if mobj is not None: 
2766             return self.url_result(mobj.group('url
'), 'SBS
') 
2768         # Look for embedded Cinchcast player 
2770             r'<iframe
[^
>]+?src
=(["\'])(?P<url>https?://player\.cinchcast\.com/.+?)\1', 
2772         if mobj is not None: 
2773             return self.url_result(mobj.group('url'), 'Cinchcast') 
2776             r'<iframe[^>]+?src=(["\'])(?P
<url
>https?
://m(?
:lb
)?\
.mlb\
.com
/shared
/video
/embed
/embed\
.html
\?.+?
)\
1', 
2780                 r'data
-video
-link
=["\'](?P<url>http://m.mlb.com/video/[^"\']+)', 
2782         if mobj is not None: 
2783             return self.url_result(mobj.group('url
'), 'MLB
') 
2786             r'<(?
:iframe|script
)[^
>]+?src
=(["\'])(?P<url>%s)\1' % CondeNastIE.EMBED_URL, 
2788         if mobj is not None: 
2789             return self.url_result(self._proto_relative_url(mobj.group('url'), scheme='http:'), 'CondeNast') 
2792             r'<iframe[^>]+src="(?P
<url
>https?
://(?
:new\
.)?livestream\
.com
/[^
"]+/player[^"]+)"', 
2794         if mobj is not None: 
2795             return self.url_result(mobj.group('url'), 'Livestream') 
2797         # Look for Zapiks embed 
2799             r'<iframe[^>]+src="(?P
<url
>https?
://(?
:www\
.)?zapiks\
.fr
/index\
.php
\?.+?
)"', webpage) 
2800         if mobj is not None: 
2801             return self.url_result(mobj.group('url'), 'Zapiks') 
2803         # Look for Kaltura embeds 
2804         kaltura_url = KalturaIE._extract_url(webpage) 
2806             return self.url_result(smuggle_url(kaltura_url, {'source_url': url}), KalturaIE.ie_key()) 
2808         # Look for EaglePlatform embeds 
2809         eagleplatform_url = EaglePlatformIE._extract_url(webpage) 
2810         if eagleplatform_url: 
2811             return self.url_result(smuggle_url(eagleplatform_url, {'referrer': url}), EaglePlatformIE.ie_key()) 
2813         # Look for ClipYou (uses EaglePlatform) embeds 
2815             r'<iframe[^>]+src="https?
://(?P
<host
>media\
.clipyou\
.ru
)/index
/player
\?.*\brecord
_id
=(?P
<id>\d
+).*"', webpage) 
2816         if mobj is not None: 
2817             return self.url_result('eagleplatform:%(host)s:%(id)s' % mobj.groupdict(), 'EaglePlatform') 
2819         # Look for Pladform embeds 
2820         pladform_url = PladformIE._extract_url(webpage) 
2822             return self.url_result(pladform_url) 
2824         # Look for Videomore embeds 
2825         videomore_url = VideomoreIE._extract_url(webpage) 
2827             return self.url_result(videomore_url) 
2829         # Look for Webcaster embeds 
2830         webcaster_url = WebcasterFeedIE._extract_url(self, webpage) 
2832             return self.url_result(webcaster_url, ie=WebcasterFeedIE.ie_key()) 
2834         # Look for Playwire embeds 
2836             r'<script[^>]+data-config=(["\'])(?P
<url
>(?
:https?
:)?
//config\
.playwire\
.com
/.+?
)\
1', webpage) 
2837         if mobj is not None: 
2838             return self.url_result(mobj.group('url
')) 
2840         # Look for 5min embeds 
2842             r'<meta
[^
>]+property="og:video"[^
>]+content
="https?://embed\.5min\.com/(?P<id>[0-9]+)/?', webpage) 
2843         if mobj is not None: 
2844             return self.url_result('5min:%s' % mobj.group('id'), 'FiveMin') 
2846         # Look for Crooks and Liars embeds 
2848             r'<(?:iframe[^>]+src|param[^>]+value)=(["\'])(?P
<url
>(?
:https?
:)?
//embed\
.crooksandliars\
.com
/(?
:embed|v
)/.+?
)\
1', webpage) 
2849         if mobj is not None: 
2850             return self.url_result(mobj.group('url
')) 
2852         # Look for NBC Sports VPlayer embeds 
2853         nbc_sports_url = NBCSportsVPlayerIE._extract_url(webpage) 
2855             return self.url_result(nbc_sports_url, 'NBCSportsVPlayer
') 
2857         # Look for NBC News embeds 
2858         nbc_news_embed_url = re.search( 
2859             r'<iframe
[^
>]+src
=(["\'])(?P<url>(?:https?:)?//www\.nbcnews\.com/widget/video-embed/[^"\']+)\
1', webpage) 
2860         if nbc_news_embed_url: 
2861             return self.url_result(nbc_news_embed_url.group('url
'), 'NBCNews
') 
2863         # Look for Google Drive embeds 
2864         google_drive_url = GoogleDriveIE._extract_url(webpage) 
2865         if google_drive_url: 
2866             return self.url_result(google_drive_url, 'GoogleDrive
') 
2868         # Look for UDN embeds 
2870             r'<iframe
[^
>]+src
="(?:https?:)?(?P<url>%s)"' % UDNEmbedIE._PROTOCOL_RELATIVE_VALID_URL, webpage) 
2871         if mobj is not None: 
2872             return self.url_result( 
2873                 compat_urlparse.urljoin(url, mobj.group('url
')), 'UDNEmbed
') 
2875         # Look for Senate ISVP iframe 
2876         senate_isvp_url = SenateISVPIE._search_iframe_url(webpage) 
2878             return self.url_result(senate_isvp_url, 'SenateISVP
') 
2880         # Look for OnionStudios embeds 
2881         onionstudios_url = OnionStudiosIE._extract_url(webpage) 
2882         if onionstudios_url: 
2883             return self.url_result(onionstudios_url) 
2885         # Look for ViewLift embeds 
2886         viewlift_url = ViewLiftEmbedIE._extract_url(webpage) 
2888             return self.url_result(viewlift_url) 
2890         # Look for JWPlatform embeds 
2891         jwplatform_urls = JWPlatformIE._extract_urls(webpage) 
2893             return self.playlist_from_matches(jwplatform_urls, video_id, video_title, ie=JWPlatformIE.ie_key()) 
2895         # Look for Digiteka embeds 
2896         digiteka_url = DigitekaIE._extract_url(webpage) 
2898             return self.url_result(self._proto_relative_url(digiteka_url), DigitekaIE.ie_key()) 
2900         # Look for Arkena embeds 
2901         arkena_url = ArkenaIE._extract_url(webpage) 
2903             return self.url_result(arkena_url, ArkenaIE.ie_key()) 
2905         # Look for Piksel embeds 
2906         piksel_url = PikselIE._extract_url(webpage) 
2908             return self.url_result(piksel_url, PikselIE.ie_key()) 
2910         # Look for Limelight embeds 
2911         limelight_urls = LimelightBaseIE._extract_urls(webpage, url) 
2913             return self.playlist_result( 
2914                 limelight_urls, video_id, video_title, video_description) 
2916         # Look for Anvato embeds 
2917         anvato_urls = AnvatoIE._extract_urls(self, webpage, video_id) 
2919             return self.playlist_result( 
2920                 anvato_urls, video_id, video_title, video_description) 
2922         # Look for AdobeTVVideo embeds 
2924             r'<iframe
[^
>]+src
=[\'"]((?:https?:)?//video\.tv\.adobe\.com/v/\d+[^"]+)[\'"]', 
2926         if mobj is not None: 
2927             return self.url_result( 
2928                 self._proto_relative_url(unescapeHTML(mobj.group(1))), 
2931         # Look for Vine embeds 
2933             r'<iframe[^>]+src=[\'"]((?
:https?
:)?
//(?
:www\
.)?vine\
.co
/v
/[^
/]+/embed
/(?
:simple|postcard
))', 
2935         if mobj is not None: 
2936             return self.url_result( 
2937                 self._proto_relative_url(unescapeHTML(mobj.group(1))), 'Vine
') 
2939         # Look for VODPlatform embeds 
2941             r'<iframe
[^
>]+src
=(["\'])(?P<url>(?:https?:)?//(?:www\.)?vod-platform\.net/[eE]mbed/.+?)\1', 
2943         if mobj is not None: 
2944             return self.url_result( 
2945                 self._proto_relative_url(unescapeHTML(mobj.group('url'))), 'VODPlatform') 
2947         # Look for Mangomolo embeds 
2949             r'''(?x)<iframe[^>]+src=(["\'])(?P
<url
>(?
:https?
:)?
//(?
:www\
.)?admin\
.mangomolo\
.com
/analytics
/index\
.php
/customers
/embed
/ 
2951                     video
\?.*?
\bid
=(?P
<video_id
>\d
+)|
 
2952                     index
\?.*?
\bchannelid
=(?P
<channel_id
>(?
:[A
-Za
-z0
-9+/=]|
%2B|
%2F|
%3D
)+) 
2953                 ).+?
)\
1''', webpage) 
2954         if mobj is not None: 
2956                 '_type': 'url_transparent', 
2957                 'url': self._proto_relative_url(unescapeHTML(mobj.group('url'))), 
2958                 'title': video_title, 
2959                 'description': video_description, 
2960                 'thumbnail': video_thumbnail, 
2961                 'uploader': video_uploader, 
2963             video_id = mobj.group('video_id') 
2966                     'ie_key': 'MangomoloVideo', 
2971                     'ie_key': 'MangomoloLive', 
2972                     'id': mobj.group('channel_id'), 
2976         # Look for Instagram embeds 
2977         instagram_embed_url = InstagramIE._extract_embed_url(webpage) 
2978         if instagram_embed_url is not None: 
2979             return self.url_result( 
2980                 self._proto_relative_url(instagram_embed_url), InstagramIE.ie_key()) 
2982         # Look for LiveLeak embeds 
2983         liveleak_urls = LiveLeakIE._extract_urls(webpage) 
2985             return self.playlist_from_matches(liveleak_urls, video_id, video_title) 
2987         # Look for 3Q SDN embeds 
2988         threeqsdn_url = ThreeQSDNIE._extract_url(webpage) 
2991                 '_type': 'url_transparent', 
2992                 'ie_key': ThreeQSDNIE.ie_key(), 
2993                 'url': self._proto_relative_url(threeqsdn_url), 
2994                 'title': video_title, 
2995                 'description': video_description, 
2996                 'thumbnail': video_thumbnail, 
2997                 'uploader': video_uploader, 
3000         # Look for VBOX7 embeds 
3001         vbox7_url = Vbox7IE._extract_url(webpage) 
3003             return self.url_result(vbox7_url, Vbox7IE.ie_key()) 
3005         # Look for DBTV embeds 
3006         dbtv_urls = DBTVIE._extract_urls(webpage) 
3008             return self.playlist_from_matches(dbtv_urls, video_id, video_title, ie=DBTVIE.ie_key()) 
3010         # Look for Videa embeds 
3011         videa_urls = VideaIE._extract_urls(webpage) 
3013             return self.playlist_from_matches(videa_urls, video_id, video_title, ie=VideaIE.ie_key()) 
3015         # Look for 20 minuten embeds 
3016         twentymin_urls = TwentyMinutenIE._extract_urls(webpage) 
3018             return self.playlist_from_matches( 
3019                 twentymin_urls, video_id, video_title, ie=TwentyMinutenIE.ie_key()) 
3021         # Look for Openload embeds 
3022         openload_urls = OpenloadIE._extract_urls(webpage) 
3024             return self.playlist_from_matches( 
3025                 openload_urls, video_id, video_title, ie=OpenloadIE.ie_key()) 
3027         # Look for Verystream embeds 
3028         verystream_urls = VerystreamIE._extract_urls(webpage) 
3030             return self.playlist_from_matches( 
3031                 verystream_urls, video_id, video_title, ie=VerystreamIE.ie_key()) 
3033         # Look for VideoPress embeds 
3034         videopress_urls = VideoPressIE._extract_urls(webpage) 
3036             return self.playlist_from_matches( 
3037                 videopress_urls, video_id, video_title, ie=VideoPressIE.ie_key()) 
3039         # Look for Rutube embeds 
3040         rutube_urls = RutubeIE._extract_urls(webpage) 
3042             return self.playlist_from_matches( 
3043                 rutube_urls, video_id, video_title, ie=RutubeIE.ie_key()) 
3045         # Look for WashingtonPost embeds 
3046         wapo_urls = WashingtonPostIE._extract_urls(webpage) 
3048             return self.playlist_from_matches( 
3049                 wapo_urls, video_id, video_title, ie=WashingtonPostIE.ie_key()) 
3051         # Look for Mediaset embeds 
3052         mediaset_urls = MediasetIE._extract_urls(self, webpage) 
3054             return self.playlist_from_matches( 
3055                 mediaset_urls, video_id, video_title, ie=MediasetIE.ie_key()) 
3057         # Look for JOJ.sk embeds 
3058         joj_urls = JojIE._extract_urls(webpage) 
3060             return self.playlist_from_matches( 
3061                 joj_urls, video_id, video_title, ie=JojIE.ie_key()) 
3063         # Look for megaphone.fm embeds 
3064         mpfn_urls = MegaphoneIE._extract_urls(webpage) 
3066             return self.playlist_from_matches( 
3067                 mpfn_urls, video_id, video_title, ie=MegaphoneIE.ie_key()) 
3069         # Look for vzaar embeds 
3070         vzaar_urls = VzaarIE._extract_urls(webpage) 
3072             return self.playlist_from_matches( 
3073                 vzaar_urls, video_id, video_title, ie=VzaarIE.ie_key()) 
3075         channel9_urls = Channel9IE._extract_urls(webpage) 
3077             return self.playlist_from_matches( 
3078                 channel9_urls, video_id, video_title, ie=Channel9IE.ie_key()) 
3080         vshare_urls = VShareIE._extract_urls(webpage) 
3082             return self.playlist_from_matches( 
3083                 vshare_urls, video_id, video_title, ie=VShareIE.ie_key()) 
3085         # Look for Mediasite embeds 
3086         mediasite_urls = MediasiteIE._extract_urls(webpage) 
3089                 self.url_result(smuggle_url( 
3090                     compat_urlparse.urljoin(url, mediasite_url), 
3091                     {'UrlReferrer': url}), ie=MediasiteIE.ie_key()) 
3092                 for mediasite_url in mediasite_urls] 
3093             return self.playlist_result(entries, video_id, video_title) 
3095         springboardplatform_urls = SpringboardPlatformIE._extract_urls(webpage) 
3096         if springboardplatform_urls: 
3097             return self.playlist_from_matches( 
3098                 springboardplatform_urls, video_id, video_title, 
3099                 ie=SpringboardPlatformIE.ie_key()) 
3101         yapfiles_urls = YapFilesIE._extract_urls(webpage) 
3103             return self.playlist_from_matches( 
3104                 yapfiles_urls, video_id, video_title, ie=YapFilesIE.ie_key()) 
3106         vice_urls = ViceIE._extract_urls(webpage) 
3108             return self.playlist_from_matches( 
3109                 vice_urls, video_id, video_title, ie=ViceIE.ie_key()) 
3111         xfileshare_urls = XFileShareIE._extract_urls(webpage) 
3113             return self.playlist_from_matches( 
3114                 xfileshare_urls, video_id, video_title, ie=XFileShareIE.ie_key()) 
3116         cloudflarestream_urls = CloudflareStreamIE._extract_urls(webpage) 
3117         if cloudflarestream_urls: 
3118             return self.playlist_from_matches( 
3119                 cloudflarestream_urls, video_id, video_title, ie=CloudflareStreamIE.ie_key()) 
3121         peertube_urls = PeerTubeIE._extract_urls(webpage, url) 
3123             return self.playlist_from_matches( 
3124                 peertube_urls, video_id, video_title, ie=PeerTubeIE.ie_key()) 
3126         teachable_url = TeachableIE._extract_url(webpage, url) 
3128             return self.url_result(teachable_url) 
3130         indavideo_urls = IndavideoEmbedIE._extract_urls(webpage) 
3132             return self.playlist_from_matches( 
3133                 indavideo_urls, video_id, video_title, ie=IndavideoEmbedIE.ie_key()) 
3135         apa_urls = APAIE._extract_urls(webpage) 
3137             return self.playlist_from_matches( 
3138                 apa_urls, video_id, video_title, ie=APAIE.ie_key()) 
3140         foxnews_urls = FoxNewsIE._extract_urls(webpage) 
3142             return self.playlist_from_matches( 
3143                 foxnews_urls, video_id, video_title, ie=FoxNewsIE.ie_key()) 
3145         sharevideos_urls = [sharevideos_mobj.group('url') for sharevideos_mobj in re.finditer( 
3146             r'<iframe[^>]+?\bsrc\s*=\s*(["\'])(?P<url>(?:https?:)?//embed\.share-videos\.se/auto/embed/\d+\?.*?\buid=\d+.*?)\1', 
3148         if sharevideos_urls: 
3149             return self.playlist_from_matches( 
3150                 sharevideos_urls, video_id, video_title) 
3152         viqeo_urls = ViqeoIE._extract_urls(webpage) 
3154             return self.playlist_from_matches( 
3155                 viqeo_urls, video_id, video_title, ie=ViqeoIE.ie_key()) 
3157         expressen_urls = ExpressenIE._extract_urls(webpage) 
3159             return self.playlist_from_matches( 
3160                 expressen_urls, video_id, video_title, ie=ExpressenIE.ie_key()) 
3162         zype_urls = ZypeIE._extract_urls(webpage) 
3164             return self.playlist_from_matches( 
3165                 zype_urls, video_id, video_title, ie=ZypeIE.ie_key()) 
3167         # Look for HTML5 media 
3168         entries = self._parse_html5_media_entries(url, webpage, video_id, m3u8_id='hls') 
3170             if len(entries) == 1: 
3173                     'title': video_title, 
3176                 for num, entry in enumerate(entries, start=1): 
3178                         'id': '%s-%s' % (video_id, num), 
3179                         'title': '%s (%d)' % (video_title, num), 
3181             for entry in entries: 
3182                 self._sort_formats(entry['formats']) 
3183             return self.playlist_result(entries, video_id, video_title) 
3185         jwplayer_data = self._find_jwplayer_data( 
3186             webpage, video_id, transform_source=js_to_json) 
3189                 info = self._parse_jwplayer_data( 
3190                     jwplayer_data, video_id, require_title=False, base_url=url) 
3191                 return merge_dicts(info, info_dict) 
3192             except ExtractorError: 
3193                 # See https://github.com/ytdl-org/youtube-dl/pull/16735 
3198             r'(?s)\bvideojs\s*\(.+?\.src\s*\(\s*((?:\[.+?\]|{.+?}))\s*\)\s*;', 
3200         if mobj is not None: 
3201             sources = self._parse_json( 
3202                 mobj.group(1), video_id, transform_source=js_to_json, 
3204             if not isinstance(sources, list): 
3207             for source in sources: 
3208                 src = source.get('src') 
3209                 if not src or not isinstance(src, compat_str): 
3211                 src = compat_urlparse.urljoin(url, src) 
3212                 src_type = source.get('type') 
3213                 if isinstance(src_type, compat_str): 
3214                     src_type = src_type.lower() 
3215                 ext = determine_ext(src).lower() 
3216                 if src_type == 'video/youtube': 
3217                     return self.url_result(src, YoutubeIE.ie_key()) 
3218                 if src_type == 'application/dash+xml' or ext == 'mpd': 
3219                     formats.extend(self._extract_mpd_formats( 
3220                         src, video_id, mpd_id='dash', fatal=False)) 
3221                 elif src_type == 'application/x-mpegurl' or ext == 'm3u8': 
3222                     formats.extend(self._extract_m3u8_formats( 
3223                         src, video_id, 'mp4', entry_protocol='m3u8_native', 
3224                         m3u8_id='hls', fatal=False)) 
3228                         'ext': (mimetype2ext(src_type) 
3229                                 or ext if ext in KNOWN_EXTENSIONS else 'mp4'), 
3232                 self._sort_formats(formats) 
3233                 info_dict['formats'] = formats 
3236         # Looking for http://schema.org/VideoObject 
3237         json_ld = self._search_json_ld( 
3238             webpage, video_id, default={}, expected_type='VideoObject') 
3239         if json_ld.get('url'): 
3240             return merge_dicts(json_ld, info_dict) 
3242         def check_video(vurl): 
3243             if YoutubeIE.suitable(vurl): 
3245             if RtmpIE.suitable(vurl): 
3247             vpath = compat_urlparse.urlparse(vurl).path 
3248             vext = determine_ext(vpath) 
3249             return '.' in vpath and vext not in ('swf', 'png', 'jpg', 'srt', 'sbv', 'sub', 'vtt', 'ttml', 'js', 'xml') 
3251         def filter_video(urls): 
3252             return list(filter(check_video, urls)) 
3254         # Start with something easy: JW Player in SWFObject 
3255         found = filter_video(re.findall(r'flashvars: [\'"](?:.*&)?file=(http[^\'"&]*)', webpage)) 
3257             # Look for gorilla-vid style embedding 
3258             found = filter_video(re.findall(r'''(?sx
) 
3262                     jwplayer\s
*\
(\s
*["'][^'"]+["']\s*\)\s*\.setup 
3265                 ['"]?
file['"]?\s*:\s*["\'](.*?)["\']''', webpage)) 
3267             # Broaden the search a little bit 
3268             found = filter_video(re.findall(r'[^A
-Za
-z0
-9]?
(?
:file|source
)=(http
[^
\'"&]*)', webpage)) 
3270             # Broaden the findall a little bit: JWPlayer JS loader 
3271             found = filter_video(re.findall( 
3272                 r'[^A-Za-z0-9]?(?:file|video_url)["\']?
:\s
*["\'](http(?![^\'"]+\
.[0-9]+[\'"])[^\'"]+)["\']', webpage)) 
3275             found = filter_video(re.findall(r'''(?xs) 
3276                 flowplayer\("[^
"]+",\s
* 
3278                     \s
*\
{[^
}]+? 
["']?clip["']?\s*:\s*\{\s* 
3279                         ["']?url
["']?\s*:\s*["']([^"']+)["'] 
3284                 r"cinerama\
.embedPlayer\
(\s
*\'[^
']+\',\s*'([^
']+)'", webpage) 
3286             # Try to find twitter cards info 
3287             # twitter:player:stream should be checked before twitter:player since 
3288             # it is expected to contain a raw stream (see 
3289             # https://dev.twitter.com/cards/types/player#On_twitter.com_via_desktop_browser) 
3290             found = filter_video(re.findall( 
3291                 r'<meta (?:property|name)="twitter
:player
:stream
" (?:content|value)="(.+?
)"', webpage)) 
3293             # We look for Open Graph info: 
3294             # We have to match any number of spaces between elements, some sites try to align them (e.g. statigr.am)
3295             m_video_type = re.findall(r'<meta.*?property="og
:video
:type".*?content="video
/(.*?
)"', webpage) 
3296             # We only look in og:video if the MIME type is a video, don't try if it's a Flash player: 
3297             if m_video_type is not None: 
3298                 found = filter_video(re.findall(r'<meta.*?property="og
:video
".*?content="(.*?
)"', webpage)) 
3300             REDIRECT_REGEX = r'[0-9]{,2};\s*(?:URL|url)=\'?([^\'"]+)' 
3302                 r'(?i
)<meta\s
+(?
=(?
:[a
-z
-]+="[^"]+"\s+)*http-equiv="refresh
")' 
3303                 r'(?:[a-z-]+="[^
"]+"\s
+)*?content
="%s' % REDIRECT_REGEX, 
3306                 # Look also in Refresh HTTP header 
3307                 refresh_header = head_response.headers.get('Refresh') 
3309                     # In Python 2, HTTP response headers are bytestrings
3310                     if sys.version_info < (3, 0) and isinstance(refresh_header, str): 
3311                         refresh_header = refresh_header.decode('iso-8859-1') 
3312                     found = re.search(REDIRECT_REGEX, refresh_header) 
3314                 new_url = compat_urlparse.urljoin(url, unescapeHTML(found.group(1))) 
3316                     self.report_following_redirect(new_url) 
3325             # twitter:player is an HTTPS URL to an iframe player that may or may not
3326             # be supported by youtube-dl, so it is checked last of all (see
3327             # https://dev.twitter.com/cards/types/player#On_twitter.com_via_desktop_browser)
3328             embed_url = self._html_search_meta('twitter:player', webpage, default=None) 
3329             if embed_url and embed_url != url: 
3330                 return self.url_result(embed_url) 
3333             raise UnsupportedError(url) 
3336         for video_url in orderedSet(found): 
3337             video_url = unescapeHTML(video_url) 
3338             video_url = video_url.replace('\\/', '/') 
3339             video_url = compat_urlparse.urljoin(url, video_url) 
3340             video_id = compat_urllib_parse_unquote(os.path.basename(video_url)) 
3342             # Sometimes, jwplayer extraction will result in a YouTube URL 
3343             if YoutubeIE.suitable(video_url): 
3344                 entries.append(self.url_result(video_url, 'Youtube')) 
3347             # here's a fun little line of code for you: 
3348             video_id = os.path.splitext(video_id)[0] 
3352                 'uploader': video_uploader, 
3353                 'title': video_title, 
3354                 'age_limit': age_limit, 
3357             if RtmpIE.suitable(video_url): 
3358                 entry_info_dict.update({ 
3359                     '_type': 'url_transparent', 
3360                     'ie_key': RtmpIE.ie_key(), 
3363                 entries.append(entry_info_dict) 
3366             ext = determine_ext(video_url) 
3368                 entry_info_dict['formats'] = self._extract_smil_formats(video_url, video_id) 
3370                 return self.playlist_result(self._extract_xspf_playlist(video_url, video_id), video_id) 
3372                 entry_info_dict['formats'] = self._extract_m3u8_formats(video_url, video_id, ext='mp4') 
3374                 entry_info_dict['formats'] = self._extract_mpd_formats(video_url, video_id) 
3376                 entry_info_dict['formats'] = self._extract_f4m_formats(video_url, video_id) 
3377             elif re.search(r'(?i)\.(?:ism|smil)/manifest', video_url) and video_url != url: 
3378                 # Just matching .ism/manifest is not enough to be reliably sure 
3379                 # whether it's actually an ISM manifest or some other streaming 
3380                 # manifest since there are various streaming URL formats 
3381                 # possible (see [1]) as well as some other shenanigans like 
3382                 # .smil/manifest URLs that actually serve an ISM (see [2]), and so on.
3384                 # Thus the most reasonable way to solve this is to delegate 
3385                 # to generic extractor in order to look into the contents of 
3386                 # the manifest itself. 
3387                 # 1. https://azure.microsoft.com/en-us/documentation/articles/media-services-deliver-content-overview/#streaming-url-formats 
3388                 # 2. https://svs.itworkscdn.net/lbcivod/smil:itwfcdn/lbci/170976.smil/Manifest 
3389                 entry_info_dict = self.url_result( 
3390                     smuggle_url(video_url, {'to_generic': True}), 
3393                 entry_info_dict['url'] = video_url 
3395             if entry_info_dict.get('formats'): 
3396                 self._sort_formats(entry_info_dict['formats']) 
3398             entries.append(entry_info_dict) 
3400         if len(entries) == 1: 
3403             for num, e in enumerate(entries, start=1): 
3404                 # 'url' results don't have a title 
3405                 if e.get('title') is not None: 
3406                     e['title'] = '%s (%d)' % (e['title'], num) 
3408                 '_type': 'playlist',