]>
Raphaël G. Git Repositories - youtubedl/blob - test/test_all_urls.py
from __future__ import unicode_literals

# Allow direct execution
# NOTE(review): the three stdlib imports below were dropped by the text
# extraction; they are restored because the sys.path line and the test class
# use `os`, `sys` and `unittest`.
import os
import sys
import unittest
sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))


from test.helper import gettestcases

# NOTE(review): the original name list was lost in extraction; these are the
# names the test class references -- confirm against the upstream file.
from youtube_dl.extractor import (
    FacebookIE,
    gen_extractors,
    JustinTVIE,
    YoutubeIE,
)
class TestAllURLsMatching(unittest.TestCase):
    """Check which extractors claim a given URL or keyword.

    Each test feeds sample inputs to the extractors' ``suitable()`` method and
    compares the ``IE_NAME`` values of the extractors that accept them with
    the expected list.

    The test methods are documented with ``#`` comments rather than
    docstrings so that unittest keeps reporting them by method name.
    """

    # NOTE(review): the ``def setUp`` line was missing from the extracted
    # text; only its body survived. Reconstructed -- confirm against upstream.
    def setUp(self):
        self.ies = gen_extractors()

    def matching_ies(self, url):
        """Return the IE_NAME of every non-generic extractor accepting *url*.

        The order follows ``self.ies``. The extractor whose IE_NAME is
        ``'generic'`` is always left out.
        """
        return [
            ie.IE_NAME
            for ie in self.ies
            if ie.suitable(url) and ie.IE_NAME != 'generic'
        ]

    def assertMatch(self, url, ie_list):
        """Assert that exactly the extractors named in *ie_list* accept *url*."""
        self.assertEqual(self.matching_ies(url), ie_list)

    def test_youtube_playlist_matching(self):
        def assert_playlist(url):
            self.assertMatch(url, ['youtube:playlist'])

        assert_playlist('ECUl4u3cNGP61MdtwGTqZA0MreSaDybji8')
        assert_playlist('UUBABnxM4Ar9ten8Mdjj1j0Q')  # 585
        assert_playlist('PL63F0C78739B09958')
        assert_playlist('https://www.youtube.com/playlist?list=UUBABnxM4Ar9ten8Mdjj1j0Q')
        assert_playlist('https://www.youtube.com/course?list=ECUl4u3cNGP61MdtwGTqZA0MreSaDybji8')
        assert_playlist('https://www.youtube.com/playlist?list=PLwP_SiAcdui0KVebT0mU9Apz359a4ubsC')
        assert_playlist('https://www.youtube.com/watch?v=AV6J6_AeFEQ&playnext=1&list=PL4023E734DA416012')  # 668
        # An 11-character string starting with "PL" must not be claimed by
        # the playlist extractor (test_youtube_matching expects YoutubeIE to
        # accept it).
        self.assertFalse('youtube:playlist' in self.matching_ies('PLtS2H6bU1M'))
        assert_playlist('https://www.youtube.com/playlist?list=MCUS.20142101')

    def test_youtube_matching(self):
        self.assertTrue(YoutubeIE.suitable('PLtS2H6bU1M'))
        self.assertFalse(YoutubeIE.suitable('https://www.youtube.com/watch?v=AV6J6_AeFEQ&playnext=1&list=PL4023E734DA416012'))  # 668
        self.assertMatch('http://youtu.be/BaW_jenozKc', ['youtube'])
        self.assertMatch('http://www.youtube.com/v/BaW_jenozKc', ['youtube'])
        self.assertMatch('https://youtube.googleapis.com/v/BaW_jenozKc', ['youtube'])
        self.assertMatch('http://www.cleanvideosearch.com/media/action/yt/watch?videoId=8v_4O44sfjM', ['youtube'])

    def test_youtube_channel_matching(self):
        def assert_channel(url):
            self.assertMatch(url, ['youtube:channel'])

        assert_channel('https://www.youtube.com/channel/HCtnHdj3df7iM')
        assert_channel('https://www.youtube.com/channel/HCtnHdj3df7iM?feature=gb_ch_rec')
        assert_channel('https://www.youtube.com/channel/HCtnHdj3df7iM/videos')

    def test_youtube_user_matching(self):
        self.assertMatch('www.youtube.com/NASAgovVideo/videos', ['youtube:user'])

    def test_youtube_feeds(self):
        self.assertMatch('https://www.youtube.com/feed/watch_later', ['youtube:watch_later'])
        self.assertMatch('https://www.youtube.com/feed/subscriptions', ['youtube:subscriptions'])
        self.assertMatch('https://www.youtube.com/feed/recommended', ['youtube:recommended'])
        self.assertMatch('https://www.youtube.com/my_favorites', ['youtube:favorites'])

    def test_youtube_show_matching(self):
        self.assertMatch('http://www.youtube.com/show/airdisasters', ['youtube:show'])

    def test_youtube_truncated(self):
        self.assertMatch('http://www.youtube.com/watch?', ['youtube:truncated_url'])

    def test_youtube_search_matching(self):
        self.assertMatch('http://www.youtube.com/results?search_query=making+mustard', ['youtube:search_url'])
        self.assertMatch('https://www.youtube.com/results?baz=bar&search_query=youtube-dl+test+video&filters=video&lclk=video', ['youtube:search_url'])

    def test_justin_tv_channelid_matching(self):
        self.assertTrue(JustinTVIE.suitable('justin.tv/vanillatv'))
        self.assertTrue(JustinTVIE.suitable('twitch.tv/vanillatv'))
        self.assertTrue(JustinTVIE.suitable('www.justin.tv/vanillatv'))
        self.assertTrue(JustinTVIE.suitable('www.twitch.tv/vanillatv'))
        self.assertTrue(JustinTVIE.suitable('http://www.justin.tv/vanillatv'))
        self.assertTrue(JustinTVIE.suitable('http://www.twitch.tv/vanillatv'))
        self.assertTrue(JustinTVIE.suitable('http://www.justin.tv/vanillatv/'))
        self.assertTrue(JustinTVIE.suitable('http://www.twitch.tv/vanillatv/'))

    def test_justintv_videoid_matching(self):
        self.assertTrue(JustinTVIE.suitable('http://www.twitch.tv/vanillatv/b/328087483'))

    def test_justin_tv_chapterid_matching(self):
        self.assertTrue(JustinTVIE.suitable('http://www.twitch.tv/tsm_theoddone/c/2349361'))

    def test_youtube_extract(self):
        # The second parameter is named `expected_id` so it does not shadow
        # the builtin `id`.
        def assert_extract_id(url, expected_id):
            self.assertEqual(YoutubeIE.extract_id(url), expected_id)

        assert_extract_id('http://www.youtube.com/watch?&v=BaW_jenozKc', 'BaW_jenozKc')
        assert_extract_id('https://www.youtube.com/watch?&v=BaW_jenozKc', 'BaW_jenozKc')
        assert_extract_id('https://www.youtube.com/watch?feature=player_embedded&v=BaW_jenozKc', 'BaW_jenozKc')
        assert_extract_id('https://www.youtube.com/watch_popup?v=BaW_jenozKc', 'BaW_jenozKc')
        assert_extract_id('http://www.youtube.com/watch?v=BaW_jenozKcsharePLED17F32AD9753930', 'BaW_jenozKc')
        assert_extract_id('BaW_jenozKc', 'BaW_jenozKc')

    def test_facebook_matching(self):
        self.assertTrue(FacebookIE.suitable('https://www.facebook.com/Shiniknoh#!/photo.php?v=10153317450565268'))

    def test_no_duplicates(self):
        # Every test-case URL must be accepted by GenericIE and by the
        # extractor named after the test case, and rejected by all others.
        ies = gen_extractors()
        for tc in gettestcases(include_onlymatching=True):
            # NOTE(review): the `url = ...` line, the inner `for` line and
            # the `else:` line were missing from the extracted text (`url`
            # and `ie` were used but never bound). Reconstructed -- confirm
            # against upstream.
            url = tc['url']
            for ie in ies:
                ie_class_name = type(ie).__name__
                if ie_class_name in ('GenericIE', tc['name'] + 'IE'):
                    self.assertTrue(ie.suitable(url), '%s should match URL %r' % (ie_class_name, url))
                else:
                    self.assertFalse(ie.suitable(url), '%s should not match URL %r' % (ie_class_name, url))

    def test_keywords(self):
        self.assertMatch(':ytsubs', ['youtube:subscriptions'])
        self.assertMatch(':ytsubscriptions', ['youtube:subscriptions'])
        self.assertMatch(':ythistory', ['youtube:history'])
        self.assertMatch(':thedailyshow', ['ComedyCentralShows'])
        self.assertMatch(':tds', ['ComedyCentralShows'])
        self.assertMatch(':colbertreport', ['ComedyCentralShows'])
        self.assertMatch(':cr', ['ComedyCentralShows'])

    def test_vimeo_matching(self):
        self.assertMatch('http://vimeo.com/channels/tributes', ['vimeo:channel'])
        self.assertMatch('http://vimeo.com/channels/31259', ['vimeo:channel'])
        self.assertMatch('http://vimeo.com/channels/31259/53576664', ['vimeo'])
        self.assertMatch('http://vimeo.com/user7108434', ['vimeo:user'])
        self.assertMatch('http://vimeo.com/user7108434/videos', ['vimeo:user'])
        self.assertMatch('https://vimeo.com/user21297594/review/75524534/3c257a1b5d', ['vimeo:review'])

    # https://github.com/rg3/youtube-dl/issues/1930
    def test_soundcloud_not_matching_sets(self):
        self.assertMatch('http://soundcloud.com/floex/sets/gone-ep', ['soundcloud:set'])

    def test_tumblr(self):
        self.assertMatch('http://tatianamaslanydaily.tumblr.com/post/54196191430/orphan-black-dvd-extra-behind-the-scenes', ['Tumblr'])
        self.assertMatch('http://tatianamaslanydaily.tumblr.com/post/54196191430', ['Tumblr'])

    # NOTE(review): the `def` line for the PBS assertions was missing from
    # the extracted text; the method name `test_pbs` is an assumption --
    # confirm against upstream.
    def test_pbs(self):
        # https://github.com/rg3/youtube-dl/issues/2350
        self.assertMatch('http://video.pbs.org/viralplayer/2365173446/', ['PBS'])
        self.assertMatch('http://video.pbs.org/widget/partnerplayer/980042464/', ['PBS'])

    def test_ComedyCentralShows(self):
        # NOTE(review): the `self.assertMatch(` opener of each call below was
        # missing from the extracted text; only the argument lines survived.
        self.assertMatch(
            'http://thedailyshow.cc.com/extended-interviews/xm3fnq/andrew-napolitano-extended-interview',
            ['ComedyCentralShows'])
        self.assertMatch(
            'http://thecolbertreport.cc.com/videos/29w6fx/-realhumanpraise-for-fox-news',
            ['ComedyCentralShows'])
        self.assertMatch(
            'http://thecolbertreport.cc.com/videos/gh6urb/neil-degrasse-tyson-pt--1?xrs=eml_col_031114',
            ['ComedyCentralShows'])
        self.assertMatch(
            'http://thedailyshow.cc.com/guests/michael-lewis/3efna8/exclusive---michael-lewis-extended-interview-pt--3',
            ['ComedyCentralShows'])
        self.assertMatch(
            'http://thedailyshow.cc.com/episodes/sy7yv0/april-8--2014---denis-leary',
            ['ComedyCentralShows'])
        self.assertMatch(
            'http://thecolbertreport.cc.com/episodes/8ase07/april-8--2014---jane-goodall',
            ['ComedyCentralShows'])
        self.assertMatch(
            'http://thedailyshow.cc.com/video-playlists/npde3s/the-daily-show-19088-highlights',
            ['ComedyCentralShows'])
        self.assertMatch(
            'http://thedailyshow.cc.com/special-editions/2l8fdb/special-edition---a-look-back-at-food',
            ['ComedyCentralShows'])

    def test_yahoo_https(self):
        # https://github.com/rg3/youtube-dl/issues/2701
        # NOTE(review): the call opener and the expected-extractor list were
        # missing from the extracted text; ['Yahoo'] is an assumption --
        # confirm against upstream.
        self.assertMatch(
            'https://screen.yahoo.com/smartwatches-latest-wearable-gadgets-163745379-cbs.html',
            ['Yahoo'])
# Run the test suite when this file is executed directly.
# NOTE(review): the body of this guard was missing from the extracted text;
# `unittest.main()` is the assumed original -- confirm against upstream.
if __name__ == '__main__':
    unittest.main()