]> Raphaƫl G. Git Repositories - youtubedl/blob - test/test_InfoExtractor.py
debian/control: Add recommends on ca-certificates.
[youtubedl] / test / test_InfoExtractor.py
1 #!/usr/bin/env python
2
3 from __future__ import unicode_literals
4
5 # Allow direct execution
6 import os
7 import sys
8 import unittest
9 sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
10
11 from test.helper import FakeYDL
12 from youtube_dl.extractor.common import InfoExtractor
13 from youtube_dl.extractor import YoutubeIE, get_info_extractor
14 from youtube_dl.utils import encode_data_uri, strip_jsonp, ExtractorError
15
16
17 class TestIE(InfoExtractor):
18 pass
19
20
21 class TestInfoExtractor(unittest.TestCase):
22 def setUp(self):
23 self.ie = TestIE(FakeYDL())
24
25 def test_ie_key(self):
26 self.assertEqual(get_info_extractor(YoutubeIE.ie_key()), YoutubeIE)
27
28 def test_html_search_regex(self):
29 html = '<p id="foo">Watch this <a href="http://www.youtube.com/watch?v=BaW_jenozKc">video</a></p>'
30 search = lambda re, *args: self.ie._html_search_regex(re, html, *args)
31 self.assertEqual(search(r'<p id="foo">(.+?)</p>', 'foo'), 'Watch this video')
32
33 def test_opengraph(self):
34 ie = self.ie
35 html = '''
36 <meta name="og:title" content='Foo'/>
37 <meta content="Some video's description " name="og:description"/>
38 <meta property='og:image' content='http://domain.com/pic.jpg?key1=val1&amp;key2=val2'/>
39 <meta content='application/x-shockwave-flash' property='og:video:type'>
40 <meta content='Foo' property=og:foobar>
41 <meta name="og:test1" content='foo > < bar'/>
42 <meta name="og:test2" content="foo >//< bar"/>
43 '''
44 self.assertEqual(ie._og_search_title(html), 'Foo')
45 self.assertEqual(ie._og_search_description(html), 'Some video\'s description ')
46 self.assertEqual(ie._og_search_thumbnail(html), 'http://domain.com/pic.jpg?key1=val1&key2=val2')
47 self.assertEqual(ie._og_search_video_url(html, default=None), None)
48 self.assertEqual(ie._og_search_property('foobar', html), 'Foo')
49 self.assertEqual(ie._og_search_property('test1', html), 'foo > < bar')
50 self.assertEqual(ie._og_search_property('test2', html), 'foo >//< bar')
51
52 def test_html_search_meta(self):
53 ie = self.ie
54 html = '''
55 <meta name="a" content="1" />
56 <meta name='b' content='2'>
57 <meta name="c" content='3'>
58 <meta name=d content='4'>
59 <meta property="e" content='5' >
60 <meta content="6" name="f">
61 '''
62
63 self.assertEqual(ie._html_search_meta('a', html), '1')
64 self.assertEqual(ie._html_search_meta('b', html), '2')
65 self.assertEqual(ie._html_search_meta('c', html), '3')
66 self.assertEqual(ie._html_search_meta('d', html), '4')
67 self.assertEqual(ie._html_search_meta('e', html), '5')
68 self.assertEqual(ie._html_search_meta('f', html), '6')
69
70 def test_download_json(self):
71 uri = encode_data_uri(b'{"foo": "blah"}', 'application/json')
72 self.assertEqual(self.ie._download_json(uri, None), {'foo': 'blah'})
73 uri = encode_data_uri(b'callback({"foo": "blah"})', 'application/javascript')
74 self.assertEqual(self.ie._download_json(uri, None, transform_source=strip_jsonp), {'foo': 'blah'})
75 uri = encode_data_uri(b'{"foo": invalid}', 'application/json')
76 self.assertRaises(ExtractorError, self.ie._download_json, uri, None)
77 self.assertEqual(self.ie._download_json(uri, None, fatal=False), None)
78
79 if __name__ == '__main__':
80 unittest.main()