]>
Raphaël G. Git Repositories - youtubedl/blob - youtube_dl/extractor/instagram.py
3 from .common
import InfoExtractor
5 class InstagramIE(InfoExtractor
):
6 _VALID_URL
= r
'(?:http://)?instagram.com/p/(.*?)/'
8 u
'url': u
'http://instagram.com/p/aye83DjauH/#',
9 u
'file': u
'aye83DjauH.mp4',
10 u
'md5': u
'0d2da106a9d2631273e192b372806516',
12 u
"uploader_id": u
"naomipq",
13 u
"title": u
"Video by naomipq"
17 def _real_extract(self
, url
):
18 mobj
= re
.match(self
._VALID
_URL
, url
)
19 video_id
= mobj
.group(1)
20 webpage
= self
._download
_webpage
(url
, video_id
)
21 video_url
= self
._html
_search
_regex
(
22 r
'<meta property="og:video" content="(.+?)"',
23 webpage
, u
'video URL')
24 thumbnail_url
= self
._html
_search
_regex
(
25 r
'<meta property="og:image" content="(.+?)" />',
26 webpage
, u
'thumbnail URL', fatal
=False)
27 html_title
= self
._html
_search
_regex
(
28 r
'<title>(.+?)</title>',
29 webpage
, u
'title', flags
=re
.DOTALL
)
30 title
= re
.sub(u
'(?: *\(Videos?\))? \u2022 Instagram$', '', html_title
).strip()
31 uploader_id
= self
._html
_search
_regex
(r
'content="(.*?)\'s video on Instagram
',
32 webpage, u'uploader name
', fatal=False)
40 'thumbnail
': thumbnail_url,
41 'uploader_id
' : uploader_id