- """Information Extractor for xHamster"""
- _VALID_URL = r'(?:http://)?(?:www\.)?xhamster\.com/movies/(?P<id>[0-9]+)/(?P<seo>.+?)\.html(?:\?.*)?'
- _TESTS = [{
- 'url': 'http://xhamster.com/movies/1509445/femaleagent_shy_beauty_takes_the_bait.html',
- 'file': '1509445.mp4',
- 'md5': '8281348b8d3c53d39fffb377d24eac4e',
- 'info_dict': {
- "upload_date": "20121014",
- "uploader_id": "Ruseful2011",
- "title": "FemaleAgent Shy beauty takes the bait",
- "age_limit": 18,
- }
- },
- {
- 'url': 'http://xhamster.com/movies/2221348/britney_spears_sexy_booty.html?hd',
- 'file': '2221348.flv',
- 'md5': 'e767b9475de189320f691f49c679c4c7',
- 'info_dict': {
- "upload_date": "20130914",
- "uploader_id": "jojo747400",
- "title": "Britney Spears Sexy Booty",
- "age_limit": 18,
- }
- }]
-
- def _real_extract(self,url):
- def extract_video_url(webpage):
- mobj = re.search(r'\'srv\': \'(?P<server>[^\']*)\',\s*\'file\': \'(?P<file>[^\']+)\',', webpage)
- if mobj is None:
- raise ExtractorError('Unable to extract media URL')
- if len(mobj.group('server')) == 0:
- return compat_urllib_parse.unquote(mobj.group('file'))
- else:
- return mobj.group('server')+'/key='+mobj.group('file')
-
- def extract_mp4_video_url(webpage):
- mp4 = re.search(r'<a href=\"(.+?)\" class=\"mp4Play\"',webpage)
- if mp4 is None:
- return None
- else:
- return mp4.group(1)
+ _VALID_URL = r'(?P<proto>https?)://(?:.+?\.)?xhamster\.com/movies/(?P<id>[0-9]+)/(?P<seo>.+?)\.html(?:\?.*)?'
+ _TESTS = [
+ {
+ 'url': 'http://xhamster.com/movies/1509445/femaleagent_shy_beauty_takes_the_bait.html',
+ 'info_dict': {
+ 'id': '1509445',
+ 'ext': 'mp4',
+ 'title': 'FemaleAgent Shy beauty takes the bait',
+ 'upload_date': '20121014',
+ 'uploader': 'Ruseful2011',
+ 'duration': 893,
+ 'age_limit': 18,
+ }
+ },
+ {
+ 'url': 'http://xhamster.com/movies/2221348/britney_spears_sexy_booty.html?hd',
+ 'info_dict': {
+ 'id': '2221348',
+ 'ext': 'mp4',
+ 'title': 'Britney Spears Sexy Booty',
+ 'upload_date': '20130914',
+ 'uploader': 'jojo747400',
+ 'duration': 200,
+ 'age_limit': 18,
+ }
+ },
+ {
+ 'url': 'https://xhamster.com/movies/2272726/amber_slayed_by_the_knight.html',
+ 'only_matching': True,
+ },
+ ]
+
+ def _real_extract(self, url):
+ def extract_video_url(webpage, name):
+ return self._search_regex(
+ [r'''file\s*:\s*(?P<q>["'])(?P<mp4>.+?)(?P=q)''',
+ r'''<a\s+href=(?P<q>["'])(?P<mp4>.+?)(?P=q)\s+class=["']mp4Thumb''',
+ r'''<video[^>]+file=(?P<q>["'])(?P<mp4>.+?)(?P=q)[^>]*>'''],
+ webpage, name, group='mp4')