Imported Upstream version 2015.07.21

[youtubedl] / youtube_dl / extractor / twitch.py
diff --git a/youtube_dl/extractor/twitch.py b/youtube_dl/extractor/twitch.py

index 94bd6345da18815a50b72502a8b91ae4e30ae2b5..73ce335b7f0a5b5790f8dd65e3ac170e9791b7d8 100644 (file)
--- a/youtube_dl/extractor/twitch.py
+++ b/youtube_dl/extractor/twitch.py
@@ -22,8 +22,8 @@ class TwitchBaseIE(InfoExtractor):
  
      _API_BASE = 'https://api.twitch.tv'
      _USHER_BASE = 'http://usher.twitch.tv'
-    _LOGIN_URL = 'https://secure.twitch.tv/user/login'
-    _LOGIN_POST_URL = 'https://secure-login.twitch.tv/login'
+    _LOGIN_URL = 'https://secure.twitch.tv/login'
+    _LOGIN_POST_URL = 'https://passport.twitch.tv/authorize'
      _NETRC_MACHINE = 'twitch'
  
      def _handle_error(self, response):
@@ -59,20 +59,12 @@ class TwitchBaseIE(InfoExtractor):
          login_page = self._download_webpage(
              self._LOGIN_URL, None, 'Downloading login page')
  
-        authenticity_token = self._search_regex(
-            r'<input name="authenticity_token" type="hidden" value="([^"]+)"',
-            login_page, 'authenticity token')
-
-        login_form = {
-            'utf8': '✓'.encode('utf-8'),
-            'authenticity_token': authenticity_token,
-            'redirect_on_login': '',
-            'embed_form': 'false',
-            'mp_source_action': 'login-button',
-            'follow': '',
-            'login': username,
-            'password': password,
-        }
+        login_form = self._hidden_inputs(login_page)
+
+        login_form.update({
+            'login': username.encode('utf-8'),
+            'password': password.encode('utf-8'),
+        })
  
          request = compat_urllib_request.Request(
              self._LOGIN_POST_URL, compat_urllib_parse.urlencode(login_form).encode('utf-8'))
@@ -80,11 +72,15 @@ class TwitchBaseIE(InfoExtractor):
          response = self._download_webpage(
              request, None, 'Logging in as %s' % username)
  
-        m = re.search(
-            r"id=([\"'])login_error_message\1[^>]*>(?P<msg>[^<]+)", response)
-        if m:
+        error_message = self._search_regex(
+            r'<div[^>]+class="subwindow_notice"[^>]*>([^<]+)</div>',
+            response, 'error message', default=None)
+        if error_message:
              raise ExtractorError(
-                'Unable to login: %s' % m.group('msg').strip(), expected=True)
+                'Unable to login. Twitch said: %s' % error_message, expected=True)
+
+        if '>Reset your password<' in response:
+            self.report_warning('Twitch asks you to reset your password, go to https://secure.twitch.tv/reset/submit')
  
      def _prefer_source(self, formats):
          try:
@@ -189,17 +185,17 @@ class TwitchVodIE(TwitchItemBaseIE):
      _ITEM_SHORTCUT = 'v'
  
      _TEST = {
-        'url': 'http://www.twitch.tv/ksptv/v/3622000',
+        'url': 'http://www.twitch.tv/riotgames/v/6528877',
          'info_dict': {
-            'id': 'v3622000',
+            'id': 'v6528877',
              'ext': 'mp4',
-            'title': '''KSPTV: Squadcast: "Everyone's on vacation so here's Dahud" Edition!''',
+            'title': 'LCK Summer Split - Week 6 Day 1',
              'thumbnail': 're:^https?://.*\.jpg$',
-            'duration': 6951,
-            'timestamp': 1419028564,
-            'upload_date': '20141219',
-            'uploader': 'KSPTV',
-            'uploader_id': 'ksptv',
+            'duration': 17208,
+            'timestamp': 1435131709,
+            'upload_date': '20150624',
+            'uploader': 'Riot Games',
+            'uploader_id': 'riotgames',
              'view_count': int,
          },
          'params': {
@@ -215,7 +211,7 @@ class TwitchVodIE(TwitchItemBaseIE):
              '%s/api/vods/%s/access_token' % (self._API_BASE, item_id), item_id,
              'Downloading %s access token' % self._ITEM_TYPE)
          formats = self._extract_m3u8_formats(
-            '%s/vod/%s?nauth=%s&nauthsig=%s'
+            '%s/vod/%s?nauth=%s&nauthsig=%s&allow_source=true'
              % (self._USHER_BASE, item_id, access_token['token'], access_token['sig']),
              item_id, 'mp4')
          self._prefer_source(formats)
@@ -314,9 +310,9 @@ class TwitchBookmarksIE(TwitchPlaylistBaseIE):
  
  class TwitchStreamIE(TwitchBaseIE):
      IE_NAME = 'twitch:stream'
-    _VALID_URL = r'%s/(?P<id>[^/]+)/?(?:\#.*)?$' % TwitchBaseIE._VALID_URL_BASE
+    _VALID_URL = r'%s/(?P<id>[^/#?]+)/?(?:\#.*)?$' % TwitchBaseIE._VALID_URL_BASE
  
-    _TEST = {
+    _TESTS = [{
          'url': 'http://www.twitch.tv/shroomztv',
          'info_dict': {
              'id': '12772022048',
@@ -335,7 +331,10 @@ class TwitchStreamIE(TwitchBaseIE):
              # m3u8 download
              'skip_download': True,
          },
-    }
+    }, {
+        'url': 'http://www.twitch.tv/miracle_doto#profile-0',
+        'only_matching': True,
+    }]
  
      def _real_extract(self, url):
          channel_id = self._match_id(url)
@@ -350,6 +349,12 @@ class TwitchStreamIE(TwitchBaseIE):
                  'http://www.twitch.tv/%s/profile' % channel_id,
                  'TwitchProfile', channel_id)
  
+        # Channel name may be typed if different case than the original channel name
+        # (e.g. http://www.twitch.tv/TWITCHPLAYSPOKEMON) that will lead to constructing
+        # an invalid m3u8 URL. Working around by use of original channel name from stream
+        # JSON and fallback to lowercase if it's not available.
+        channel_id = stream.get('channel', {}).get('name') or channel_id.lower()
+
          access_token = self._download_json(
              '%s/api/channels/%s/access_token' % (self._API_BASE, channel_id), channel_id,
              'Downloading channel access token')