Update upstream source from tag 'upstream/2020.05.08'

[youtubedl] / youtube_dl / extractor / ninenow.py
diff --git a/youtube_dl/extractor/ninenow.py b/youtube_dl/extractor/ninenow.py

index faa5772376cac8c27dacabbf84f6ae1d5000980e..6157dc7c16e785ca7f570a45c36cd8e90bbd05e1 100644 (file)
--- a/youtube_dl/extractor/ninenow.py
+++ b/youtube_dl/extractor/ninenow.py
@@ -4,15 +4,17 @@ from __future__ import unicode_literals
 from .common import InfoExtractor
 from ..compat import compat_str
 from ..utils import (
+    ExtractorError,
     int_or_none,
     float_or_none,
-    ExtractorError,
+    smuggle_url,
 )
 
 
 class NineNowIE(InfoExtractor):
     IE_NAME = '9now.com.au'
     _VALID_URL = r'https?://(?:www\.)?9now\.com\.au/(?:[^/]+/){2}(?P<id>[^/?#]+)'
+    _GEO_COUNTRIES = ['AU']
     _TESTS = [{
         # clip
         'url': 'https://www.9now.com.au/afl-footy-show/2016/clip-ciql02091000g0hp5oktrnytc',
@@ -43,8 +45,25 @@ class NineNowIE(InfoExtractor):
         webpage = self._download_webpage(url, display_id)
         page_data = self._parse_json(self._search_regex(
             r'window\.__data\s*=\s*({.*?});', webpage,
-            'page data'), display_id)
-        common_data = page_data.get('episode', {}).get('episode') or page_data.get('clip', {}).get('clip')
+            'page data', default='{}'), display_id, fatal=False)
+        if not page_data:
+            page_data = self._parse_json(self._parse_json(self._search_regex(
+                r'window\.__data\s*=\s*JSON\.parse\s*\(\s*(".+?")\s*\)\s*;',
+                webpage, 'page data'), display_id), display_id)
+
+        for kind in ('episode', 'clip'):
+            current_key = page_data.get(kind, {}).get(
+                'current%sKey' % kind.capitalize())
+            if not current_key:
+                continue
+            cache = page_data.get(kind, {}).get('%sCache' % kind, {})
+            if not cache:
+                continue
+            common_data = (cache.get(current_key) or list(cache.values())[0])[kind]
+            break
+        else:
+            raise ExtractorError('Unable to find video data')
+
         video_data = common_data['video']
 
         if video_data.get('drm'):
@@ -62,7 +81,9 @@ class NineNowIE(InfoExtractor):
  
         return {
             '_type': 'url_transparent',
-            'url': self.BRIGHTCOVE_URL_TEMPLATE % brightcove_id,
+            'url': smuggle_url(
+                self.BRIGHTCOVE_URL_TEMPLATE % brightcove_id,
+                {'geo_countries': self._GEO_COUNTRIES}),
             'id': video_id,
             'title': title,
             'description': common_data.get('description'),