summary refs log tree commit diff
diff options
context:
space:
mode:
authorSergey M․ <dstftw@gmail.com>2017-07-02 20:04:08 +0700
committerSergey M․ <dstftw@gmail.com>2017-07-02 20:06:15 +0700
commit50ae3f646e6c7eec187078dd43f1cb3777ccfb4c (patch)
tree1f2b54928c44b2416a2e63ad1f315ab03847e647
parent99a7e76240f3e79d770bff0029dc3321e14b2a97 (diff)
downloadyoutube-dl-50ae3f646e6c7eec187078dd43f1cb3777ccfb4c.tar.gz
youtube-dl-50ae3f646e6c7eec187078dd43f1cb3777ccfb4c.tar.xz
youtube-dl-50ae3f646e6c7eec187078dd43f1cb3777ccfb4c.zip
[thisoldhouse] Add more fallbacks for video id (closes #13541)
-rw-r--r--youtube_dl/extractor/thisoldhouse.py17
1 files changed, 13 insertions, 4 deletions
diff --git a/youtube_dl/extractor/thisoldhouse.py b/youtube_dl/extractor/thisoldhouse.py
index 0c321354f..6ab147ad7 100644
--- a/youtube_dl/extractor/thisoldhouse.py
+++ b/youtube_dl/extractor/thisoldhouse.py
@@ -2,6 +2,8 @@
 from __future__ import unicode_literals
 
 from .common import InfoExtractor
+from ..compat import compat_str
+from ..utils import try_get
 
 
 class ThisOldHouseIE(InfoExtractor):
@@ -28,8 +30,15 @@ class ThisOldHouseIE(InfoExtractor):
     def _real_extract(self, url):
         display_id = self._match_id(url)
         webpage = self._download_webpage(url, display_id)
-        drupal_settings = self._parse_json(self._search_regex(
-            r'jQuery\.extend\(Drupal\.settings\s*,\s*({.+?})\);',
-            webpage, 'drupal settings'), display_id)
-        video_id = list(drupal_settings['comScore'])[0]
+        video_id = self._search_regex(
+            (r'data-mid=(["\'])(?P<id>(?:(?!\1).)+)\1',
+             r'id=(["\'])inline-video-player-(?P<id>(?:(?!\1).)+)\1'),
+            webpage, 'video id', default=None, group='id')
+        if not video_id:
+            drupal_settings = self._parse_json(self._search_regex(
+                r'jQuery\.extend\(Drupal\.settings\s*,\s*({.+?})\);',
+                webpage, 'drupal settings'), display_id)
+            video_id = try_get(
+                drupal_settings, lambda x: x['jwplatform']['video_id'],
+                compat_str) or list(drupal_settings['comScore'])[0]
         return self.url_result('jwplatform:' + video_id, 'JWPlatform', video_id)