[rumble] add support for embed pages(#10785)

author: Remita Amine <remitamine@gmail.com> 2020-11-22 13:07:04 +0100
committer: Remita Amine <remitamine@gmail.com> 2020-11-22 13:07:04 +0100
commit: 9d531aa2918067570e4827fcced59c60accac220 (patch)
tree: 6df99db373dd2794e4f834048eeaacd9f4e91cde
parent: e9cbb98a0f63e08cf7c42d1612450e2534c8de7e (diff)
download: youtube-dl-9d531aa2918067570e4827fcced59c60accac220.tar.gz
youtube-dl-9d531aa2918067570e4827fcced59c60accac220.tar.xz
youtube-dl-9d531aa2918067570e4827fcced59c60accac220.zip
2 files changed, 68 insertions, 0 deletions
diff --git a/youtube_dl/extractor/extractors.py b/youtube_dl/extractor/extractors.py
index 356f4cc6b..31fb4c95a 100644
--- a/youtube_dl/extractor/extractors.py
+++ b/youtube_dl/extractor/extractors.py
@@ -963,6 +963,7 @@ from .rtve import RTVEALaCartaIE, RTVELiveIE, RTVEInfantilIE, RTVELiveIE, RTVETe
 from .rtvnh import RTVNHIE
 from .rtvs import RTVSIE
 from .ruhd import RUHDIE
+from .rumble import RumbleEmbedIE
 from .rutube import (
     RutubeIE,
     RutubeChannelIE,
diff --git a/youtube_dl/extractor/rumble.py b/youtube_dl/extractor/rumble.py
new file mode 100644
index 000000000..4a0225109
--- /dev/null
+++ b/youtube_dl/extractor/rumble.py
@@ -0,0 +1,67 @@
+# coding: utf-8
+from __future__ import unicode_literals
+
+from .common import InfoExtractor
+from ..compat import compat_str
+from ..utils import (
+    determine_ext,
+    int_or_none,
+    parse_iso8601,
+    try_get,
+)
+
+
+class RumbleEmbedIE(InfoExtractor):
+    _VALID_URL = r'https?://(?:www\.)?rumble\.com/embed/(?:[0-9a-z]+\.)?(?P<id>[0-9a-z]+)'
+    _TESTS = [{
+        'url': 'https://rumble.com/embed/v5pv5f',
+        'md5': '36a18a049856720189f30977ccbb2c34',
+        'info_dict': {
+            'id': 'v5pv5f',
+            'ext': 'mp4',
+            'title': 'WMAR 2 News Latest Headlines | October 20, 6pm',
+            'timestamp': 1571611968,
+            'upload_date': '20191020',
+        }
+    }, {
+        'url': 'https://rumble.com/embed/ufe9n.v5pv5f',
+        'only_matching': True,
+    }]
+
+    def _real_extract(self, url):
+        video_id = self._match_id(url)
+        video = self._download_json(
+            'https://rumble.com/embedJS/', video_id,
+            query={'request': 'video', 'v': video_id})
+        title = video['title']
+
+        formats = []
+        for height, ua in (video.get('ua') or {}).items():
+            for i in range(2):
+                f_url = try_get(ua, lambda x: x[i], compat_str)
+                if f_url:
+                    ext = determine_ext(f_url)
+                    f = {
+                        'ext': ext,
+                        'format_id': '%s-%sp' % (ext, height),
+                        'height': int_or_none(height),
+                        'url': f_url,
+                    }
+                    bitrate = try_get(ua, lambda x: x[i + 2]['bitrate'])
+                    if bitrate:
+                        f['tbr'] = int_or_none(bitrate)
+                    formats.append(f)
+        self._sort_formats(formats)
+
+        author = video.get('author') or {}
+
+        return {
+            'id': video_id,
+            'title': title,
+            'formats': formats,
+            'thumbnail': video.get('i'),
+            'timestamp': parse_iso8601(video.get('pubDate')),
+            'channel': author.get('name'),
+            'channel_url': author.get('url'),
+            'duration': int_or_none(video.get('duration')),
+        }
author	Remita Amine <remitamine@gmail.com>	2020-11-22 13:07:04 +0100
committer	Remita Amine <remitamine@gmail.com>	2020-11-22 13:07:04 +0100
commit	9d531aa2918067570e4827fcced59c60accac220 (patch)
tree	6df99db373dd2794e4f834048eeaacd9f4e91cde
parent	e9cbb98a0f63e08cf7c42d1612450e2534c8de7e (diff)
download	youtube-dl-9d531aa2918067570e4827fcced59c60accac220.tar.gz youtube-dl-9d531aa2918067570e4827fcced59c60accac220.tar.xz youtube-dl-9d531aa2918067570e4827fcced59c60accac220.zip