about summary refs log tree commit diff
diff options
context:
space:
mode:
author Jaime Marquínez Ferrándiz <jaime.marquinez.ferrandiz@gmail.com> 2013-06-20 14:15:29 +0200
committer Jaime Marquínez Ferrándiz <jaime.marquinez.ferrandiz@gmail.com> 2013-06-20 14:15:29 +0200
commit 587c68b2cdef65766d4dc408b04bd67cf8d2daf2 (patch)
tree 652a25e2b51627c484d603d52ba72c98f774e1c3
parent 377fdf5dde6a8fe477f5c3cd721df82112d41de7 (diff)
download youtube-dl-587c68b2cdef65766d4dc408b04bd67cf8d2daf2.tar.gz
youtube-dl-587c68b2cdef65766d4dc408b04bd67cf8d2daf2.tar.xz
youtube-dl-587c68b2cdef65766d4dc408b04bd67cf8d2daf2.zip
DailymotionIE: fix the extraction of the video uploader and use _search_regex for getting it
-rwxr-xr-x youtube_dl/InfoExtractors.py 14
1 files changed, 4 insertions, 10 deletions
diff --git a/youtube_dl/InfoExtractors.py b/youtube_dl/InfoExtractors.py
index 59f65aca3..c80a74ef6 100755
--- a/youtube_dl/InfoExtractors.py
+++ b/youtube_dl/InfoExtractors.py
@@ -940,16 +940,10 @@ class DailymotionIE(InfoExtractor):
         video_title = unescapeHTML(mobj.group('title'))
 
         video_uploader = None
-        mobj = re.search(r'(?im)<span class="owner[^\"]+?">[^<]+?<a [^>]+?>([^<]+?)</a>', webpage)
-        if mobj is None:
-            # lookin for official user
-            mobj_official = re.search(r'<span rel="author"[^>]+?>([^<]+?)</span>', webpage)
-            if mobj_official is None:
-                self._downloader.report_warning(u'unable to extract uploader nickname')
-            else:
-                video_uploader = mobj_official.group(1)
-        else:
-            video_uploader = mobj.group(1)
+        video_uploader = self._search_regex([r'(?im)<span class="owner[^\"]+?">[^<]+?<a [^>]+?>([^<]+?)</a>',
+                                             # Looking for official user
+                                             r'<(?:span|a) .*?rel="author".*?>([^<]+?)</'],
+                                            webpage, 'video uploader')
 
         video_upload_date = None
         mobj = re.search(r'<div class="[^"]*uploaded_cont[^"]*" title="[^"]*">([0-9]{2})-([0-9]{2})-([0-9]{4})</div>', webpage)