|
@ -73,6 +73,17 @@ class SohuIE(InfoExtractor): |
|
|
'title': '【神探苍实战秘籍】第13期 战争之影 赫卡里姆', |
|
|
'title': '【神探苍实战秘籍】第13期 战争之影 赫卡里姆', |
|
|
} |
|
|
} |
|
|
}] |
|
|
}] |
|
|
|
|
|
}, { |
|
|
|
|
|
'info': 'Video with title containing dash', |
|
|
|
|
|
'url': 'http://my.tv.sohu.com/us/249884221/78932792.shtml', |
|
|
|
|
|
'info_dict': { |
|
|
|
|
|
'id': '78932792', |
|
|
|
|
|
'ext': 'mp4', |
|
|
|
|
|
'title': 'youtube-dl testing video', |
|
|
|
|
|
}, |
|
|
|
|
|
'params': { |
|
|
|
|
|
'skip_download': True |
|
|
|
|
|
} |
|
|
}] |
|
|
}] |
|
|
|
|
|
|
|
|
def _real_extract(self, url): |
|
|
def _real_extract(self, url): |
|
@ -97,10 +108,8 @@ class SohuIE(InfoExtractor): |
|
|
mytv = mobj.group('mytv') is not None |
|
|
mytv = mobj.group('mytv') is not None |
|
|
|
|
|
|
|
|
webpage = self._download_webpage(url, video_id) |
|
|
webpage = self._download_webpage(url, video_id) |
|
|
raw_title = self._html_search_regex( |
|
|
|
|
|
r'(?s)<title>(.+?)</title>', |
|
|
|
|
|
webpage, 'video title') |
|
|
|
|
|
title = raw_title.partition('-')[0].strip() |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
title = self._og_search_title(webpage) |
|
|
|
|
|
|
|
|
vid = self._html_search_regex( |
|
|
vid = self._html_search_regex( |
|
|
r'var vid ?= ?["\'](\d+)["\']', |
|
|
r'var vid ?= ?["\'](\d+)["\']', |
|
|