|
|
@ -0,0 +1,69 @@ |
|
|
|
# coding: utf-8 |
|
|
|
from __future__ import unicode_literals |
|
|
|
|
|
|
|
from .common import InfoExtractor |
|
|
|
from ..compat import compat_urllib_parse_unquote |
|
|
|
from ..utils import ( |
|
|
|
int_or_none, |
|
|
|
xpath_text, |
|
|
|
) |
|
|
|
|
|
|
|
|
|
|
|
class NozIE(InfoExtractor):
    """Extractor for video pages on noz.de.

    The video metadata is not embedded in the page itself.  It is reached
    through two indirections: the page references a ``videojs_*`` script,
    that script carries a URL-encoded ``config_url`` variable, and the
    configuration URL finally serves an XML document describing the title,
    thumbnail, duration and the available qualities.
    """

    _VALID_URL = r'https?://(?:www\.)?noz\.de/video/(?P<id>[0-9]+)/'
    _TESTS = [{
        'url': 'http://www.noz.de/video/25151/32-Deutschland-gewinnt-Badminton-Lnderspiel-in-Melle',
        'info_dict': {
            'id': '25151',
            'ext': 'mp4',
            'duration': 215,
            'title': '3:2 - Deutschland gewinnt Badminton-Länderspiel in Melle',
            'description': 'Vor rund 370 Zuschauern gewinnt die deutsche Badminton-Nationalmannschaft am Donnerstag ein EM-Vorbereitungsspiel gegen Frankreich in Melle. Video Moritz Frankenberg.',
            # Raw string: ``\.`` is a regex escape, not a string escape.
            'thumbnail': r're:^http://.*\.jpg',
        },
    }]

    def _real_extract(self, url):
        """Return the info dict for the noz.de video page at *url*.

        The result contains ``id``, ``formats``, ``title``, ``duration``,
        ``description`` and ``thumbnail``.  Only qualities that expose a
        non-empty ``video/mp4`` URL are turned into formats.
        """
        video_id = self._match_id(url)
        webpage = self._download_webpage(url, video_id)
        description = self._og_search_description(webpage)

        # Step 1: locate the player script referenced by the page.
        edge_url = self._html_search_regex(
            r'<script\s+(?:type="text/javascript"\s+)?src="(.*?/videojs_.*?)"',
            webpage, 'edge URL')
        # Pass the real video id so progress/error output is attributed to
        # this video; the human-readable label belongs in the note.
        edge_content = self._download_webpage(
            edge_url, video_id, 'Downloading meta configuration')

        # Step 2: the script stores the configuration URL percent-encoded,
        # after a comma inside the "config_url" variable value.
        config_url_encoded = self._search_regex(
            r'so\.addVariable\("config_url","[^,]*,(.*?)"',
            edge_content, 'config URL')
        config_url = compat_urllib_parse_unquote(config_url_encoded)

        # Step 3: the XML configuration holds the actual metadata.
        doc = self._download_xml(
            config_url, video_id, 'Downloading video configuration')
        title = xpath_text(doc, './/title')
        thumbnail = xpath_text(doc, './/article/thumbnail/url')
        duration = int_or_none(xpath_text(
            doc, './/article/movie/file/duration'))

        formats = []
        for qnode in doc.findall('.//article/movie/file/qualities/qual'):
            video_node = qnode.find('./html_urls/video_url[@format="video/mp4"]')
            # Skip qualities without a usable mp4 URL (the original code
            # marks this case as "auto"); an empty element would otherwise
            # produce a format whose URL is None.
            if video_node is None or not video_node.text:
                continue
            formats.append({
                'url': video_node.text,
                'format_name': xpath_text(qnode, './name'),
                'format_id': xpath_text(qnode, './id'),
                'height': int_or_none(xpath_text(qnode, './height')),
                'width': int_or_none(xpath_text(qnode, './width')),
                'tbr': int_or_none(xpath_text(qnode, './bitrate'), scale=1000),
            })
        self._sort_formats(formats)

        return {
            'id': video_id,
            'formats': formats,
            'title': title,
            'duration': duration,
            'description': description,
            'thumbnail': thumbnail,
        }