|
|
@ -1,54 +1,80 @@ |
|
|
|
from __future__ import unicode_literals |
|
|
|
|
|
|
|
import re |
|
|
|
|
|
|
|
from .common import InfoExtractor |
|
|
|
from ..utils import ExtractorError |
|
|
|
|
|
|
|
|
|
|
|
class NhkVodIE(InfoExtractor): |
|
|
|
_VALID_URL = r'https?://www3\.nhk\.or\.jp/nhkworld/en/(?:vod|ondemand)/(?P<id>[^/]+/[^/?#&]+)' |
|
|
|
_VALID_URL = r'https?://www3\.nhk\.or\.jp/nhkworld/(?P<lang>[a-z]{2})/ondemand/(?P<type>video|audio)/(?P<id>\d{7}|[a-z]+-\d{8}-\d+)' |
|
|
|
# Content available only for a limited period of time. Visit |
|
|
|
# https://www3.nhk.or.jp/nhkworld/en/ondemand/ for working samples. |
|
|
|
_TESTS = [{ |
|
|
|
# Videos available only for a limited period of time. Visit |
|
|
|
# http://www3.nhk.or.jp/nhkworld/en/vod/ for working samples. |
|
|
|
'url': 'http://www3.nhk.or.jp/nhkworld/en/vod/tokyofashion/20160815', |
|
|
|
'info_dict': { |
|
|
|
'id': 'A1bnNiNTE6nY3jLllS-BIISfcC_PpvF5', |
|
|
|
'ext': 'flv', |
|
|
|
'title': 'TOKYO FASHION EXPRESS - The Kimono as Global Fashion', |
|
|
|
'description': 'md5:db338ee6ce8204f415b754782f819824', |
|
|
|
'series': 'TOKYO FASHION EXPRESS', |
|
|
|
'episode': 'The Kimono as Global Fashion', |
|
|
|
}, |
|
|
|
'skip': 'Videos available only for a limited period of time', |
|
|
|
}, { |
|
|
|
'url': 'https://www3.nhk.or.jp/nhkworld/en/ondemand/video/2015173/', |
|
|
|
'only_matching': True, |
|
|
|
}, { |
|
|
|
'url': 'https://www3.nhk.or.jp/nhkworld/en/ondemand/audio/plugin-20190404-1/', |
|
|
|
'only_matching': True, |
|
|
|
}, { |
|
|
|
'url': 'https://www3.nhk.or.jp/nhkworld/fr/ondemand/audio/plugin-20190404-1/', |
|
|
|
'only_matching': True, |
|
|
|
}] |
|
|
|
_API_URL = 'http://api.nhk.or.jp/nhkworld/vodesdlist/v1/all/all/all.json?apikey=EJfK8jdS57GqlupFgAfAAwr573q01y6k' |
|
|
|
_API_URL_TEMPLATE = 'https://api.nhk.or.jp/nhkworld/%sodesdlist/v7/episode/%s/%s/all%s.json' |
|
|
|
|
|
|
|
def _real_extract(self, url): |
|
|
|
video_id = self._match_id(url) |
|
|
|
lang, m_type, episode_id = re.match(self._VALID_URL, url).groups() |
|
|
|
if episode_id.isdigit(): |
|
|
|
episode_id = episode_id[:4] + '-' + episode_id[4:] |
|
|
|
|
|
|
|
data = self._download_json(self._API_URL, video_id) |
|
|
|
is_video = m_type == 'video' |
|
|
|
episode = self._download_json( |
|
|
|
self._API_URL_TEMPLATE % ('v' if is_video else 'r', episode_id, lang, '/all' if is_video else ''), |
|
|
|
episode_id, query={'apikey': 'EJfK8jdS57GqlupFgAfAAwr573q01y6k'})['data']['episodes'][0] |
|
|
|
title = episode.get('sub_title_clean') or episode['sub_title'] |
|
|
|
|
|
|
|
try: |
|
|
|
episode = next( |
|
|
|
e for e in data['data']['episodes'] |
|
|
|
if e.get('url') and video_id in e['url']) |
|
|
|
except StopIteration: |
|
|
|
raise ExtractorError('Unable to find episode') |
|
|
|
def get_clean_field(key): |
|
|
|
return episode.get(key + '_clean') or episode.get(key) |
|
|
|
|
|
|
|
embed_code = episode['vod_id'] |
|
|
|
series = get_clean_field('title') |
|
|
|
|
|
|
|
title = episode.get('sub_title_clean') or episode['sub_title'] |
|
|
|
description = episode.get('description_clean') or episode.get('description') |
|
|
|
series = episode.get('title_clean') or episode.get('title') |
|
|
|
thumbnails = [] |
|
|
|
for s, w, h in [('', 640, 360), ('_l', 1280, 720)]: |
|
|
|
img_path = episode.get('image' + s) |
|
|
|
if not img_path: |
|
|
|
continue |
|
|
|
thumbnails.append({ |
|
|
|
'id': '%dp' % h, |
|
|
|
'height': h, |
|
|
|
'width': w, |
|
|
|
'url': 'https://www3.nhk.or.jp' + img_path, |
|
|
|
}) |
|
|
|
|
|
|
|
return { |
|
|
|
'_type': 'url_transparent', |
|
|
|
'ie_key': 'Ooyala', |
|
|
|
'url': 'ooyala:%s' % embed_code, |
|
|
|
info = { |
|
|
|
'id': episode_id + '-' + lang, |
|
|
|
'title': '%s - %s' % (series, title) if series and title else title, |
|
|
|
'description': description, |
|
|
|
'description': get_clean_field('description'), |
|
|
|
'thumbnails': thumbnails, |
|
|
|
'series': series, |
|
|
|
'episode': title, |
|
|
|
} |
|
|
|
if is_video: |
|
|
|
info.update({ |
|
|
|
'_type': 'url_transparent', |
|
|
|
'ie_key': 'Ooyala', |
|
|
|
'url': 'ooyala:' + episode['vod_id'], |
|
|
|
}) |
|
|
|
else: |
|
|
|
audio = episode['audio'] |
|
|
|
audio_path = audio['audio'] |
|
|
|
info['formats'] = self._extract_m3u8_formats( |
|
|
|
'https://nhks-vh.akamaihd.net/i%s/master.m3u8' % audio_path, |
|
|
|
episode_id, 'm4a', m3u8_id='hls', fatal=False) |
|
|
|
info['formats'].append({ |
|
|
|
'ext': 'flv', |
|
|
|
'format_id': 'flv', |
|
|
|
'url': 'rtmp://flv.nhk.or.jp/ondemand/mp4:flv' + audio_path, |
|
|
|
'vcodec': 'none', |
|
|
|
}) |
|
|
|
for f in info['formats']: |
|
|
|
f['language'] = lang |
|
|
|
return info |